Iter #50: [tensor([-0.4017, -0.0879, -0.0052, -0.0112, -0.0216, -0.0933, -0.0201, -0.0149,
        -0.0845, -0.0169, -0.0154, -0.0086, -0.0144, -0.0782, -0.0131, -0.0315,
        -0.0243, -0.0095, -0.0292, -0.0052, -0.0055, -0.0079,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3216, -0.1533, -0.0218, -0.0377, -0.0241, -0.0254, -0.0493, -0.0245,
        -0.0227, -0.0226, -0.0515, -0.0606, -0.1290, -0.0240, -0.0150, -0.0169,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3694, -0.1363, -0.0146, -0.0337, -0.0256, -0.0228, -0.0371, -0.0163,
        -0.0160, -0.0116, -0.0364, -0.0267, -0.0349, -0.0415, -0.1329, -0.0163,
        -0.0113, -0.0165,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3184, -0.1778, -0.0191, -0.0392, -0.0282, -0.0225, -0.0476, -0.0229,
        -0.0185, -0.0196, -0.0290, -0.0752, -0.0278, -0.0494, -0.0287, -0.0490,
        -0.0110, -0.0159,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3779, -0.0947, -0.0160, -0.0191, -0.0142, -0.0222, -0.0184, -0.0153,
        -0.0398, -0.0158, -0.0150, -0.0120, -0.1021, -0.0056, -0.0183, -0.0110,
        -0.0144, -0.0920, -0.0073, -0.0090, -0.0370, -0.0089, -0.0090, -0.0154,
        -0.0032, -0.0062], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3158, -0.0893, -0.0162, -0.0180, -0.0143, -0.0214, -0.0169, -0.0136,
        -0.0395, -0.0210, -0.0115, -0.0144, -0.0926, -0.0089, -0.0217, -0.0111,
        -0.0194, -0.0815, -0.0184, -0.0007, -0.0137, -0.0296, -0.0106, -0.0829,
        -0.0118, -0.0048], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3483, -0.1079, -0.0095, -0.0166, -0.0140, -0.0237, -0.0146, -0.0135,
        -0.0420, -0.0169, -0.0147, -0.0123, -0.1078, -0.0055, -0.0193, -0.0079,
        -0.0172, -0.0909, -0.0101, -0.0134, -0.0389,  0.0017, -0.0120, -0.0355,
         0.0020, -0.0038], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.4032, -0.0436, -0.0200, -0.0432, -0.0255, -0.0552, -0.1434, -0.0155,
        -0.0539, -0.0137, -0.0176, -0.0408, -0.0291, -0.0351, -0.0368, -0.0064,
        -0.0168,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.4186, -0.0426, -0.0189, -0.0414, -0.0244, -0.0558, -0.1481, -0.0135,
        -0.0454, -0.0077, -0.0218, -0.0374, -0.0185, -0.0360, -0.0227, -0.0149,
        -0.0135, -0.0188,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4861, 0.0341, 0.0133, 0.0267, 0.0143, 0.0458, 0.1089, 0.0103, 0.0466,
        0.0101, 0.0133, 0.0459, 0.0245, 0.0185, 0.0355, 0.0141, 0.0255, 0.0058,
        0.0206, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.4486,  0.0269,  0.0203,  0.0427,  0.0229,  0.0401,  0.0834,  0.0403,
         0.0096,  0.0235,  0.0270,  0.0078,  0.0038,  0.0683,  0.0275,  0.0319,
        -0.0455,  0.0090,  0.0210,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.6303, 0.0261, 0.0125, 0.0288, 0.0098, 0.0101, 0.0141, 0.0240, 0.0245,
        0.0105, 0.0123, 0.0320, 0.0131, 0.0253, 0.0142, 0.0164, 0.0360, 0.0304,
        0.0154, 0.0022, 0.0119, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #100: [tensor([-0.2481, -0.1652, -0.0010, -0.0171, -0.0107, -0.0050, -0.0061, -0.0118,
        -0.0413, -0.0147, -0.0127, -0.1453, -0.0154, -0.0088, -0.0093, -0.1471,
        -0.0086, -0.0360, -0.0138, -0.0367, -0.0373, -0.0008, -0.0073,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3761, 0.2348, 0.0118, 0.0588, 0.0585, 0.0130, 0.0154, 0.0137, 0.0267,
        0.0083, 0.0090, 0.0636, 0.0170, 0.0086, 0.0143, 0.0207, 0.0215, 0.0133,
        0.0148, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3560, 0.1725, 0.0062, 0.0465, 0.0296, 0.0100, 0.0092, 0.0098, 0.0165,
        0.0050, 0.0078, 0.0427, 0.0128, 0.0067, 0.0104, 0.1400, 0.0108, 0.0382,
        0.0019, 0.0206, 0.0096, 0.0223, 0.0077, 0.0072, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3398, 0.2566, 0.0117, 0.0706, 0.0548, 0.0153, 0.0128, 0.0152, 0.0321,
        0.0117, 0.0120, 0.0618, 0.0140, 0.0081, 0.0140, 0.0209, 0.0297, 0.0056,
        0.0133, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3818, 0.2718, 0.0269, 0.0196, 0.0090, 0.0472, 0.0261, 0.0077, 0.0059,
        0.0081, 0.0124, 0.0086, 0.0050, 0.0155, 0.0722, 0.0251, 0.0120, 0.0212,
        0.0118, 0.0122, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([4.5900e-01, 2.4263e-01, 1.7815e-02, 1.7914e-02, 5.7610e-03, 3.9139e-02,
        2.6623e-02, 6.4862e-03, 5.7709e-03, 2.4841e-03, 1.0634e-02, 6.3955e-02,
        2.3809e-02, 1.4460e-02, 1.1644e-02, 1.3422e-02, 3.5337e-03, 1.0267e-02,
        1.2177e-02, 2.9093e-04, 6.9073e-03, 5.2781e-03, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2994, 0.2639, 0.0296, 0.0156, 0.0164, 0.0569, 0.0260, 0.0104, 0.0064,
        0.0071, 0.0127, 0.0757, 0.0118, 0.0674, 0.0089, 0.0211, 0.0149, 0.0126,
        0.0173, 0.0091, 0.0167, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5252, 0.0162, 0.0057, 0.0276, 0.0103, 0.0206, 0.0144, 0.0123, 0.0094,
        0.0067, 0.0031, 0.0084, 0.0353, 0.0102, 0.0081, 0.0157, 0.0092, 0.0094,
        0.0077, 0.0059, 0.0049, 0.0379, 0.0072, 0.0047, 0.0065, 0.0146, 0.0048,
        0.0059, 0.0116, 0.0040, 0.0102, 0.0167, 0.0137, 0.0257, 0.0456, 0.0086,
        0.0049, 0.0108], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5267, 0.0261, 0.0078, 0.0416, 0.0126, 0.0306, 0.0280, 0.0222, 0.0105,
        0.0169, 0.0051, 0.0147, 0.0706, 0.0181, 0.0156, 0.0267, 0.0108, 0.0121,
        0.0100, 0.0285, 0.0133, 0.0239, 0.0078, 0.0196, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 5.3927e-01,  2.3033e-02,  3.3677e-03,  6.0633e-02,  1.6858e-02,
         1.8632e-02,  3.5025e-02,  2.9776e-02,  1.5783e-02,  1.2337e-02,
         5.7065e-03,  1.0330e-02,  3.9477e-02,  2.2923e-02,  1.6808e-02,
         1.1864e-02,  3.5367e-02,  1.0124e-02,  1.0492e-02,  4.1156e-03,
         1.6844e-02, -3.2587e-04,  2.0439e-02,  1.2693e-02,  1.3347e-02,
         7.8695e-03,  6.5655e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.2713, -0.2334, -0.0151, -0.0157, -0.0120, -0.1645, -0.0197, -0.0196,
        -0.0073, -0.0067, -0.0091, -0.1341, -0.0161, -0.0137, -0.0139, -0.0197,
        -0.0081, -0.0084, -0.0116,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2900, 0.1954, 0.0157, 0.0181, 0.0130, 0.1502, 0.0164, 0.0252, 0.0084,
        0.0066, 0.0134, 0.1672, 0.0158, 0.0164, 0.0219, 0.0047, 0.0072, 0.0144,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #150: [tensor([0.2455, 0.1669, 0.0067, 0.0146, 0.0064, 0.0031, 0.0365, 0.0059, 0.0142,
        0.2004, 0.0054, 0.0049, 0.0057, 0.0069, 0.0021, 0.0038, 0.1079, 0.0081,
        0.0155, 0.0141, 0.0062, 0.0019, 0.0163, 0.0077, 0.0090, 0.0706, 0.0055,
        0.0018, 0.0067, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2958, 0.3122, 0.0059, 0.0182, 0.0100, 0.0126, 0.0112, 0.0038, 0.0142,
        0.0123, 0.0016, 0.0045, 0.0061, 0.0076, 0.0109, 0.0034, 0.0070, 0.2453,
        0.0034, 0.0031, 0.0024, 0.0086, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3348, 0.3970, 0.0081, 0.0148, 0.0106, 0.0136, 0.0133, 0.0048, 0.0118,
        0.0097, 0.0031, 0.0028, 0.0052, 0.0095, 0.0144, 0.0210, 0.0109, 0.0129,
        0.0837, 0.0082, 0.0042, 0.0056, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2919, 0.3338, 0.0031, 0.0149, 0.0096, 0.0146, 0.0078, 0.0080, 0.0108,
        0.0084, 0.0022, 0.0018, 0.0039, 0.0110, 0.0146, 0.0155, 0.0063, 0.0063,
        0.2209, 0.0016, 0.0029, 0.0017, 0.0084, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2749, 0.1281, 0.0120, 0.0101, 0.2362, 0.0063, 0.0123, 0.0046, 0.0083,
        0.1400, 0.0004, 0.0126, 0.0101, 0.0030, 0.0052, 0.0179, 0.0399, 0.0075,
        0.0040, 0.0104, 0.0027, 0.0061, 0.0248, 0.0047, 0.0073, 0.0033, 0.0073,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 2.1858e-01,  1.5402e-01,  9.6656e-03,  6.1244e-03,  1.3666e-01,
         4.1572e-03,  7.4905e-03,  3.4697e-03,  5.5194e-03,  1.1741e-01,
         1.3400e-03,  9.8058e-03,  3.9514e-03,  3.1352e-03,  4.2080e-03,
         3.3138e-02,  6.1050e-03,  2.9888e-02,  2.5167e-02,  4.5130e-03,
         8.5392e-03,  5.3914e-03,  2.2834e-03,  7.0843e-03,  9.8508e-03,
         5.4079e-04,  9.7512e-03,  2.5659e-02,  8.8483e-03, -6.9100e-05,
         1.1721e-01,  8.8785e-03,  2.9935e-03,  2.9155e-03,  1.9009e-03,
         3.7518e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2173, 0.1517, 0.0094, 0.0033, 0.1128, 0.0051, 0.0059, 0.0020, 0.0048,
        0.0840, 0.0011, 0.0086, 0.0064, 0.0031, 0.0039, 0.0261, 0.0059, 0.0229,
        0.0072, 0.1306, 0.0037, 0.0058, 0.0041, 0.1258, 0.0097, 0.0034, 0.0164,
        0.0033, 0.0032, 0.0026, 0.0035, 0.0025, 0.0039, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2008, 0.2471, 0.0168, 0.0055, 0.0108, 0.0063, 0.0703, 0.0161, 0.0096,
        0.2702, 0.0088, 0.0097, 0.0040, 0.0068, 0.0156, 0.0726, 0.0167, 0.0056,
        0.0066, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2027, 0.1918, 0.0109, 0.0056, 0.0099, 0.0070, 0.0673, 0.0147, 0.0122,
        0.2137, 0.0061, 0.0094, 0.0049, 0.0062, 0.2035, 0.0041, 0.0170, 0.0049,
        0.0081, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2679, 0.1873, 0.0124, 0.0052, 0.0102, 0.0074, 0.0527, 0.0149, 0.0083,
        0.1074, 0.0068, 0.0087, 0.0033, 0.0064, 0.2647, 0.0079, 0.0045, 0.0139,
        0.0039, 0.0062, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([2.3981e-01, 1.0009e-02, 1.0497e-04, 7.5117e-03, 1.1672e-02, 3.6960e-02,
        8.3847e-03, 4.9551e-03, 1.0267e-02, 6.0114e-03, 1.0568e-02, 7.8290e-03,
        1.0968e-02, 7.5981e-03, 2.0456e-01, 5.8007e-03, 3.7781e-03, 5.5124e-03,
        8.6791e-03, 5.7723e-02, 8.6657e-03, 7.4316e-02, 7.8008e-03, 7.6360e-03,
        2.3447e-01, 2.4632e-03, 5.9484e-03, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.3237,  0.0095, -0.0006,  0.0090,  0.0130,  0.0393,  0.0085,  0.0065,
         0.0094,  0.0076,  0.0205,  0.0120,  0.0081,  0.0066,  0.2194,  0.0050,
         0.0033,  0.0040,  0.0074,  0.0664,  0.0058,  0.0660,  0.1346,  0.0091,
         0.0047,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #200: [tensor([0.3211, 0.0573, 0.0044, 0.0086, 0.0101, 0.0021, 0.0027, 0.0074, 0.0068,
        0.0079, 0.0007, 0.1122, 0.0074, 0.0021, 0.0044, 0.1334, 0.0085, 0.0102,
        0.0080, 0.0039, 0.0099, 0.0071, 0.0013, 0.0120, 0.0054, 0.0043, 0.0107,
        0.0454, 0.0112, 0.0097, 0.1418, 0.0132, 0.0033, 0.0055, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2947, 0.1614, 0.0052, 0.0138, 0.0170, 0.0040, 0.0052, 0.0080, 0.0081,
        0.0125, 0.0035, 0.1157, 0.0075, 0.0030, 0.0058, 0.0589, 0.0093, 0.0155,
        0.0006, 0.0030, 0.0051, 0.0064, 0.0589, 0.0229, 0.0153, 0.0420, 0.0675,
        0.0075, 0.0134, 0.0025, 0.0055, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.6083, 0.0123, 0.0204, 0.0010, 0.0073, 0.0533, 0.0043, 0.0075, 0.0128,
        0.0112, 0.0033, 0.0038, 0.0112, 0.0670, 0.0134, 0.0030, 0.0086, 0.0094,
        0.0086, 0.0036, 0.0090, 0.0094, 0.0129, 0.0694, 0.0220, 0.0070, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.5836,  0.0056,  0.0167,  0.0012,  0.0128,  0.0737,  0.0037,  0.0092,
         0.0082,  0.0053,  0.0038,  0.0020,  0.0141,  0.0692,  0.0103,  0.0022,
         0.0081,  0.0117,  0.0160,  0.0023,  0.0107, -0.0010,  0.0121,  0.0891,
         0.0231,  0.0046,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3999, 0.0104, 0.0213, 0.0024, 0.0098, 0.0751, 0.0051, 0.0096, 0.0099,
        0.0121, 0.0019, 0.0051, 0.0149, 0.0731, 0.0217, 0.0026, 0.0120, 0.0137,
        0.0141, 0.0123, 0.0083, 0.2260, 0.0168, 0.0104, 0.0115, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2552, 0.0682, 0.0054, 0.0075, 0.0866, 0.0023, 0.0060, 0.0033, 0.0039,
        0.0060, 0.0053, 0.0380, 0.0047, 0.0085, 0.0059, 0.0031, 0.0035, 0.0045,
        0.0764, 0.0006, 0.0028, 0.0022, 0.0043, 0.1242, 0.0049, 0.0023, 0.0042,
        0.0964, 0.0042, 0.0059, 0.0064, 0.1344, 0.0016, 0.0028, 0.0025, 0.0058,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 2.3086e-01,  7.6185e-02,  6.8576e-03,  5.5792e-03,  1.2554e-01,
        -1.4365e-03,  7.5852e-03,  1.0188e-03,  8.4148e-03,  5.9805e-03,
         3.3834e-03,  3.8915e-02,  5.8495e-03,  1.0241e-02,  6.6324e-03,
         5.0413e-03,  6.6660e-03,  5.0604e-03,  6.4607e-02,  2.5675e-03,
         2.2803e-03,  2.9507e-03,  6.0358e-03,  1.1959e-01,  8.5739e-03,
        -1.9850e-04,  3.5804e-03,  8.3967e-02,  8.5730e-03,  5.2440e-03,
         1.1963e-01,  5.5642e-03,  6.2683e-03,  4.1444e-03,  1.9100e-03,
         3.0803e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3026, 0.0754, 0.0054, 0.0056, 0.0816, 0.0006, 0.0044, 0.0028, 0.0051,
        0.0037, 0.0044, 0.0236, 0.0051, 0.0112, 0.0052, 0.0053, 0.0056, 0.0054,
        0.0733, 0.0021, 0.0039, 0.0013, 0.0027, 0.0983, 0.0061, 0.0028, 0.0030,
        0.1010, 0.0045, 0.0042, 0.0054, 0.1107, 0.0017, 0.0025, 0.0034, 0.0032,
        0.0025, 0.0095, 0.0024, 0.0023], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2411, 0.0048, 0.0390, 0.1736, 0.0054, 0.0087, 0.0072, 0.0090, 0.0882,
        0.0125, 0.0023, 0.0048, 0.0073, 0.1077, 0.0051, 0.0125, 0.0098, 0.0114,
        0.0946, 0.0104, 0.0060, 0.0074, 0.1162, 0.0074, 0.0026, 0.0048, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2306, 0.0059, 0.0333, 0.1227, 0.0063, 0.0087, 0.0086, 0.0078, 0.1343,
        0.0147, 0.0045, 0.0031, 0.0059, 0.1208, 0.0041, 0.0069, 0.0087, 0.0077,
        0.0907, 0.0094, 0.0062, 0.0058, 0.1401, 0.0057, 0.0022, 0.0053, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1983, 0.0043, 0.0424, 0.1546, 0.0047, 0.0100, 0.0082, 0.0067, 0.1640,
        0.0110, 0.0026, 0.0024, 0.0079, 0.1397, 0.0059, 0.0085, 0.0674, 0.0097,
        0.0079, 0.0076, 0.1215, 0.0044, 0.0034, 0.0069, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 5.3850e-01,  3.9162e-03,  2.9914e-02,  8.7891e-03,  1.4923e-02,
         7.2080e-03,  1.4948e-02,  1.5670e-02,  1.0458e-02,  2.0167e-01,
         8.8839e-03,  1.5092e-02,  3.2305e-02,  3.5039e-03,  1.0648e-02,
         7.1001e-03,  2.3627e-02,  1.3151e-02,  7.5455e-03,  4.6433e-03,
         1.2935e-02, -2.1530e-04,  4.5919e-03,  9.7589e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #250: [tensor([ 0.3108,  0.0067,  0.0233,  0.0075,  0.0034,  0.0031,  0.1044,  0.0050,
         0.0074,  0.0131,  0.0024,  0.0037,  0.0427,  0.0033,  0.0032,  0.0108,
         0.0406,  0.0082,  0.0196,  0.0578,  0.0020, -0.0004,  0.0059,  0.0518,
         0.0417,  0.0097,  0.0177,  0.0070,  0.0166,  0.0105,  0.0048,  0.0034,
         0.0411,  0.0051,  0.0118,  0.0204,  0.0035,  0.0056,  0.0073,  0.0406,
         0.0050,  0.0034,  0.0074], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3299, 0.0097, 0.0223, 0.0177, 0.0063, 0.0047, 0.2320, 0.0045, 0.0065,
        0.0124, 0.0053, 0.0035, 0.0537, 0.0055, 0.0066, 0.0095, 0.0480, 0.0096,
        0.0256, 0.0594, 0.0026, 0.0011, 0.0064, 0.0572, 0.0316, 0.0088, 0.0063,
        0.0050, 0.0031, 0.0053, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 3.0081e-01,  7.3110e-03,  2.6650e-02,  1.3022e-02,  6.4709e-03,
         3.5373e-03,  1.7776e-01,  4.1206e-03,  6.9927e-03,  1.0542e-02,
         6.7922e-03,  2.5334e-03,  4.7648e-02,  4.1482e-03,  7.3629e-03,
         1.1219e-02,  2.9463e-02,  7.4269e-03,  2.0246e-02,  4.5322e-02,
         7.6809e-05, -4.7657e-04,  4.3146e-03,  5.7822e-02,  1.4897e-03,
         1.0617e-02,  1.1950e-02,  2.0103e-02,  1.2917e-01,  8.8394e-03,
         9.0349e-03,  2.0737e-03,  4.6536e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2983, 0.0074, 0.0296, 0.0201, 0.0082, 0.0034, 0.1544, 0.0042, 0.0089,
        0.0141, 0.0048, 0.0031, 0.0453, 0.0041, 0.0066, 0.0083, 0.0357, 0.0089,
        0.0262, 0.0495, 0.0023, 0.0016, 0.0059, 0.0815, 0.0348, 0.0212, 0.0429,
        0.0552, 0.0065, 0.0004, 0.0065, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4042, 0.0082, 0.0292, 0.0168, 0.0060, 0.0065, 0.2500, 0.0066, 0.0074,
        0.0144, 0.0086, 0.0031, 0.0538, 0.0087, 0.0040, 0.0119, 0.0426, 0.0094,
        0.0247, 0.0471, 0.0028, 0.0015, 0.0051, 0.0014, 0.0078, 0.0077, 0.0023,
        0.0007, 0.0078, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3800, 0.0085, 0.0349, 0.0069, 0.0069, 0.0071, 0.1832, 0.0029, 0.0093,
        0.0132, 0.0043, 0.0023, 0.0517, 0.0032, 0.0060, 0.0137, 0.0402, 0.0101,
        0.0258, 0.0651, 0.0025, 0.0011, 0.0043, 0.0099, 0.0340, 0.0131, 0.0185,
        0.0137, 0.0136, 0.0035, 0.0033, 0.0072, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2209, 0.0096, 0.0565, 0.0155, 0.0060, 0.0055, 0.2063, 0.0047, 0.0088,
        0.0113, 0.0063, 0.0048, 0.0482, 0.0060, 0.0074, 0.0152, 0.0551, 0.0099,
        0.0167, 0.0602, 0.0007, 0.0020, 0.0054, 0.0752, 0.0433, 0.0177, 0.0023,
        0.0157, 0.0492, 0.0035, 0.0052, 0.0048, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5168, 0.0051, 0.0261, 0.0073, 0.0065, 0.0038, 0.0920, 0.0034, 0.0051,
        0.0094, 0.0037, 0.0028, 0.0425, 0.0024, 0.0039, 0.0090, 0.0295, 0.0067,
        0.0206, 0.0348, 0.0006, 0.0006, 0.0059, 0.0433, 0.0310, 0.0161, 0.0087,
        0.0049, 0.0019, 0.0010, 0.0047, 0.0043, 0.0120, 0.0005, 0.0055, 0.0068,
        0.0071, 0.0055, 0.0041, 0.0040, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.4418,  0.0095,  0.0296,  0.0223,  0.0049,  0.0042,  0.0955,  0.0046,
         0.0073,  0.0108,  0.0041,  0.0037,  0.0456,  0.0048,  0.0048,  0.0123,
         0.0522,  0.0073,  0.0204,  0.0426,  0.0024, -0.0011,  0.0054,  0.0122,
         0.0368,  0.0151,  0.0081,  0.0025,  0.0245,  0.0568,  0.0013,  0.0014,
         0.0041,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 3.1411e-01,  8.8358e-03,  4.0974e-02,  1.6229e-02,  8.0145e-03,
         4.8027e-03,  1.3555e-01,  4.9632e-03,  6.8262e-03,  1.3229e-02,
         7.1581e-03,  4.5647e-03,  5.8273e-02,  5.2797e-03,  4.5001e-03,
         1.5164e-02,  5.8097e-02,  1.0448e-02,  2.0692e-02,  6.0135e-02,
         1.1338e-03,  9.4315e-07,  6.9853e-03,  7.8095e-02,  6.4920e-02,
         1.5484e-02,  4.8212e-03,  6.4912e-03,  1.5624e-02, -7.5162e-04,
         2.2737e-03,  5.5679e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 2.4063e-01,  8.2442e-03,  3.6511e-02,  1.1330e-02,  4.2984e-03,
         4.7993e-03,  1.6019e-01,  3.1177e-03,  7.5102e-03,  1.2536e-02,
         5.1759e-03,  2.0905e-03,  4.9812e-02,  6.6929e-03,  6.2422e-03,
         1.0232e-02,  3.1036e-02,  8.5887e-03,  1.5690e-02,  5.0865e-02,
         1.0710e-03, -1.5793e-04,  6.1384e-03,  5.5706e-02,  4.4837e-02,
         8.2106e-03,  6.1172e-03,  8.2262e-03,  2.3258e-02,  1.0312e-02,
         1.4673e-01,  5.3766e-03,  3.4256e-03,  4.8524e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3857, 0.0135, 0.0485, 0.0075, 0.0250, 0.0087, 0.0109, 0.2135, 0.0113,
        0.0032, 0.0058, 0.0114, 0.0183, 0.0121, 0.0118, 0.0123, 0.1689, 0.0121,
        0.0063, 0.0134, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #300: [tensor([0.3122, 0.1917, 0.0004, 0.0134, 0.0036, 0.0089, 0.0101, 0.0085, 0.0074,
        0.0079, 0.1446, 0.0088, 0.0130, 0.0109, 0.0105, 0.0163, 0.2082, 0.0074,
        0.0059, 0.0106, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2576, 0.0864, 0.0034, 0.0089, 0.0054, 0.0091, 0.0087, 0.0074, 0.0067,
        0.0128, 0.0077, 0.0056, 0.1470, 0.0067, 0.0025, 0.0061, 0.1139, 0.0026,
        0.0097, 0.2570, 0.0058, 0.0104, 0.0080, 0.0032, 0.0020, 0.0054, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.3110,  0.0793,  0.0027,  0.0097,  0.0086,  0.0105,  0.0113,  0.0142,
         0.0116,  0.0205,  0.0074,  0.0059,  0.2117, -0.0004,  0.0021,  0.0095,
         0.1549,  0.0044,  0.0109,  0.0882,  0.0035,  0.0062,  0.0042,  0.0114,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([4.4330e-01, 1.3950e-01, 1.7983e-03, 8.7266e-03, 5.8035e-03, 8.1954e-03,
        8.2172e-03, 6.9398e-03, 8.9555e-03, 8.7404e-03, 7.0389e-03, 4.7033e-03,
        8.8780e-02, 3.8250e-03, 1.5901e-03, 6.8656e-03, 8.9024e-02, 3.5729e-03,
        7.1293e-03, 5.6567e-03, 9.2059e-03, 8.8327e-03, 1.0935e-01, 5.8398e-03,
        3.9522e-04, 8.0104e-03, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([3.3941e-01, 1.4067e-01, 1.6159e-02, 5.5982e-03, 2.8583e-03, 6.2777e-03,
        6.6876e-02, 2.8258e-04, 1.4215e-02, 6.9618e-03, 1.5787e-01, 7.0920e-03,
        2.1617e-02, 1.4817e-02, 1.2831e-02, 1.0466e-02, 4.9582e-03, 9.1222e-03,
        8.0551e-02, 3.6130e-03, 5.6429e-02, 9.5568e-03, 2.7869e-03, 8.9802e-03,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 4.0916e-01,  1.6382e-01,  7.2242e-03,  6.0840e-03,  1.6552e-03,
         3.7737e-03,  6.4275e-02,  2.0458e-03,  1.2056e-02,  5.7410e-03,
         1.8953e-01,  2.9291e-03,  1.0673e-02,  9.4526e-03,  1.4552e-02,
         8.2801e-03,  5.6480e-03,  9.0227e-03,  5.0259e-02,  9.7105e-04,
         1.1515e-02, -4.0367e-04,  1.6340e-03,  9.2953e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3167, 0.1347, 0.0085, 0.0055, 0.0009, 0.0048, 0.0803, 0.0021, 0.0189,
        0.0067, 0.1824, 0.0045, 0.0149, 0.0127, 0.0087, 0.0060, 0.0050, 0.0080,
        0.0705, 0.0075, 0.0104, 0.0059, 0.0167, 0.0116, 0.0109, 0.0336, 0.0034,
        0.0083], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3321, 0.1108, 0.0106, 0.0077, 0.0008, 0.0065, 0.0171, 0.0134, 0.0068,
        0.0038, 0.0066, 0.0044, 0.0074, 0.2480, 0.0045, 0.0048, 0.0088, 0.0484,
        0.0136, 0.0140, 0.0297, 0.0668, 0.0039, 0.0163, 0.0029, 0.0101, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4015, 0.1097, 0.0130, 0.0111, 0.0026, 0.0114, 0.0153, 0.0112, 0.0052,
        0.0018, 0.0102, 0.0039, 0.0071, 0.1786, 0.0016, 0.0007, 0.0088, 0.0759,
        0.0091, 0.0189, 0.0074, 0.0103, 0.0659, 0.0089, 0.0022, 0.0077, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([4.2356e-01, 9.9265e-02, 7.7809e-03, 1.0112e-02, 1.9426e-03, 9.4362e-03,
        1.6821e-02, 1.4812e-02, 3.3678e-03, 3.2589e-03, 9.5196e-03, 2.8880e-03,
        4.1650e-03, 2.1607e-01, 1.9894e-03, 4.0945e-04, 9.3175e-03, 7.9034e-02,
        1.1532e-02, 1.2728e-02, 1.0923e-02, 1.8340e-02, 8.8589e-03, 1.5456e-02,
        3.3537e-03, 5.0559e-03, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([4.2090e-01, 1.3149e-02, 5.2230e-02, 1.1404e-02, 7.1836e-03, 4.2733e-03,
        2.0620e-02, 6.1815e-03, 1.6373e-01, 6.4427e-03, 1.6565e-04, 5.5825e-03,
        8.1946e-02, 1.7350e-02, 1.2484e-02, 1.0720e-02, 2.7449e-02, 7.8367e-02,
        5.5352e-03, 1.0600e-02, 1.1479e-02, 1.2271e-02, 6.5808e-03, 3.2208e-03,
        2.5718e-03, 7.5731e-03, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([3.5700e-01, 9.4351e-03, 6.9259e-02, 8.6187e-03, 7.3947e-03, 3.6752e-03,
        1.9580e-02, 7.2351e-03, 1.3072e-01, 3.6892e-03, 1.6370e-04, 7.2447e-03,
        5.9555e-02, 1.0166e-02, 1.3942e-02, 8.1603e-03, 1.3237e-02, 1.5356e-01,
        5.0808e-03, 5.3100e-02, 9.3472e-03, 8.0374e-03, 1.3410e-02, 1.9005e-02,
        2.0310e-03, 7.3501e-03, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #350: [tensor([0.2488, 0.0865, 0.0016, 0.0454, 0.1895, 0.0072, 0.0071, 0.0149, 0.0075,
        0.0046, 0.0100, 0.0124, 0.0459, 0.0088, 0.0036, 0.0066, 0.0070, 0.0082,
        0.0039, 0.0648, 0.0139, 0.0021, 0.0051, 0.0444, 0.0064, 0.0743, 0.0205,
        0.0104, 0.0012, 0.0279, 0.0042, 0.0054, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3538, 0.0240, 0.0103, 0.0137, 0.0350, 0.2984, 0.0354, 0.0159, 0.0318,
        0.0190, 0.0075, 0.0184, 0.0542, 0.0162, 0.0089, 0.0190, 0.0151, 0.0236,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4144, 0.0136, 0.0053, 0.0178, 0.0180, 0.2362, 0.0199, 0.0131, 0.0217,
        0.0143, 0.0094, 0.0150, 0.0151, 0.0360, 0.0124, 0.0097, 0.0955, 0.0128,
        0.0092, 0.0106, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2681, 0.0135, 0.0049, 0.0137, 0.0150, 0.2033, 0.0226, 0.0114, 0.0167,
        0.0140, 0.0026, 0.0103, 0.0133, 0.0137, 0.3066, 0.0172, 0.0078, 0.0146,
        0.0110, 0.0076, 0.0120, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2166, 0.2142, 0.0064, 0.0027, 0.0068, 0.0175, 0.2010, 0.0129, 0.0029,
        0.0081, 0.0070, 0.0101, 0.0099, 0.0025, 0.0065, 0.1829, 0.0083, 0.0052,
        0.0068, 0.0090, 0.0057, 0.0292, 0.0098, 0.0094, 0.0015, 0.0071, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.2063,  0.2064,  0.0126,  0.0042,  0.0088,  0.0401,  0.1737,  0.0121,
         0.0044,  0.0081,  0.0100,  0.0126,  0.0112,  0.0028,  0.0067,  0.2082,
         0.0122,  0.0081,  0.0122,  0.0191,  0.0104, -0.0013,  0.0085,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2692, 0.1319, 0.0148, 0.0038, 0.0088, 0.0176, 0.2015, 0.0100, 0.0037,
        0.0074, 0.0062, 0.0114, 0.0112, 0.0017, 0.0083, 0.1682, 0.0118, 0.0050,
        0.0094, 0.0116, 0.0066, 0.0622, 0.0088, 0.0016, 0.0070, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3845, 0.0682, 0.0042, 0.0074, 0.0043, 0.0190, 0.0101, 0.0050, 0.0039,
        0.1045, 0.0033, 0.0022, 0.0020, 0.0066, 0.0019, 0.0152, 0.0044, 0.0096,
        0.0042, 0.0996, 0.0050, 0.0051, 0.0045, 0.0375, 0.0115, 0.0047, 0.0037,
        0.0903, 0.0030, 0.0023, 0.0013, 0.0077, 0.0035, 0.0147, 0.0029, 0.0122,
        0.0036, 0.0073, 0.0045, 0.0057, 0.0013, 0.0030, 0.0011, 0.0037],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2674, 0.0760, 0.0143, 0.0076, 0.0077, 0.0306, 0.0091, 0.0078, 0.0025,
        0.0782, 0.0036, 0.0036, 0.0021, 0.0093, 0.0055, 0.0248, 0.0069, 0.0153,
        0.0048, 0.1292, 0.0023, 0.0368, 0.0099, 0.0073, 0.0036, 0.1682, 0.0041,
        0.0040, 0.0006, 0.0059, 0.0060, 0.0207, 0.0038, 0.0145, 0.0059, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2355, 0.0819, 0.0067, 0.0073, 0.0044, 0.0236, 0.0122, 0.0044, 0.0057,
        0.0867, 0.0040, 0.0036, 0.0019, 0.0086, 0.0050, 0.0190, 0.0056, 0.0123,
        0.0051, 0.1671, 0.0066, 0.0053, 0.0042, 0.0489, 0.0168, 0.0046, 0.0052,
        0.1290, 0.0037, 0.0006, 0.0075, 0.0131, 0.0034, 0.0236, 0.0053, 0.0151,
        0.0065, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2755, 0.1291, 0.0034, 0.0162, 0.0094, 0.0022, 0.0047, 0.0022, 0.0072,
        0.0087, 0.1207, 0.0051, 0.0023, 0.0085, 0.0034, 0.0074, 0.1207, 0.0075,
        0.0049, 0.0115, 0.0118, 0.2238, 0.0020, 0.0077, 0.0042, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.2891,  0.1416,  0.0032,  0.0101,  0.0125, -0.0003,  0.0057,  0.0007,
         0.0075,  0.0077,  0.1062,  0.0070,  0.0047,  0.0074,  0.0014,  0.0075,
         0.1235,  0.0056,  0.0038,  0.0183,  0.0131,  0.2038,  0.0095,  0.0099,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #400: [tensor([0.1284, 0.1384, 0.0025, 0.0086, 0.0123, 0.0074, 0.0093, 0.0050, 0.0086,
        0.0112, 0.0089, 0.0253, 0.1509, 0.0096, 0.0101, 0.1374, 0.0097, 0.0103,
        0.0037, 0.0067, 0.0399, 0.0061, 0.0481, 0.1890, 0.0054, 0.0074, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1547, 0.0094, 0.0119, 0.2641, 0.0038, 0.0094, 0.0057, 0.0029, 0.0101,
        0.0036, 0.0095, 0.1174, 0.0020, 0.0068, 0.0047, 0.0055, 0.0463, 0.0170,
        0.0036, 0.0065, 0.1349, 0.0064, 0.0567, 0.0091, 0.0058, 0.0614, 0.0131,
        0.0072, 0.0035, 0.0069], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.2291,  0.0090,  0.0073,  0.2428,  0.0035,  0.0083,  0.0041,  0.0039,
         0.0097,  0.0027,  0.0114,  0.1479,  0.0020,  0.0069,  0.0074,  0.0069,
         0.0495,  0.0164,  0.0008,  0.0078,  0.1357,  0.0130,  0.0501,  0.0087,
         0.0081, -0.0007,  0.0064,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2723, 0.0099, 0.0126, 0.2172, 0.0012, 0.0079, 0.0051, 0.0058, 0.0117,
        0.0042, 0.0083, 0.1172, 0.0015, 0.0035, 0.0064, 0.0042, 0.0479, 0.0134,
        0.0027, 0.0059, 0.1002, 0.0089, 0.0472, 0.0077, 0.0067, 0.0597, 0.0048,
        0.0059, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.3134,  0.1367,  0.0171,  0.0215,  0.0090,  0.0022,  0.0135,  0.1999,
         0.0086,  0.0074,  0.0072,  0.0761,  0.0203,  0.0828,  0.0123,  0.0099,
         0.0108,  0.0124,  0.0099,  0.0075,  0.0113, -0.0003,  0.0097,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1914, 0.1486, 0.0123, 0.0216, 0.0070, 0.0027, 0.0186, 0.1970, 0.0138,
        0.0060, 0.0098, 0.0180, 0.0752, 0.2130, 0.0166, 0.0189, 0.0142, 0.0071,
        0.0081, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1227, 0.1688, 0.0136, 0.0283, 0.0095, 0.0028, 0.0179, 0.2348, 0.0127,
        0.0078, 0.0065, 0.0727, 0.0158, 0.0625, 0.0121, 0.1898, 0.0073, 0.0047,
        0.0097, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2528, 0.1583, 0.0055, 0.0055, 0.0115, 0.1140, 0.0064, 0.0168, 0.0026,
        0.0047, 0.0091, 0.0080, 0.0077, 0.0050, 0.0288, 0.0662, 0.0113, 0.0036,
        0.0084, 0.0669, 0.0079, 0.0760, 0.0062, 0.0279, 0.0719, 0.0092, 0.0031,
        0.0048, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2577, 0.1025, 0.0086, 0.0063, 0.0129, 0.1542, 0.0076, 0.0163, 0.0039,
        0.0051, 0.0111, 0.0082, 0.0040, 0.0062, 0.0366, 0.0465, 0.0143, 0.0026,
        0.0062, 0.2024, 0.0098, 0.0049, 0.0555, 0.0077, 0.0015, 0.0077, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2412, 0.0639, 0.0051, 0.0059, 0.0066, 0.1224, 0.0043, 0.0177, 0.0048,
        0.0046, 0.0091, 0.0074, 0.0074, 0.0051, 0.0200, 0.0451, 0.0111, 0.0051,
        0.0056, 0.0491, 0.0056, 0.0667, 0.0106, 0.0267, 0.2336, 0.0084, 0.0018,
        0.0049, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2245, 0.1003, 0.0096, 0.0711, 0.0109, 0.0062, 0.0174, 0.2035, 0.0090,
        0.0058, 0.0099, 0.0076, 0.0043, 0.0097, 0.0724, 0.0128, 0.0499, 0.1494,
        0.0029, 0.0116, 0.0030, 0.0081, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2881, 0.1007, 0.0074, 0.1046, 0.0094, 0.0080, 0.0235, 0.2146, 0.0090,
        0.0119, 0.0149, 0.0101, 0.0040, 0.0085, 0.0720, 0.0155, 0.0681, 0.0122,
        0.0080, 0.0093, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #450: [tensor([0.2726, 0.1904, 0.0136, 0.0305, 0.0035, 0.0486, 0.0796, 0.0153, 0.0147,
        0.0108, 0.0588, 0.0044, 0.0039, 0.0085, 0.0707, 0.0086, 0.0577, 0.0158,
        0.0168, 0.0158, 0.0087, 0.0161, 0.0049, 0.0199, 0.0097, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2236, 0.1992, 0.0128, 0.0254, 0.0103, 0.0398, 0.0938, 0.0196, 0.0243,
        0.0154, 0.0710, 0.0073, 0.0074, 0.0119, 0.0975, 0.0139, 0.0791, 0.0232,
        0.0107, 0.0138, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2420, 0.1030, 0.0105, 0.0141, 0.0009, 0.0386, 0.0783, 0.0179, 0.0214,
        0.0113, 0.0641, 0.0078, 0.0060, 0.0086, 0.0823, 0.0079, 0.0642, 0.0164,
        0.0157, 0.0114, 0.0790, 0.0059, 0.0098, 0.0635, 0.0131, 0.0063, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1320, 0.0170, 0.0186, 0.0089, 0.0059, 0.0399, 0.0896, 0.0191, 0.0076,
        0.0108, 0.0997, 0.0128, 0.0362, 0.0247, 0.0300, 0.4167, 0.0177, 0.0127,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1976, 0.0246, 0.0262, 0.0111, 0.0124, 0.0538, 0.1372, 0.0271, 0.0162,
        0.0112, 0.1485, 0.0167, 0.0496, 0.0824, 0.1344, 0.0302, 0.0209, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3104, 0.0414, 0.0356, 0.0220, 0.0099, 0.1108, 0.2116, 0.0364, 0.0119,
        0.0216, 0.0293, 0.0635, 0.0508, 0.0133, 0.0314, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1458, 0.1135, 0.0023, 0.0151, 0.0099, 0.0059, 0.0055, 0.1459, 0.0073,
        0.0072, 0.1541, 0.0051, 0.0122, 0.0071, 0.0132, 0.0069, 0.0121, 0.0082,
        0.0023, 0.0044, 0.0049, 0.2437, 0.0060, 0.0184, 0.0173, 0.0035, 0.0060,
        0.0022, 0.0072, 0.0029, 0.0041, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1100, 0.1164, 0.0051, 0.0120, 0.0146, 0.0059, 0.0044, 0.1385, 0.0053,
        0.0076, 0.1076, 0.0113, 0.0080, 0.0076, 0.0093, 0.0077, 0.0104, 0.0063,
        0.0022, 0.0040, 0.0058, 0.2162, 0.0058, 0.0118, 0.0112, 0.0073, 0.0669,
        0.0069, 0.0104, 0.0072, 0.0098, 0.0368, 0.0034, 0.0064, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1023, 0.1428, 0.0014, 0.0130, 0.0195, 0.0040, 0.0053, 0.1216, 0.0052,
        0.0080, 0.1519, 0.0049, 0.0144, 0.0121, 0.0124, 0.0053, 0.0098, 0.0075,
        0.0041, 0.0042, 0.0069, 0.1863, 0.0062, 0.0034, 0.0075, 0.0017, 0.0611,
        0.0059, 0.0118, 0.0132, 0.0268, 0.0011, 0.0048, 0.0024, 0.0049, 0.0063],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2686, 0.0032, 0.0199, 0.0130, 0.0042, 0.0090, 0.0386, 0.0114, 0.0274,
        0.0080, 0.0096, 0.0150, 0.0264, 0.0133, 0.1151, 0.0071, 0.0075, 0.0106,
        0.0143, 0.0082, 0.0117, 0.0132, 0.3156, 0.0115, 0.0060, 0.0114, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.4354,  0.0163,  0.0362,  0.0378,  0.0188,  0.0230,  0.0427,  0.0260,
         0.0425,  0.0125,  0.0295,  0.0400,  0.0372,  0.0151, -0.0008,  0.0334,
         0.0466,  0.0226,  0.0380,  0.0162,  0.0297,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3917, 0.0067, 0.0214, 0.0145, 0.0043, 0.0133, 0.0293, 0.0129, 0.0230,
        0.0080, 0.0146, 0.0190, 0.0190, 0.0149, 0.0136, 0.0107, 0.0202, 0.0693,
        0.0219, 0.0077, 0.0140, 0.0549, 0.1101, 0.0223, 0.0249, 0.0202, 0.0036,
        0.0138, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #500: [tensor([0.0874, 0.0099, 0.0047, 0.0157, 0.0480, 0.1471, 0.0040, 0.0074, 0.0111,
        0.0037, 0.0070, 0.3508, 0.0048, 0.0645, 0.0094, 0.1990, 0.0061, 0.0105,
        0.0089, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1312, 0.0138, 0.0047, 0.0124, 0.0673, 0.3031, 0.0048, 0.0079, 0.0145,
        0.0055, 0.0087, 0.0122, 0.0102, 0.0158, 0.0467, 0.3042, 0.0036, 0.0082,
        0.0089, 0.0069, 0.0093, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0832,  0.2241, -0.0005,  0.0062,  0.0023,  0.0072,  0.0113,  0.0047,
         0.0131,  0.0014,  0.0189,  0.0072,  0.0658,  0.3492,  0.0049,  0.0092,
         0.0057,  0.0073,  0.0681,  0.0131,  0.0064,  0.0063,  0.0146,  0.0124,
         0.0198,  0.0267,  0.0036,  0.0070,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.0727, 0.1026, 0.0022, 0.0050, 0.0004, 0.0036, 0.0063, 0.0041, 0.0079,
        0.0028, 0.0095, 0.0053, 0.0287, 0.2908, 0.0053, 0.0095, 0.0047, 0.0066,
        0.0466, 0.0117, 0.0063, 0.0048, 0.0268, 0.3047, 0.0085, 0.0119, 0.0039,
        0.0066, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1547, 0.1963, 0.0054, 0.0035, 0.0041, 0.0051, 0.0058, 0.0062, 0.0091,
        0.0033, 0.0149, 0.0055, 0.0356, 0.3006, 0.0047, 0.0064, 0.0042, 0.0063,
        0.0531, 0.0099, 0.0058, 0.0620, 0.0512, 0.0071, 0.0083, 0.0059, 0.0100,
        0.0071, 0.0020, 0.0060, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.0701, 0.1672, 0.0042, 0.0086, 0.0067, 0.0296, 0.0093, 0.0249, 0.1750,
        0.0039, 0.0074, 0.0079, 0.0059, 0.0046, 0.0098, 0.0023, 0.0058, 0.1735,
        0.0046, 0.0540, 0.0321, 0.1740, 0.0048, 0.0078, 0.0063, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.0758, 0.1903, 0.0064, 0.0118, 0.0104, 0.0345, 0.0146, 0.0400, 0.1806,
        0.0063, 0.0087, 0.0089, 0.0093, 0.0067, 0.0095, 0.0020, 0.0086, 0.2174,
        0.0076, 0.0124, 0.1274, 0.0031, 0.0077, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.0837, 0.2083, 0.0072, 0.0135, 0.0062, 0.0412, 0.0107, 0.0469, 0.1865,
        0.0054, 0.0086, 0.0071, 0.0082, 0.0065, 0.0120, 0.0031, 0.0087, 0.2640,
        0.0087, 0.0551, 0.0037, 0.0048, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([3.8770e-04, 2.0888e-01, 2.1215e-03, 1.4280e-02, 9.9382e-03, 1.2728e-02,
        4.3270e-02, 2.1141e-02, 8.6374e-03, 1.0263e-02, 1.2361e-02, 1.7607e-02,
        1.1406e-02, 5.5860e-03, 7.6913e-03, 4.1339e-01, 1.2192e-02, 7.5679e-03,
        1.2100e-02, 2.3621e-02, 1.7102e-02, 8.1134e-03, 1.2665e-02, 3.9340e-02,
        2.8745e-02, 1.0101e-02, 1.3135e-02, 4.5705e-03, 1.1055e-02, 0.0000e+00,
        0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.0718, 0.1036, 0.0040, 0.0080, 0.0054, 0.0084, 0.0246, 0.0120, 0.0084,
        0.0074, 0.0066, 0.0138, 0.0091, 0.0033, 0.0059, 0.1766, 0.0087, 0.0384,
        0.0052, 0.2568, 0.0106, 0.0303, 0.1698, 0.0072, 0.0006, 0.0036, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.0859, 0.2130, 0.0048, 0.0134, 0.0098, 0.0105, 0.0564, 0.0175, 0.0084,
        0.0161, 0.0088, 0.0167, 0.0128, 0.0056, 0.0095, 0.2550, 0.0128, 0.0092,
        0.0332, 0.0277, 0.0086, 0.0157, 0.0118, 0.0274, 0.0249, 0.0179, 0.0156,
        0.0256, 0.0112, 0.0039, 0.0104], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1099, 0.1982, 0.0018, 0.0060, 0.0039, 0.0084, 0.0088, 0.0326, 0.2890,
        0.0098, 0.0085, 0.0106, 0.0143, 0.0149, 0.0043, 0.0090, 0.2055, 0.0111,
        0.0117, 0.0103, 0.0168, 0.0027, 0.0034, 0.0082, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #550: [tensor([-0.0844, -0.3864, -0.0010, -0.0013, -0.0040, -0.1781, -0.0045, -0.0005,
        -0.0045, -0.1024, -0.0026, -0.0337, -0.0056, -0.1814, -0.0038, -0.0014,
        -0.0043,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0867, -0.3194, -0.0010, -0.0029, -0.0040, -0.1375, -0.0043, -0.0016,
        -0.0062, -0.1879, -0.0021, -0.0071, -0.0040, -0.2246, -0.0042, -0.0023,
        -0.0039,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0831, -0.3249, -0.0013, -0.0020, -0.0028, -0.1867, -0.0028, -0.0009,
        -0.0033, -0.1476, -0.0025, -0.0229, -0.0065, -0.0051, -0.1891, -0.0078,
        -0.0054, -0.0019, -0.0035,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0996, -0.3173, -0.0047, -0.0503, -0.0020, -0.0055, -0.0317, -0.0325,
        -0.0025, -0.0012, -0.0037, -0.1878, -0.0035, -0.0316, -0.0161, -0.1749,
        -0.0018, -0.0122, -0.0163,  0.0005, -0.0015, -0.0029,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0930, -0.3963, -0.0039, -0.0566, -0.0016, -0.0088, -0.0149, -0.0367,
        -0.0032, -0.0009, -0.0030, -0.2917, -0.0053, -0.0333, -0.0055, -0.0054,
        -0.0248, -0.0079, -0.0025, -0.0046,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.7272e-02, -4.2514e-01, -3.4694e-03, -6.6011e-02, -1.9663e-03,
        -7.3394e-03, -1.6144e-02, -3.4560e-02, -2.7069e-03, -3.2020e-04,
        -3.6370e-03, -3.0567e-01, -5.0671e-03, -3.3054e-02, -2.7884e-03,
        -8.7033e-03, -1.8572e-02, -6.0352e-03, -3.0978e-03, -3.0528e-03,
        -1.2596e-03, -4.1338e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.0380e-01, -1.9435e-01, -2.0799e-03, -2.7008e-03, -1.8955e-01,
        -1.8536e-03, -3.2851e-03, -3.9103e-03, -4.6722e-03, -7.0499e-03,
        -4.1005e-04, -3.1091e-03, -1.4224e-01, -1.5681e-03, -3.0067e-02,
        -3.0124e-03, -1.3261e-01, -1.0380e-03, -5.6880e-03, -1.5502e-01,
        -4.2453e-03, -3.5600e-03, -1.6395e-04, -4.0199e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.0745, 0.2822, 0.0009, 0.0045, 0.2830, 0.0007, 0.0035, 0.0051, 0.0055,
        0.0083, 0.0013, 0.0029, 0.2383, 0.0028, 0.0453, 0.0009, 0.0099, 0.0210,
        0.0056, 0.0040, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0687, -0.4657, -0.0027, -0.0071, -0.3454, -0.0035, -0.0080, -0.0069,
        -0.0078, -0.0086,  0.0012, -0.0041, -0.0079, -0.0412, -0.0067, -0.0042,
        -0.0053, -0.0008, -0.0043,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1387, -0.1859, -0.0005, -0.0036, -0.1493, -0.0027, -0.0019, -0.1482,
        -0.0010, -0.0011, -0.0007, -0.0030, -0.0020, -0.0009, -0.0021, -0.1150,
        -0.0022, -0.0167, -0.0028, -0.1256, -0.0004, -0.0046, -0.0803, -0.0044,
        -0.0027, -0.0007, -0.0029], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1120, -0.2521, -0.0018, -0.0037, -0.1587, -0.0027, -0.0021, -0.1636,
        -0.0006, -0.0016, -0.0030, -0.0035, -0.0021, -0.0016, -0.0023, -0.1138,
        -0.0023, -0.0137, -0.0032, -0.1390, -0.0048, -0.0056, -0.0030, -0.0012,
        -0.0020,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1085, -0.2709, -0.0019, -0.0057, -0.1888, -0.0020, -0.0027, -0.2055,
        -0.0020, -0.0017, -0.0013, -0.0032, -0.0027, -0.0014, -0.0018, -0.0904,
        -0.0025, -0.0026, -0.0992,  0.0003, -0.0017, -0.0034,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #600: [tensor([-4.8856e-01, -1.2920e-01, -7.3735e-03, -9.8144e-03, -4.9507e-03,
         3.8979e-03, -1.9302e-03,  3.0680e-03,  3.4953e-03,  3.4447e-03,
        -4.0203e-03, -3.2757e-03,  8.5798e-03, -1.6636e-03, -6.2662e-03,
         1.4304e-02, -9.5486e-03, -6.0394e-03, -1.1751e-01, -4.2595e-02,
        -1.2399e-02, -8.3112e-03,  2.3577e-02,  4.2049e-04, -1.6652e-02,
         1.9081e-03, -5.4480e-03, -1.2573e-02, -1.2176e-03, -7.5020e-03,
        -2.0939e-03,  1.1758e-02,  8.8065e-04, -1.9681e-02,  3.4408e-03,
        -1.2821e-03, -1.3107e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1759, -0.2099, -0.0097, -0.0128, -0.0045,  0.0057, -0.0042,  0.0025,
        -0.0038, -0.0098, -0.0069, -0.0051,  0.0007, -0.0072, -0.0085, -0.0281,
        -0.0099, -0.0028, -0.2340, -0.0480, -0.0073, -0.0153, -0.0072,  0.0029,
        -0.0361, -0.0059, -0.0123, -0.0123,  0.0506,  0.0085, -0.0434, -0.0020,
        -0.0012, -0.0051,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.6030e-01, -2.1419e-01, -1.3059e-02, -1.1524e-02, -4.2600e-03,
         5.0091e-03, -6.1197e-03,  1.1576e-02,  8.1421e-04, -3.0955e-04,
        -3.0012e-03, -4.6388e-03,  7.7403e-03, -1.2088e-03, -9.7998e-03,
        -1.5644e-02, -1.0302e-02, -1.4473e-03, -1.7374e-01, -3.9994e-02,
        -1.4582e-02, -8.8079e-03,  2.9817e-02, -2.3863e-03, -1.9176e-02,
         1.0871e-04, -1.4643e-02, -1.7057e-02,  6.9376e-02,  1.0867e-02,
         7.1761e-03,  4.3088e-03, -5.1836e-03, -1.8323e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3378, -0.1462, -0.0119, -0.0146, -0.0099,  0.0043, -0.0069,  0.0080,
         0.0025, -0.0009, -0.0057, -0.0062,  0.0043, -0.0062, -0.0049,  0.0190,
        -0.0137, -0.0067, -0.1549, -0.0570, -0.0098, -0.0079,  0.0117, -0.0044,
        -0.0212, -0.0018, -0.0111, -0.0111,  0.0653,  0.0085, -0.0144,  0.0086,
        -0.0016, -0.0010,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.5058e-01, -1.0413e-01, -8.9778e-03, -7.3961e-03, -3.3399e-03,
         4.7959e-03, -4.4529e-03,  5.2855e-03,  7.0251e-04, -2.1987e-04,
        -1.5200e-03, -1.4632e-03,  1.8267e-03,  2.5808e-03, -3.0460e-03,
         2.9168e-03, -3.5644e-03, -4.2061e-03, -1.1892e-01, -1.2578e-02,
        -7.4859e-03, -4.3337e-03,  2.5485e-02, -2.3629e-03, -1.6672e-02,
        -1.3987e-03, -1.0068e-02, -2.8355e-03, -7.0751e-02, -2.4529e-03,
        -1.1965e-04,  2.4203e-03,  2.9677e-03, -3.0549e-03,  4.5263e-03,
         7.4855e-04, -6.4052e-02,  4.0311e-03,  3.3467e-03, -7.1540e-04,
        -1.2605e-03,  1.4146e-03, -8.3906e-04, -1.5005e-04, -1.4539e-03,
         1.6721e-02,  2.5166e-03, -3.2298e-03,  7.9805e-05,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.9023e-01, -1.4348e-01, -1.2704e-02, -1.3092e-02, -3.0344e-03,
        -2.2317e-03, -8.2255e-03,  9.5842e-03,  2.6662e-03, -1.0383e-04,
        -2.5790e-03, -3.0688e-03,  5.5080e-03, -3.8559e-03, -1.1012e-02,
         1.9957e-02,  1.6857e-04, -7.3263e-03, -9.6546e-02, -2.3770e-02,
        -9.3939e-03, -8.1791e-04,  1.8464e-02, -2.5833e-03, -1.8331e-02,
         5.5020e-04, -1.9424e-02, -9.7744e-03,  2.4530e-03,  6.0465e-04,
         7.7634e-03,  9.3786e-03,  3.6086e-03, -6.0273e-04, -5.3984e-02,
        -2.1279e-03, -1.4951e-03, -1.7910e-03,  8.0455e-04, -9.8899e-04,
         2.2443e-03,  4.2544e-02,  4.8667e-03,  6.7159e-03, -1.0741e-02,
        -7.8178e-04, -2.5897e-03,  1.6321e-03,  2.4747e-03, -1.1132e-03,
         2.1884e-04], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.3485e-01, -1.2379e-01, -1.4170e-02, -1.5211e-02, -2.6083e-03,
         8.4930e-03, -3.4018e-03,  1.1434e-02,  2.7105e-03,  4.0116e-03,
        -1.3633e-03,  5.0293e-04,  6.3841e-03,  8.8608e-04, -5.3572e-03,
        -3.8558e-03, -6.3917e-03, -5.0019e-03, -1.3933e-01, -6.3110e-02,
        -9.8813e-03,  6.0325e-03,  1.8560e-02,  6.8327e-04, -1.1581e-02,
         2.6399e-03, -1.7134e-02, -1.0412e-02,  3.9852e-02,  1.0323e-02,
         1.2262e-02, -6.3138e-03,  7.0253e-04, -6.0301e-04,  1.4947e-04,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.1462e-01, -1.6264e-01, -7.9310e-03, -9.5393e-03, -1.9035e-03,
         6.4842e-03, -2.3486e-03,  4.7242e-03, -3.3814e-05,  3.7309e-04,
        -2.5914e-03, -3.6940e-03,  3.5043e-03, -7.5843e-04, -8.9570e-03,
        -1.2106e-02, -5.9608e-03, -7.1083e-03, -1.6626e-01, -4.0266e-02,
        -7.0120e-03, -1.3675e-04, -1.8591e-02, -1.8958e-03, -1.8709e-02,
        -8.0607e-04, -1.0005e-02, -8.3781e-03,  3.8563e-02,  6.1850e-03,
        -1.0801e-02, -1.2967e-03,  7.0386e-03,  5.4331e-03, -1.6621e-03,
        -1.6842e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.7125e-01, -2.0971e-01, -1.3737e-02, -1.0543e-02, -2.8925e-03,
         5.4132e-03, -7.0064e-03,  5.0368e-03, -8.0839e-04, -2.0885e-03,
         7.3480e-04, -2.9688e-03, -1.8896e-04, -4.6878e-03, -1.2456e-02,
        -1.7910e-02, -3.8997e-03, -3.7226e-03, -1.4454e-01, -2.9114e-02,
        -1.0043e-02, -1.7624e-03,  2.5495e-02,  6.3855e-04, -4.3205e-03,
         3.1589e-03, -1.5805e-02, -1.3882e-02,  1.3213e-03, -2.1559e-04,
         7.0528e-03,  3.1085e-03,  4.5725e-03, -1.7541e-03, -1.3186e-01,
        -1.1104e-03,  4.5010e-03, -8.9970e-03,  6.6778e-04, -1.2008e-03,
        -5.2716e-03, -3.1098e-03, -1.4384e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1989, -0.1975, -0.0049, -0.0104, -0.0026, -0.0017, -0.0030, -0.0045,
         0.0007, -0.0002, -0.0032, -0.0020,  0.0018, -0.0030, -0.0080,  0.0087,
        -0.0063, -0.0083, -0.1880, -0.0363, -0.0081, -0.0181,  0.0057,  0.0029,
        -0.0213,  0.0027, -0.0104, -0.0113, -0.1565,  0.0015, -0.0038,  0.0071,
        -0.0028, -0.0009,  0.0119, -0.0047,  0.0341, -0.0033,  0.0007, -0.0021,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.7244e-01, -1.4703e-01, -1.2394e-02, -1.3449e-02, -6.3419e-03,
         2.3939e-03, -4.0137e-03,  4.9516e-03,  3.6027e-03,  4.6978e-03,
        -3.4770e-03, -1.0533e-03,  4.4816e-03, -1.0659e-02, -4.9380e-03,
         2.8361e-02, -8.2051e-03, -5.1736e-03, -1.7030e-01, -5.1661e-02,
        -1.1531e-02, -6.1714e-03,  9.9083e-03, -1.1991e-03, -1.6113e-02,
        -2.2336e-03, -2.1461e-02, -1.2024e-02,  2.2814e-03, -3.5660e-03,
        -2.1484e-03,  7.7871e-04, -1.9594e-02,  8.7451e-03,  5.6339e-03,
         5.2695e-03,  1.1109e-02,  2.6874e-04, -3.3686e-04,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3439, -0.0097, -0.0255, -0.0269, -0.0148, -0.3932,  0.0072, -0.0087,
        -0.0217, -0.0131,  0.0490, -0.0040, -0.0193, -0.0048, -0.0027,  0.0461,
        -0.0026, -0.0029, -0.0039,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #650: [tensor([-0.3767,  0.0372,  0.0112,  0.0135, -0.1898,  0.0147,  0.0239,  0.0228,
        -0.1593, -0.0070,  0.0118, -0.0119, -0.0060,  0.0261, -0.0008,  0.0541,
         0.0057,  0.0174,  0.0032, -0.0068,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.2421e-01, -3.4898e-03, -9.1725e-03, -2.4918e-02, -1.4015e-02,
        -6.3130e-02, -7.7145e-02, -3.7057e-03, -1.1349e-02, -2.0001e-02,
        -3.7488e-01, -7.5264e-03, -1.5531e-02, -1.7007e-02, -1.9970e-03,
        -2.2196e-03, -3.2643e-05, -1.7330e-02, -5.4891e-03,  1.0102e-03,
        -5.8308e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2705, -0.0108, -0.0249, -0.0215, -0.0125, -0.0772, -0.0054, -0.0029,
        -0.0122, -0.0205, -0.4466, -0.0070, -0.0115, -0.0074,  0.0223, -0.0012,
        -0.0216,  0.0033, -0.0043, -0.0023, -0.0024,  0.0006, -0.0009,  0.0049,
        -0.0040, -0.0014], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.1107e-01,  9.7063e-03, -1.4482e-02, -9.7421e-03, -2.1559e-02,
        -3.1993e-02,  4.8528e-02, -1.9131e-03,  5.4696e-03, -2.4615e-02,
        -4.1846e-01, -7.9889e-03, -1.2740e-02, -1.3984e-02,  1.8896e-03,
         2.1262e-02, -1.2738e-01,  3.3379e-04,  4.0463e-03, -1.4687e-03,
        -5.0830e-04, -5.6595e-03, -5.1998e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.7217e-01, -5.3486e-04, -1.9757e-02, -2.2141e-02, -1.2589e-01,
        -8.1872e-03, -5.0112e-01, -8.1408e-03, -1.3030e-02, -2.1506e-02,
         1.9036e-02, -2.0507e-03, -3.1512e-02, -3.8491e-03, -3.2038e-03,
        -4.8711e-03,  3.0603e-02, -5.9436e-03, -3.9961e-04, -2.0519e-03,
        -3.9964e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3795, -0.0034, -0.0427, -0.0325, -0.0890, -0.0142, -0.3478,  0.0006,
        -0.0242, -0.0091,  0.0066, -0.0091,  0.0042,  0.0026,  0.0260,  0.0040,
         0.0031,  0.0015,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.1539e-01,  5.1443e-03, -1.7606e-02, -2.3339e-02, -8.6748e-02,
        -4.6917e-03, -5.2040e-01,  3.8993e-03, -2.0672e-02, -2.2731e-02,
         7.9441e-03,  5.3145e-04, -3.5337e-02, -7.4202e-03,  5.1390e-03,
         1.5169e-02, -3.1241e-04, -7.5264e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 9.7730e-03, -2.1596e-03, -2.8593e-02, -5.5079e-02, -1.2588e-01,
        -1.8610e-02, -6.1022e-01, -1.5993e-02, -2.7075e-02, -3.8090e-02,
        -1.3574e-02, -2.9771e-02,  1.6090e-03,  5.5501e-03, -1.1117e-02,
         4.9788e-04, -1.2671e-03, -5.1401e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.4418,  0.0194, -0.0151, -0.0285, -0.0185, -0.0132, -0.2639,  0.0284,
        -0.0157, -0.0179,  0.0071,  0.0021, -0.1178,  0.0054, -0.0051,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.3583e-01,  1.1510e-02, -4.4046e-02, -3.9667e-02, -5.9077e-02,
        -2.3488e-02, -3.9345e-01,  1.3480e-02, -1.6468e-02, -3.3738e-02,
         1.0401e-02, -2.6124e-03,  1.1521e-04, -9.8343e-03, -3.1564e-03,
        -1.1063e-03, -2.0174e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.2260e-01,  4.9088e-03, -1.8165e-02, -1.2681e-02, -3.8905e-02,
        -8.0387e-03, -3.0503e-01,  1.0974e-02, -1.5235e-02, -2.3523e-02,
         4.7893e-02, -3.3406e-03, -1.6019e-02, -6.8705e-03, -1.6032e-01,
         2.9114e-03,  8.1909e-05, -2.5034e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2960, -0.0004, -0.0117, -0.0143, -0.0538, -0.0093, -0.3736,  0.0136,
        -0.0157, -0.0134,  0.0044, -0.0045, -0.0084, -0.1637,  0.0092, -0.0076,
        -0.0004,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #700: [tensor([-3.4322e-01, -1.4670e-01,  7.6607e-03, -1.3538e-04, -1.6153e-01,
         8.6618e-03, -5.4860e-04,  2.1853e-03, -1.5761e-01, -3.4570e-03,
         8.3012e-04, -9.4789e-03, -1.0321e-02, -9.5114e-02,  1.3774e-02,
        -6.0316e-03, -6.9198e-03, -7.7709e-03,  5.1838e-03,  7.5757e-03,
        -4.6594e-03, -6.3138e-04,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.8308e-01, -1.5981e-01,  1.8326e-03, -1.4770e-03, -1.5926e-01,
         1.3511e-02, -3.6284e-03,  1.4201e-03, -1.1909e-01, -7.8575e-03,
        -3.9027e-04, -5.9331e-03, -4.2495e-03, -8.6804e-02,  6.7274e-03,
         1.6339e-03, -1.2628e-02,  6.2713e-03, -3.7659e-03, -3.3448e-03,
        -6.7598e-02, -2.0769e-04,  1.1332e-04,  1.6232e-03,  3.9798e-02,
         1.4372e-03, -5.7620e-03, -7.5099e-04,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3450, -0.1149,  0.0054, -0.0218,  0.0216, -0.1006,  0.0121, -0.0037,
         0.0132, -0.0969,  0.0030, -0.0095, -0.0036,  0.0933,  0.0139,  0.0277,
         0.0041, -0.0014,  0.0917,  0.0109, -0.0035, -0.0023,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.9513e-01, -1.1823e-01,  1.6084e-03, -4.6331e-02,  1.3985e-02,
        -9.2500e-02,  1.0779e-02, -5.2803e-03, -1.5644e-02, -8.6276e-02,
         1.9631e-03, -6.0267e-03, -8.6876e-03,  2.3137e-03,  3.0765e-02,
        -8.1684e-02,  3.9520e-03,  1.1169e-02,  5.7668e-03, -5.0196e-02,
         7.5546e-03, -1.1355e-03, -4.2821e-03, -4.3567e-03, -4.7644e-03,
        -5.5649e-03, -7.1752e-02, -5.8547e-03,  1.9024e-03, -4.7045e-05,
        -4.4988e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3186, -0.1336,  0.0064, -0.0203,  0.0275, -0.1096,  0.0104,  0.0020,
        -0.0202, -0.1095,  0.0032, -0.0057, -0.0044,  0.0026,  0.0441, -0.0978,
         0.0138,  0.0004, -0.0543,  0.0126,  0.0020,  0.0010,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.4362, -0.1233,  0.0084, -0.0143,  0.0295, -0.0961,  0.0202, -0.0032,
        -0.0060, -0.0961,  0.0051, -0.0141, -0.0074,  0.0617,  0.0097,  0.0326,
         0.0025,  0.0124,  0.0007,  0.0112, -0.0030, -0.0065,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.6620e-01, -1.3663e-01,  9.4124e-03, -3.0684e-03,  1.8124e-02,
        -1.0708e-01,  2.0895e-02,  2.6668e-03, -1.8127e-02, -1.1970e-01,
         4.2886e-03, -6.5939e-03, -6.8328e-03, -5.5950e-02,  1.7550e-02,
        -1.0156e-03,  3.1117e-04, -1.0611e-03,  4.4911e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.4294, -0.1557,  0.0039, -0.0109,  0.0198, -0.1119,  0.0122, -0.0098,
         0.0055, -0.1237,  0.0020, -0.0097, -0.0032,  0.0048, -0.0185,  0.0156,
         0.0050, -0.0096, -0.0341,  0.0104, -0.0035,  0.0007,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.5433e-01, -1.4958e-01,  1.5475e-02, -3.3323e-02,  3.1639e-02,
        -8.0099e-02,  9.7032e-03,  4.1699e-04,  2.1502e-02, -1.0475e-01,
         4.4651e-03, -8.7741e-03, -6.5947e-03,  9.4103e-02,  2.3218e-02,
         4.9173e-02,  4.1616e-03,  8.3599e-03,  8.4505e-05,  2.4911e-04,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.4740, -0.1756,  0.0068, -0.0183,  0.0082, -0.1253,  0.0172, -0.0068,
        -0.0050, -0.1048, -0.0024, -0.0129, -0.0049,  0.0025,  0.0119,  0.0024,
        -0.0022, -0.0094, -0.0028,  0.0010, -0.0033, -0.0024,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3587, -0.1097,  0.0156, -0.0145,  0.0341, -0.0894,  0.0102, -0.0137,
        -0.0245, -0.1339, -0.0005, -0.0095, -0.0012,  0.0043, -0.0281,  0.0144,
         0.0106, -0.0185,  0.0909,  0.0080, -0.0053, -0.0042,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3158, -0.1667,  0.0082, -0.0263,  0.0432, -0.1378,  0.0265, -0.0050,
         0.0168, -0.1410,  0.0013, -0.0128, -0.0018, -0.0275,  0.0227, -0.0013,
         0.0323, -0.0078,  0.0051,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #750: [tensor([-1.7710e-01, -2.7083e-01, -7.9282e-03, -2.0937e-02, -2.7183e-01,
        -1.0407e-02,  1.5703e-03,  8.7881e-03,  3.8825e-03,  6.7255e-03,
        -1.4194e-02, -1.1304e-02, -1.1317e-02,  8.8135e-03, -1.2667e-03,
        -1.7470e-04,  1.7944e-03,  4.3341e-03, -2.4960e-02,  8.8157e-03,
         1.2121e-03, -1.1911e-01,  4.2131e-03,  2.6498e-03, -5.4522e-03,
         3.9964e-04,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2286, -0.2300, -0.0063, -0.0131, -0.1850, -0.0027, -0.0009,  0.0046,
         0.0035, -0.0007, -0.0088, -0.0068, -0.1809, -0.0071, -0.0028, -0.0067,
         0.0039, -0.0149, -0.0832,  0.0034, -0.0008, -0.0046, -0.0008,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2487, -0.1882, -0.0223, -0.0184, -0.2071, -0.0037,  0.0043,  0.0028,
         0.0064, -0.0038, -0.0148, -0.0151, -0.0847, -0.0088, -0.0118, -0.0019,
        -0.0017, -0.1203, -0.0042, -0.0236,  0.0020, -0.0055,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2632, -0.1680, -0.0091, -0.0172, -0.2082,  0.0023,  0.0038,  0.0086,
         0.0022,  0.0058, -0.0169, -0.0075, -0.1294, -0.0034, -0.0104, -0.1378,
         0.0021, -0.0027, -0.0014,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.1891e-01, -1.5860e-01, -1.9241e-02, -3.3501e-03, -1.7061e-01,
        -3.6867e-04,  1.0795e-03,  8.2075e-04,  3.0710e-03, -2.7288e-03,
        -4.9138e-03, -2.0513e-03, -1.5144e-01, -8.6525e-03, -1.2211e-02,
        -4.1008e-03, -2.9255e-04,  3.1611e-03,  2.5632e-04, -6.2744e-03,
        -1.1827e-01, -2.6345e-04, -1.5456e-03, -2.6067e-03, -5.1762e-03,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2986, -0.2164, -0.0157, -0.0196, -0.2294, -0.0057,  0.0020,  0.0048,
         0.0022,  0.0014, -0.0087, -0.0041, -0.1598, -0.0026,  0.0023, -0.0141,
        -0.0127,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2067, -0.2212, -0.0106, -0.0199, -0.2283, -0.0017, -0.0013,  0.0066,
        -0.0034,  0.0025, -0.0120, -0.0079, -0.1987, -0.0072, -0.0062, -0.0126,
        -0.0238, -0.0073, -0.0142, -0.0080,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2905, -0.1426, -0.0062, -0.0068, -0.2170,  0.0040,  0.0011,  0.0100,
         0.0090,  0.0006, -0.0042, -0.0078, -0.1865, -0.0093, -0.0278, -0.0053,
        -0.0592, -0.0034, -0.0037, -0.0050,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3067, -0.2326, -0.0136, -0.0148, -0.1806, -0.0016,  0.0032,  0.0083,
         0.0149,  0.0084, -0.0087, -0.0079, -0.1156, -0.0036,  0.0213, -0.0062,
        -0.0297, -0.0013, -0.0010,  0.0125, -0.0023, -0.0053,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.9469e-01, -2.0505e-01,  4.6364e-03, -9.9019e-04, -1.1423e-02,
        -3.8991e-02,  1.2485e-02, -4.5488e-03, -7.5867e-03, -1.6637e-02,
        -1.7268e-01,  5.7287e-03,  9.5894e-05, -8.9954e-03, -9.7014e-03,
         8.5720e-02,  1.3532e-03, -6.3062e-04,  4.6465e-03,  8.4514e-03,
        -1.2103e-03, -8.7299e-03, -3.1260e-03, -7.4986e-02, -3.9356e-03,
        -9.5230e-04, -1.2023e-02], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.0291e-01, -1.6338e-01,  6.1393e-03, -4.1504e-03, -7.9700e-02,
        -2.0394e-02, -7.7508e-04, -4.9940e-05, -1.3575e-02, -1.5347e-02,
        -2.9650e-01, -1.7686e-03, -1.4590e-03, -9.2224e-03, -1.1100e-02,
         6.6120e-02,  7.6618e-03, -1.7447e-04, -1.1622e-02, -5.5311e-03,
        -1.3428e-02, -1.3179e-03,  5.2849e-02, -5.5733e-03, -5.1320e-03,
        -4.1254e-03,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.1871e-01, -1.7987e-01, -1.6361e-03, -1.5378e-04, -4.9891e-02,
        -2.8915e-02,  5.8048e-03, -1.6044e-03, -3.8379e-03, -7.4983e-03,
        -2.2398e-01,  4.6143e-03,  2.3076e-03, -2.9433e-03, -8.8800e-03,
         5.3315e-02, -4.4585e-03, -3.1939e-03,  7.1418e-03, -3.2494e-02,
        -4.4205e-03, -1.4077e-01, -4.6047e-03, -5.1933e-03, -3.7539e-03,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #800: [tensor([-0.3458, -0.2227, -0.0085, -0.0057, -0.0014, -0.0135, -0.0385, -0.2334,
         0.0045, -0.0074, -0.0125, -0.0062, -0.0060, -0.0081,  0.0487, -0.0045,
        -0.0173,  0.0011,  0.0030, -0.0048, -0.0062,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.1007e-02, -6.7575e-03, -9.7480e-04, -3.1103e-03, -1.6844e-03,
        -7.3484e-03, -6.4825e-03, -2.8105e-03, -9.9875e-03, -4.6479e-03,
        -4.1985e-01, -2.6667e-03, -2.2080e-03, -4.3659e-03, -9.1287e-02,
        -1.5172e-02, -1.2540e-03, -5.3562e-03, -3.0542e-01, -6.3360e-04,
        -1.1227e-03, -1.6377e-03,  9.9819e-05, -3.5470e-03, -3.7593e-03,
        -4.0083e-03, -3.1714e-03, -3.1252e-02, -4.9069e-04, -2.6150e-03,
        -2.2736e-03, -2.9953e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1236, -0.0050, -0.0046, -0.0083, -0.0074, -0.0058, -0.0033, -0.0033,
        -0.0120, -0.0099, -0.2300, -0.0019, -0.0041, -0.0054, -0.1208, -0.0133,
        -0.0054, -0.0066, -0.0028, -0.0065, -0.0030, -0.0238, -0.3773, -0.0016,
        -0.0048,  0.0014, -0.0027, -0.0052,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0904, -0.0012, -0.0074, -0.0068, -0.0041, -0.0050, -0.0046, -0.0074,
        -0.0127, -0.0162, -0.3048, -0.0031, -0.0034, -0.0118, -0.0699, -0.0114,
        -0.0038, -0.0055, -0.0020, -0.0007, -0.0006, -0.0012, -0.0033, -0.0059,
         0.0010, -0.4066, -0.0036, -0.0014, -0.0044,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0066, -0.3803, -0.0309, -0.0239, -0.0147, -0.0088, -0.2861,  0.0006,
         0.0108, -0.0316, -0.0271, -0.0137, -0.0053,  0.0294, -0.0175, -0.0078,
        -0.0060, -0.0612, -0.0007, -0.0165, -0.0205,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3134, -0.2510, -0.0056, -0.0126, -0.0068, -0.0003, -0.1950, -0.0013,
         0.0050, -0.0138, -0.0112, -0.0602, -0.0047,  0.0027, -0.0222,  0.0727,
         0.0055, -0.0072, -0.0087,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1451, -0.1714, -0.0066, -0.0107, -0.0069, -0.0042, -0.1649, -0.0024,
         0.0068, -0.0070, -0.0088, -0.1479, -0.0117, -0.0058, -0.1207, -0.0047,
        -0.0006, -0.1518,  0.0030,  0.0055, -0.0011, -0.0070, -0.0054,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0592, -0.0042, -0.0030, -0.0477, -0.0181, -0.0062, -0.0130, -0.0029,
        -0.0034, -0.0027, -0.0075, -0.0063, -0.0148, -0.7934, -0.0023, -0.0061,
        -0.0090,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 9.1351e-03, -1.5262e-03,  3.5495e-03, -2.2416e-02, -8.9207e-03,
        -1.6770e-03, -9.1034e-03, -1.5574e-03, -3.5261e-03, -8.0594e-04,
        -3.2197e-03, -6.4600e-03, -6.7620e-03, -5.9455e-03, -1.1077e-02,
        -8.7468e-01, -3.5816e-03, -3.6526e-03, -7.8687e-03, -2.7740e-03,
        -3.5497e-03, -3.1399e-03, -5.0725e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0839, -0.0045,  0.0028, -0.0328, -0.0098, -0.0077, -0.0158, -0.0052,
        -0.0010,  0.0012, -0.0053, -0.7875, -0.0052, -0.0053, -0.0106, -0.0039,
        -0.0053, -0.0033, -0.0090,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.7321e-01, -3.6940e-01, -7.6401e-03, -4.3065e-03,  3.0115e-03,
        -4.0662e-03, -1.3165e-02,  2.4302e-03, -5.2855e-03,  9.6315e-03,
         2.2692e-03, -1.1142e-02, -1.5626e-02, -2.3134e-01,  1.8799e-04,
         2.5386e-03, -2.9927e-04, -2.2106e-03, -2.9330e-03,  2.0754e-02,
        -5.4117e-03, -3.5189e-03, -2.4918e-03, -7.1300e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.1017, -0.2287, -0.0017, -0.0031, -0.0007, -0.0030, -0.0064, -0.0093,
        -0.1561, -0.0068, -0.0043, -0.0042, -0.0077, -0.4269, -0.0010, -0.0030,
        -0.0008, -0.0011, -0.0039, -0.0065, -0.0031, -0.0033, -0.0017, -0.0019,
        -0.0026, -0.0004, -0.0036, -0.0026, -0.0038,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #850: [tensor([-0.1445, -0.0146, -0.0678, -0.0247, -0.0325, -0.0047, -0.0017,  0.0048,
        -0.1380, -0.0278, -0.0243,  0.0011, -0.0049, -0.0741, -0.0105, -0.0072,
        -0.0070, -0.0075, -0.0632, -0.0068, -0.0019, -0.0310, -0.0077, -0.0099,
        -0.0033, -0.1474, -0.0026, -0.0058, -0.1008, -0.0103, -0.0032, -0.0083],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1642, -0.0324, -0.0221, -0.0082, -0.0433, -0.0048, -0.0017,  0.0040,
        -0.1365, -0.0217, -0.0199,  0.0037, -0.0108, -0.0973, -0.0162, -0.0084,
        -0.0107, -0.0378, -0.0071, -0.3124, -0.0115, -0.0085, -0.0027, -0.0032,
        -0.0109,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-7.0080e-02, -6.3466e-03, -2.9126e-03, -9.2423e-03, -3.5272e-02,
        -1.6866e-01, -4.1160e-04, -3.9306e-03, -4.4812e-03, -2.1802e-02,
        -3.8163e-03,  2.2965e-04, -4.1053e-03, -2.0505e-03, -4.8176e-03,
        -3.1614e-01, -6.1684e-03, -1.3883e-02, -3.1172e-01, -3.1024e-03,
        -4.5338e-03, -6.2946e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0290, -0.0164, -0.0375, -0.0171, -0.1370, -0.5752, -0.0030, -0.0185,
        -0.0090, -0.0462, -0.0149, -0.0079, -0.0067, -0.0073, -0.0147, -0.0176,
        -0.0065, -0.0068, -0.0027, -0.0111,  0.0015, -0.0015, -0.0037, -0.0081,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-9.5750e-02, -1.1428e-02, -9.3864e-03, -1.0186e-02, -2.2914e-02,
        -1.8821e-01, -2.4976e-03, -4.9641e-03, -3.7378e-03, -1.6649e-02,
        -5.0049e-03,  7.4063e-05, -5.7277e-03, -6.9871e-03, -6.0257e-03,
        -3.1718e-01, -2.9050e-03, -3.3450e-03, -1.0216e-02, -2.4389e-01,
        -5.2842e-04, -4.2222e-03, -5.0203e-03, -8.0562e-03, -5.3004e-03,
         3.5701e-04, -3.7506e-03, -2.1308e-03, -3.5501e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0828, -0.1541, -0.0068, -0.1336,  0.0004, -0.0007, -0.0035, -0.1805,
        -0.0014, -0.0080, -0.0957, -0.2313, -0.0004, -0.0110, -0.0071,  0.0351,
         0.0030, -0.0052, -0.0165, -0.0051,  0.0039, -0.0003, -0.0044, -0.0090,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-9.4457e-02, -8.9441e-02, -7.2681e-04, -8.8245e-02, -9.7039e-04,
        -2.8213e-03,  1.8293e-03, -1.6251e-01,  5.9502e-04, -7.4859e-03,
        -2.7410e-02, -1.3348e-01,  5.2060e-04, -7.0875e-03, -6.2784e-03,
         4.0354e-02,  9.0579e-05, -2.9231e-02,  1.5566e-03, -1.5305e-01,
         1.9285e-03, -2.1138e-03, -1.6402e-05, -5.1418e-03, -1.2632e-01,
        -4.8787e-04, -5.4204e-03, -3.9749e-03, -6.4590e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1538, -0.1435, -0.0063, -0.0724, -0.0007, -0.0030, -0.0056, -0.2318,
         0.0012, -0.0096, -0.0526, -0.2260, -0.0028, -0.0067, -0.0055,  0.0330,
         0.0009, -0.0161, -0.0043, -0.0085, -0.0054,  0.0046, -0.0043, -0.0014,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1585, -0.0849, -0.0040, -0.1273, -0.0022, -0.2396,  0.0036, -0.0031,
        -0.0153, -0.2271,  0.0027, -0.0044, -0.0072, -0.0058,  0.0559, -0.0056,
        -0.0367,  0.0075, -0.0051, -0.0037,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1339, -0.1078, -0.0020, -0.2046,  0.0014, -0.1790,  0.0039, -0.0027,
        -0.0060, -0.2186, -0.0056, -0.0056, -0.0085, -0.0152,  0.0310, -0.0065,
        -0.0476,  0.0007, -0.0069, -0.0124,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0378, -0.1678, -0.0035, -0.1857, -0.0100, -0.1939,  0.0013, -0.0057,
        -0.0044, -0.2660, -0.0031, -0.0067, -0.0068, -0.0059, -0.0532, -0.0026,
        -0.0269,  0.0006, -0.0055, -0.0025, -0.0040, -0.0063,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0439, -0.0145, -0.0868, -0.0098, -0.0070, -0.3059, -0.0042, -0.0067,
        -0.0035, -0.0063, -0.0068, -0.0055, -0.0205, -0.4659, -0.0031, -0.0043,
        -0.0054,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #900: [tensor([-0.0088, -0.3590, -0.0445, -0.0171, -0.0019, -0.0027,  0.0021,  0.0012,
         0.0022, -0.4508, -0.0066, -0.0148, -0.0201,  0.0144, -0.0068, -0.0101,
        -0.0024, -0.0055, -0.0091, -0.0068, -0.0130,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 9.0122e-02, -3.4960e-01, -2.3167e-02, -1.0514e-02, -1.9740e-02,
         3.5312e-04,  1.1588e-03, -3.7752e-03, -7.8499e-05, -3.9904e-01,
        -7.5964e-03, -2.1283e-03, -6.3701e-03, -1.4377e-02, -8.4226e-03,
        -1.1079e-02, -1.5633e-03,  1.6832e-03, -2.7792e-02,  4.0072e-03,
        -1.8258e-03, -5.1592e-03, -1.0446e-02,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0952, -0.0048, -0.0654, -0.0734, -0.0081, -0.4776, -0.0280, -0.0034,
        -0.0030, -0.1197, -0.0037, -0.0016, -0.0054, -0.0029, -0.0116, -0.0157,
        -0.0058, -0.0035, -0.0040, -0.0573, -0.0034, -0.0014, -0.0050,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 1.4849e-02, -3.0073e-03, -6.3396e-02, -2.9663e-02, -2.4707e-03,
        -2.6391e-01, -3.4773e-02, -5.2639e-03,  3.0989e-04, -1.5822e-01,
        -1.8595e-03, -8.4373e-04, -4.6404e-03, -1.2309e-02, -1.8230e-02,
        -8.3068e-03, -1.0001e-02, -1.1541e-02, -3.4492e-01, -3.1099e-03,
        -1.5899e-03, -6.7895e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 8.1392e-02, -5.0375e-03, -4.1827e-02, -2.2565e-02, -5.5913e-03,
        -2.2808e-01, -9.9641e-03, -5.2265e-03, -4.5600e-03, -9.5901e-02,
        -4.2131e-04, -2.2957e-03, -5.0236e-03, -5.8631e-03, -1.1404e-02,
        -3.8293e-03, -1.8913e-03, -4.5525e-01, -7.0256e-03, -1.2142e-03,
        -5.6420e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 1.0433e-01, -1.5431e-01, -4.8439e-03,  2.5262e-04, -3.9875e-03,
        -1.9902e-02, -3.2284e-03, -8.2336e-03, -1.3683e-03, -2.1207e-01,
        -3.0220e-03, -2.3439e-03, -8.8526e-03, -4.2154e-01, -5.0813e-03,
        -2.8768e-02, -5.6306e-03, -1.4690e-03, -4.4622e-03, -6.3076e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 1.1442e-01, -1.6639e-01, -1.1529e-04, -1.1802e-03, -3.9256e-03,
        -1.2779e-02, -7.0976e-03, -9.5659e-03,  2.2352e-04, -1.6513e-01,
        -1.5450e-03, -5.1514e-03, -9.7283e-03, -4.3811e-01, -1.3358e-03,
        -3.1020e-02, -3.7529e-03, -6.0426e-03, -5.6418e-03, -7.0064e-03,
        -4.0321e-03, -5.8113e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0488, -0.1672, -0.0063, -0.0019, -0.0040, -0.0066, -0.0040, -0.0092,
        -0.0031, -0.1760, -0.0010, -0.0024, -0.0075, -0.4837, -0.0028, -0.0501,
        -0.0054, -0.0050, -0.0062, -0.0023, -0.0065,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 1.0778e-01, -1.2697e-01, -1.0417e-02, -9.1792e-04, -1.6006e-02,
        -2.5371e-02, -9.2592e-03, -1.6010e-04, -2.4662e-01, -5.4607e-03,
        -2.9691e-03, -1.1603e-03, -4.2507e-03, -5.9081e-03, -1.3308e-02,
        -7.2802e-03, -1.3696e-03, -8.9447e-03, -1.4587e-02, -9.5431e-03,
        -1.1697e-03, -3.6166e-01, -4.3542e-03, -5.8819e-03, -1.7088e-03,
        -6.9409e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 1.2328e-01, -9.8562e-02, -1.1938e-02, -3.6834e-04, -6.9235e-02,
        -4.6046e-02, -1.0675e-02, -1.2258e-03, -5.2892e-01, -9.0926e-03,
        -5.7866e-03, -1.0251e-03, -7.0027e-03, -1.7174e-02, -1.8319e-02,
        -6.0279e-03, -4.2944e-03, -1.5991e-02, -1.4883e-02, -1.5626e-03,
        -2.3911e-03, -6.1959e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.1242, -0.1385, -0.0277, -0.0028, -0.0226, -0.1146, -0.0249,  0.0015,
        -0.4514, -0.0058, -0.0022, -0.0079, -0.0099, -0.0169, -0.0302, -0.0091,
        -0.0020, -0.0078,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.1630, -0.0118, -0.1462, -0.0055, -0.0024, -0.5795, -0.0014, -0.0052,
        -0.0106, -0.0044, -0.0183, -0.0219, -0.0163, -0.0055, -0.0081,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #950: [tensor([ 9.2672e-02, -2.6179e-01, -4.0992e-03, -2.3896e-03,  1.7459e-06,
        -5.4639e-01, -2.6375e-03, -5.8941e-03, -6.5798e-03, -2.8819e-03,
        -6.0391e-03, -2.8487e-03, -3.8834e-03, -5.8056e-03, -7.0173e-03,
        -9.4337e-03, -7.5538e-04, -4.6473e-03, -5.0897e-03, -1.8457e-02,
        -4.1575e-03, -3.1590e-03, -3.3678e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.1114, -0.2123, -0.0031, -0.0035, -0.0007, -0.3365, -0.0014, -0.0044,
        -0.0053, -0.0041, -0.0077, -0.0041, -0.0026, -0.0032, -0.0050, -0.0063,
         0.0003, -0.0033, -0.0120, -0.0050, -0.0023, -0.2522, -0.0040, -0.0041,
        -0.0009, -0.0045], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2103,  0.5731,  0.0305,  0.0008,  0.0014,  0.0056,  0.0129,  0.0041,
         0.0079,  0.0659,  0.0042,  0.0038,  0.0033,  0.0337,  0.0030,  0.0041,
         0.0087,  0.0063,  0.0104,  0.0036,  0.0063,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0311,  0.5423,  0.0102, -0.0012,  0.0029,  0.0019,  0.0081,  0.0040,
         0.0052,  0.0278,  0.0036,  0.0041,  0.0042,  0.0168,  0.0026,  0.0016,
         0.3026,  0.0039,  0.0077,  0.0047,  0.0076,  0.0011,  0.0049,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 1.0385e-01, -7.1139e-01, -1.4484e-02, -2.1433e-04, -3.0061e-03,
        -5.5250e-03, -1.6205e-02, -4.6130e-03, -9.6827e-03, -4.7896e-02,
        -6.0844e-03, -5.6567e-03, -2.1476e-03, -2.3691e-02, -2.0689e-03,
        -3.6062e-03, -8.9567e-03, -7.1611e-03, -1.3611e-02, -3.9346e-03,
        -6.2147e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3543, 0.0549, 0.1099, 0.1011, 0.0328, 0.1003, 0.0071, 0.0158, 0.0207,
        0.0170, 0.0500, 0.0710, 0.0359, 0.0107, 0.0183, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2924, 0.0382, 0.2186, 0.0750, 0.0304, 0.1136, 0.0043, 0.0110, 0.0193,
        0.0459, 0.0482, 0.0339, 0.0352, 0.0094, 0.0246, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2758, 0.0324, 0.1006, 0.0693, 0.0262, 0.0614, 0.0036, 0.0167, 0.1156,
        0.0297, 0.0774, 0.0299, 0.0207, 0.0895, 0.0278, 0.0091, 0.0146, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 5.7924e-02, -6.8105e-01, -7.5662e-04, -1.7226e-02, -7.8751e-03,
        -5.1907e-02, -5.3622e-03, -7.3240e-03, -2.0685e-03,  1.0167e-04,
        -5.1566e-03, -1.1773e-01, -6.3470e-03, -1.3645e-02, -3.9563e-03,
        -1.0352e-02, -3.8595e-03, -7.3616e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.4867e-02,  4.4891e-01,  2.0551e-03,  9.3388e-03,  2.9365e-03,
         2.2311e-02,  5.8951e-03,  4.9724e-03,  9.8411e-04,  3.0948e-05,
         3.5923e-03,  1.4636e-01,  6.4698e-03,  7.7248e-03,  4.8618e-03,
         5.9555e-03,  5.1829e-03,  7.4749e-03,  5.6735e-03,  4.6325e-03,
         4.2210e-03,  9.5620e-03,  2.5465e-01,  5.1594e-03,  1.7147e-03,
         4.4630e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.9663e-02,  5.3783e-01,  2.2322e-03,  1.2375e-02,  5.7652e-03,
         1.4661e-02,  6.0371e-03,  7.2492e-03,  2.5520e-03, -1.5080e-06,
         3.2233e-03,  2.9268e-01,  9.8950e-03,  9.3237e-03,  5.4538e-03,
         7.0261e-03,  1.7649e-02,  6.2645e-03,  3.3076e-03,  6.8159e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0189, -0.0073, -0.0037, -0.0057, -0.0041, -0.0029, -0.5575, -0.0022,
        -0.0039, -0.0598, -0.0024,  0.0007, -0.0039, -0.2619, -0.0033, -0.0037,
        -0.0109, -0.0225, -0.0048, -0.0084, -0.0057, -0.0012, -0.0046,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1000: [tensor([0.3697, 0.0562, 0.0059, 0.0161, 0.0063, 0.0202, 0.0063, 0.0061, 0.0081,
        0.0046, 0.0218, 0.0460, 0.0034, 0.0025, 0.0055, 0.1667, 0.0116, 0.0171,
        0.0132, 0.0438, 0.1411, 0.0047, 0.0105, 0.0043, 0.0082, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3004, 0.1153, 0.0103, 0.0203, 0.0114, 0.0286, 0.0084, 0.0093, 0.0180,
        0.0079, 0.0319, 0.0937, 0.0044, 0.0017, 0.0081, 0.1510, 0.0360, 0.0164,
        0.0102, 0.0048, 0.0537, 0.0195, 0.0125, 0.0083, 0.0035, 0.0037, 0.0106],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2321, 0.0667, 0.0057, 0.0149, 0.0092, 0.0169, 0.0092, 0.0098, 0.0108,
        0.0082, 0.0222, 0.0497, 0.0032, 0.0030, 0.0049, 0.2478, 0.0238, 0.0121,
        0.0072, 0.0119, 0.0151, 0.1753, 0.0218, 0.0073, 0.0111, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3378, 0.0739, 0.0096, 0.0184, 0.0113, 0.0097, 0.0426, 0.0497, 0.0043,
        0.0114, 0.0558, 0.0074, 0.0008, 0.0073, 0.0316, 0.0547, 0.2306, 0.0214,
        0.0118, 0.0099, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3495, 0.1377, 0.0089, 0.0165, 0.0159, 0.0139, 0.0457, 0.0666, 0.0042,
        0.0152, 0.0904, 0.0181, 0.0071, 0.0083, 0.0320, 0.0799, 0.0089, 0.0192,
        0.0090, 0.0367, 0.0054, 0.0111, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3975, 0.0924, 0.0079, 0.0237, 0.0116, 0.0096, 0.0382, 0.0509, 0.0057,
        0.0126, 0.0658, 0.0116, 0.0039, 0.0066, 0.0179, 0.0682, 0.0149, 0.0750,
        0.0154, 0.0204, 0.0058, 0.0099, 0.0099, 0.0173, 0.0074, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3434, 0.0611, 0.0111, 0.0078, 0.0139, 0.0068, 0.0033, 0.0078, 0.0066,
        0.0060, 0.0611, 0.0068, 0.0066, 0.0062, 0.3288, 0.0232, 0.0150, 0.0167,
        0.0224, 0.0141, 0.0130, 0.0047, 0.0134, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4342, 0.0787, 0.0055, 0.0116, 0.0135, 0.0061, 0.0042, 0.0072, 0.0072,
        0.0052, 0.0531, 0.0038, 0.0096, 0.0056, 0.1438, 0.0117, 0.0169, 0.0158,
        0.0102, 0.0059, 0.1243, 0.0041, 0.0120, 0.0095, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3568, 0.0629, 0.0113, 0.0080, 0.0147, 0.0057, 0.0042, 0.0059, 0.0079,
        0.0035, 0.0562, 0.0038, 0.0035, 0.0057, 0.1364, 0.0123, 0.0161, 0.0155,
        0.0355, 0.0076, 0.0336, 0.1713, 0.0117, 0.0096, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2878, 0.0584, 0.0047, 0.0013, 0.0122, 0.0063, 0.0147, 0.0209, 0.0097,
        0.0074, 0.0082, 0.0056, 0.0896, 0.0045, 0.0012, 0.0070, 0.2466, 0.0068,
        0.0428, 0.0122, 0.1247, 0.0141, 0.0048, 0.0085, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2766, 0.0797, 0.0057, 0.0022, 0.0105, 0.0062, 0.0091, 0.0227, 0.0098,
        0.0077, 0.0050, 0.0073, 0.0643, 0.0032, 0.0012, 0.0088, 0.2453, 0.0120,
        0.0165, 0.0571, 0.0043, 0.1185, 0.0078, 0.0062, 0.0122, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3344, 0.0649, 0.0048, 0.0057, 0.0107, 0.0064, 0.0096, 0.0293, 0.0072,
        0.0057, 0.0070, 0.0090, 0.0762, 0.0046, 0.0018, 0.0066, 0.2542, 0.0119,
        0.0697, 0.0170, 0.0421, 0.0079, 0.0045, 0.0089, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1050: [tensor([0.4242, 0.1120, 0.0130, 0.0167, 0.0039, 0.0094, 0.0256, 0.0062, 0.0445,
        0.0399, 0.0077, 0.0072, 0.1310, 0.0287, 0.0231, 0.0066, 0.0198, 0.0184,
        0.0181, 0.0157, 0.0144, 0.0036, 0.0101, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3906, 0.0548, 0.0092, 0.0068, 0.0112, 0.0300, 0.0043, 0.0127, 0.0907,
        0.0075, 0.0016, 0.0149, 0.0343, 0.0049, 0.0018, 0.0045, 0.0882, 0.0058,
        0.0572, 0.0048, 0.0174, 0.0552, 0.0673, 0.0113, 0.0038, 0.0093, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4076, 0.0708, 0.0111, 0.0072, 0.0127, 0.0318, 0.0059, 0.0114, 0.0988,
        0.0056, 0.0052, 0.0102, 0.0332, 0.0046, 0.0012, 0.0071, 0.0579, 0.0152,
        0.0623, 0.0089, 0.0298, 0.0108, 0.0655, 0.0067, 0.0076, 0.0108, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2701, 0.0864, 0.0073, 0.0100, 0.0084, 0.0260, 0.0046, 0.0143, 0.0758,
        0.0023, 0.0044, 0.0145, 0.0276, 0.0012, 0.0011, 0.0067, 0.2575, 0.0144,
        0.0708, 0.0174, 0.0520, 0.0128, 0.0052, 0.0089, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3448, 0.0341, 0.0066, 0.0048, 0.0473, 0.0021, 0.0065, 0.0036, 0.0038,
        0.0065, 0.0240, 0.0043, 0.0071, 0.0352, 0.0030, 0.0084, 0.0409, 0.0350,
        0.0058, 0.0074, 0.0009, 0.0040, 0.1921, 0.0063, 0.0158, 0.0078, 0.0117,
        0.1134, 0.0074, 0.0035, 0.0058, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([3.2377e-01, 3.0831e-02, 5.2891e-03, 5.3084e-03, 5.9495e-02, 1.3003e-03,
        7.1759e-03, 4.4837e-03, 3.7801e-03, 8.5880e-03, 2.2305e-02, 5.1089e-03,
        6.2988e-03, 3.7728e-02, 3.4230e-03, 1.0893e-02, 3.4997e-02, 6.4630e-02,
        4.1593e-03, 7.2374e-03, 2.2835e-04, 5.5024e-03, 1.6000e-01, 9.8623e-03,
        6.8869e-03, 6.2932e-02, 6.8055e-03, 6.8060e-03, 1.0609e-02, 6.6311e-02,
        6.3098e-03, 3.1645e-03, 7.7821e-03, 0.0000e+00, 0.0000e+00, 0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2849, 0.0511, 0.0066, 0.0099, 0.0574, 0.0039, 0.0075, 0.0053, 0.0041,
        0.0126, 0.0256, 0.0060, 0.0080, 0.0573, 0.0041, 0.0094, 0.0421, 0.0546,
        0.0053, 0.0100, 0.0015, 0.0054, 0.1758, 0.0134, 0.0103, 0.1048, 0.0088,
        0.0058, 0.0085, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4615, 0.0648, 0.0161, 0.0030, 0.0048, 0.0030, 0.0065, 0.0050, 0.0124,
        0.0029, 0.0329, 0.0131, 0.0065, 0.0399, 0.0076, 0.0183, 0.0147, 0.0061,
        0.0088, 0.0072, 0.0025, 0.0051, 0.0565, 0.0144, 0.0065, 0.0091, 0.1266,
        0.0127, 0.0168, 0.0045, 0.0102, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3639, 0.0494, 0.0107, 0.0020, 0.0065, 0.0024, 0.0040, 0.0047, 0.0107,
        0.0016, 0.0204, 0.0103, 0.0049, 0.0324, 0.0056, 0.0140, 0.0136, 0.0052,
        0.0075, 0.0076, 0.0033, 0.0044, 0.1131, 0.0114, 0.0177, 0.1064, 0.0114,
        0.0127, 0.0132, 0.0038, 0.1071, 0.0101, 0.0082, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3222, 0.0784, 0.0165, 0.0022, 0.0088, 0.0039, 0.0049, 0.0053, 0.0122,
        0.0026, 0.0332, 0.0116, 0.0104, 0.0372, 0.0091, 0.0189, 0.0150, 0.0066,
        0.0114, 0.0095, 0.0040, 0.0056, 0.0576, 0.0184, 0.0034, 0.0152, 0.1000,
        0.0105, 0.0057, 0.0067, 0.0845, 0.0105, 0.0236, 0.0093, 0.0089, 0.0162],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3036, 0.0407, 0.0132, 0.0019, 0.0047, 0.0026, 0.0044, 0.0054, 0.0103,
        0.0044, 0.0242, 0.0123, 0.0047, 0.0380, 0.0051, 0.0116, 0.0171, 0.0046,
        0.0091, 0.0062, 0.0005, 0.0053, 0.1160, 0.0074, 0.0314, 0.1693, 0.0140,
        0.0197, 0.0128, 0.0837, 0.0080, 0.0078, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3882, 0.0560, 0.0165, 0.0026, 0.0067, 0.0016, 0.0043, 0.0063, 0.0118,
        0.0027, 0.0283, 0.0151, 0.0075, 0.0305, 0.0057, 0.0176, 0.0137, 0.0078,
        0.0114, 0.0094, 0.0008, 0.0065, 0.0596, 0.0153, 0.0043, 0.0108, 0.0996,
        0.0066, 0.1306, 0.0083, 0.0042, 0.0099, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1100: [tensor([0.3677, 0.0634, 0.0099, 0.0119, 0.0095, 0.0039, 0.0160, 0.0239, 0.0085,
        0.0091, 0.0076, 0.0023, 0.0054, 0.1272, 0.0140, 0.0125, 0.1768, 0.0169,
        0.0159, 0.0503, 0.0048, 0.0111, 0.0121, 0.0051, 0.0141, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4420, 0.0191, 0.0294, 0.0078, 0.1137, 0.0167, 0.0627, 0.0140, 0.0273,
        0.1304, 0.0133, 0.0034, 0.0128, 0.0088, 0.0354, 0.0413, 0.0220, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3931, 0.0126, 0.0372, 0.0057, 0.0920, 0.0145, 0.0497, 0.0147, 0.0330,
        0.1790, 0.0251, 0.0039, 0.0138, 0.0129, 0.0432, 0.0357, 0.0187, 0.0151,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4722, 0.0140, 0.0251, 0.0018, 0.1007, 0.0090, 0.0426, 0.0134, 0.0231,
        0.0922, 0.0120, 0.0027, 0.0101, 0.0236, 0.1083, 0.0246, 0.0083, 0.0162,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3943, 0.0179, 0.0259, 0.0098, 0.1260, 0.0134, 0.0233, 0.0136, 0.0715,
        0.0237, 0.0011, 0.0157, 0.0296, 0.1916, 0.0186, 0.0240, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4496, 0.0226, 0.0451, 0.0130, 0.1696, 0.0154, 0.0261, 0.0223, 0.0707,
        0.0368, 0.0015, 0.0198, 0.0547, 0.0224, 0.0303, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3678, 0.0262, 0.0398, 0.0177, 0.1913, 0.0201, 0.0293, 0.0187, 0.1082,
        0.0352, 0.0094, 0.0193, 0.0151, 0.0648, 0.0161, 0.0209, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3518, 0.0102, 0.0067, 0.0065, 0.0039, 0.0405, 0.0118, 0.0503, 0.0058,
        0.0067, 0.0087, 0.0613, 0.0191, 0.0141, 0.0072, 0.0109, 0.0072, 0.0045,
        0.0057, 0.1956, 0.0142, 0.0102, 0.1133, 0.0180, 0.0061, 0.0100, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4270, 0.0115, 0.0074, 0.0143, 0.0064, 0.0309, 0.0153, 0.0726, 0.0009,
        0.0064, 0.0130, 0.0708, 0.0215, 0.0212, 0.0027, 0.0168, 0.0052, 0.0071,
        0.0077, 0.0641, 0.0093, 0.1236, 0.0195, 0.0108, 0.0141, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4875, 0.0101, 0.0043, 0.0087, 0.0073, 0.0365, 0.0116, 0.0553, 0.0027,
        0.0086, 0.0127, 0.0532, 0.0180, 0.0191, 0.0041, 0.0153, 0.0059, 0.0054,
        0.0098, 0.0677, 0.0116, 0.1036, 0.0145, 0.0109, 0.0155, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3043, 0.0093, 0.0109, 0.0251, 0.0052, 0.0081, 0.0175, 0.0059, 0.0281,
        0.0222, 0.0079, 0.0128, 0.0412, 0.0079, 0.0092, 0.0006, 0.0081, 0.0065,
        0.0115, 0.0682, 0.0065, 0.0091, 0.0411, 0.0109, 0.0411, 0.0451, 0.0126,
        0.0162, 0.1662, 0.0134, 0.0141, 0.0042, 0.0090, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4032, 0.0062, 0.0053, 0.0246, 0.0070, 0.0053, 0.0126, 0.0080, 0.0176,
        0.0208, 0.0077, 0.0117, 0.0379, 0.0052, 0.0057, 0.0013, 0.0063, 0.0070,
        0.0069, 0.0421, 0.0074, 0.0075, 0.0316, 0.0104, 0.0061, 0.0062, 0.0124,
        0.0149, 0.0080, 0.0328, 0.0342, 0.0119, 0.0149, 0.1227, 0.0124, 0.0125,
        0.0036, 0.0078], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1150: [tensor([ 3.6442e-01,  6.4084e-02,  1.1246e-02,  4.5297e-02,  6.1163e-02,
         5.3166e-03,  7.9601e-03,  7.0849e-03,  3.7031e-02,  4.6396e-03,
         2.6216e-02,  6.4267e-03,  2.5608e-03,  1.6344e-02,  5.8761e-02,
         1.0523e-02,  7.2539e-02,  9.5322e-02,  4.9996e-03,  1.0909e-02,
        -5.6092e-05,  4.7773e-03,  8.8825e-03,  1.5003e-02,  3.1156e-02,
         1.0900e-02,  8.6113e-03,  7.7687e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4501, 0.0634, 0.0091, 0.0084, 0.0928, 0.0070, 0.0131, 0.0053, 0.0882,
        0.0112, 0.0054, 0.0054, 0.0180, 0.0121, 0.0221, 0.0095, 0.0135, 0.0041,
        0.0097, 0.0121, 0.0181, 0.0842, 0.0077, 0.0137, 0.0159, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4437, 0.0923, 0.0133, 0.0097, 0.0814, 0.0092, 0.0143, 0.0074, 0.0977,
        0.0088, 0.0062, 0.0097, 0.0226, 0.0119, 0.0244, 0.0119, 0.0188, 0.0037,
        0.0087, 0.0100, 0.0159, 0.0203, 0.0164, 0.0248, 0.0169, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4478, 0.0993, 0.0139, 0.0116, 0.0752, 0.0079, 0.0149, 0.0084, 0.0741,
        0.0147, 0.0078, 0.0111, 0.0200, 0.0099, 0.0180, 0.0115, 0.0155, 0.0047,
        0.0100, 0.0145, 0.0140, 0.0398, 0.0195, 0.0155, 0.0068, 0.0134, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4669, 0.0075, 0.0293, 0.0056, 0.0036, 0.0070, 0.0088, 0.0066, 0.0151,
        0.0985, 0.0085, 0.0040, 0.0058, 0.0080, 0.0549, 0.0093, 0.0142, 0.0371,
        0.0052, 0.0015, 0.0068, 0.0689, 0.0049, 0.0229, 0.0098, 0.0510, 0.0216,
        0.0068, 0.0099, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4022, 0.0101, 0.0294, 0.0049, 0.0040, 0.0070, 0.0095, 0.0080, 0.0130,
        0.0998, 0.0081, 0.0028, 0.0065, 0.0085, 0.0770, 0.0129, 0.0147, 0.0492,
        0.0085, 0.0018, 0.0056, 0.0623, 0.0177, 0.0664, 0.0185, 0.0389, 0.0041,
        0.0083, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3854, 0.0092, 0.0334, 0.0040, 0.0032, 0.0073, 0.0086, 0.0096, 0.0136,
        0.0937, 0.0074, 0.0041, 0.0067, 0.0078, 0.0517, 0.0096, 0.0187, 0.0351,
        0.0044, 0.0023, 0.0034, 0.0253, 0.0561, 0.0124, 0.0052, 0.1519, 0.0102,
        0.0068, 0.0055, 0.0076, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4212, 0.0099, 0.0157, 0.0047, 0.0024, 0.0049, 0.0065, 0.0230, 0.0061,
        0.0058, 0.0039, 0.0055, 0.0235, 0.0195, 0.0093, 0.0052, 0.0075, 0.0204,
        0.0184, 0.0077, 0.0033, 0.0019, 0.0007, 0.0033, 0.0311, 0.0092, 0.0259,
        0.0073, 0.0920, 0.0047, 0.0051, 0.0225, 0.0291, 0.0107, 0.0031, 0.0039,
        0.0314, 0.0102, 0.0089, 0.0061, 0.0090, 0.0031, 0.0101, 0.0261, 0.0102,
        0.0037, 0.0061], device='cuda:0', grad_fn=<DivBackward0>), tensor([4.0420e-01, 1.1971e-02, 3.2898e-02, 6.6548e-03, 3.4406e-03, 5.3095e-03,
        7.8383e-03, 3.5463e-02, 5.7376e-03, 7.5497e-03, 4.1971e-03, 5.7571e-03,
        2.6692e-02, 3.0578e-02, 9.5320e-03, 6.3479e-03, 1.0509e-02, 3.1713e-02,
        2.2641e-02, 8.5006e-03, 3.9280e-03, 2.6613e-03, 3.5603e-04, 4.1820e-03,
        4.1120e-02, 1.6992e-02, 2.9341e-02, 7.5160e-03, 6.9684e-03, 3.6147e-03,
        8.7689e-02, 8.9216e-03, 6.4149e-03, 1.1742e-02, 8.5099e-03, 5.5775e-03,
        6.7485e-03, 9.1007e-03, 4.2658e-02, 1.0149e-02, 2.2058e-03, 6.0761e-03,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4306, 0.0121, 0.0334, 0.0063, 0.0039, 0.0059, 0.0112, 0.0380, 0.0075,
        0.0079, 0.0048, 0.0080, 0.0261, 0.0321, 0.0121, 0.0057, 0.0098, 0.0440,
        0.0223, 0.0124, 0.0037, 0.0023, 0.0024, 0.0038, 0.0195, 0.0231, 0.0042,
        0.0076, 0.0102, 0.0112, 0.0893, 0.0083, 0.0084, 0.0054, 0.0078, 0.0048,
        0.0270, 0.0076, 0.0081, 0.0035, 0.0078, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3809, 0.0067, 0.0095, 0.0253, 0.0061, 0.0179, 0.0058, 0.0042, 0.0103,
        0.1102, 0.0064, 0.0102, 0.0021, 0.0068, 0.0058, 0.0181, 0.0783, 0.0490,
        0.1756, 0.0160, 0.0213, 0.0222, 0.0016, 0.0097, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4108, 0.0079, 0.0194, 0.0313, 0.0083, 0.0291, 0.0120, 0.0043, 0.0149,
        0.0926, 0.0093, 0.0134, 0.0050, 0.0088, 0.0269, 0.0568, 0.0104, 0.0753,
        0.1308, 0.0124, 0.0069, 0.0133, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1200: [tensor([0.3641, 0.0132, 0.0992, 0.0157, 0.0083, 0.0146, 0.0053, 0.0072, 0.0029,
        0.0076, 0.0875, 0.0120, 0.0853, 0.1354, 0.0215, 0.0172, 0.0246, 0.0149,
        0.0109, 0.0104, 0.0158, 0.0033, 0.0072, 0.0157, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4563, 0.0131, 0.0107, 0.0109, 0.0223, 0.0150, 0.0648, 0.0121, 0.0180,
        0.0814, 0.0159, 0.0086, 0.0133, 0.0163, 0.0072, 0.0330, 0.0128, 0.0140,
        0.0088, 0.0020, 0.0071, 0.0123, 0.0197, 0.0459, 0.0358, 0.0271, 0.0157,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4084, 0.0079, 0.0147, 0.0100, 0.0195, 0.0083, 0.0580, 0.0073, 0.0139,
        0.1195, 0.0113, 0.0077, 0.0115, 0.0097, 0.0053, 0.0161, 0.0158, 0.0086,
        0.0064, 0.0010, 0.0076, 0.0116, 0.0491, 0.0074, 0.0109, 0.1263, 0.0125,
        0.0141], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3988, 0.0109, 0.0093, 0.0099, 0.0245, 0.0112, 0.1072, 0.0090, 0.0153,
        0.0938, 0.0138, 0.0087, 0.0177, 0.0134, 0.0100, 0.0181, 0.0132, 0.0124,
        0.0083, 0.0028, 0.0049, 0.0264, 0.0683, 0.0199, 0.0248, 0.0245, 0.0112,
        0.0117], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3529, 0.0133, 0.0121, 0.0171, 0.0084, 0.0105, 0.0590, 0.0066, 0.0225,
        0.1234, 0.0094, 0.0134, 0.0043, 0.0109, 0.1176, 0.0182, 0.1669, 0.0133,
        0.0070, 0.0131, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4753, 0.0098, 0.0036, 0.0118, 0.0064, 0.0084, 0.0537, 0.0058, 0.0091,
        0.0889, 0.0039, 0.0125, 0.0027, 0.0068, 0.0138, 0.0091, 0.0203, 0.1015,
        0.0193, 0.0156, 0.0145, 0.0072, 0.0147, 0.0539, 0.0169, 0.0052, 0.0092,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3272, 0.0095, 0.0030, 0.0130, 0.0061, 0.0088, 0.0759, 0.0049, 0.0136,
        0.0542, 0.0074, 0.0104, 0.0010, 0.0074, 0.1501, 0.0091, 0.1826, 0.0118,
        0.0830, 0.0067, 0.0048, 0.0095, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4827, 0.0790, 0.0132, 0.0188, 0.0117, 0.0827, 0.0066, 0.0064, 0.0031,
        0.0087, 0.1599, 0.0164, 0.0148, 0.0204, 0.0113, 0.0206, 0.0210, 0.0082,
        0.0146, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5432, 0.1050, 0.0237, 0.0189, 0.0075, 0.0824, 0.0060, 0.0069, 0.0067,
        0.0108, 0.0151, 0.0259, 0.0147, 0.0137, 0.0726, 0.0232, 0.0089, 0.0146,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3909, 0.1411, 0.0272, 0.0189, 0.0139, 0.1164, 0.0028, 0.0076, 0.0067,
        0.0151, 0.0188, 0.0336, 0.1093, 0.0371, 0.0208, 0.0108, 0.0290, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4338, 0.0773, 0.0088, 0.0115, 0.0522, 0.0068, 0.0054, 0.0055, 0.0088,
        0.1986, 0.0100, 0.0617, 0.0123, 0.0134, 0.0192, 0.0087, 0.0319, 0.0099,
        0.0115, 0.0130, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3497, 0.0604, 0.0038, 0.0079, 0.0354, 0.0049, 0.0056, 0.0028, 0.0092,
        0.1944, 0.0073, 0.0859, 0.0207, 0.1458, 0.0100, 0.0165, 0.0189, 0.0084,
        0.0123, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1250: [tensor([0.3429, 0.0841, 0.0108, 0.0179, 0.0093, 0.0248, 0.0042, 0.0102, 0.0375,
        0.0105, 0.0092, 0.0058, 0.0498, 0.0077, 0.0245, 0.1078, 0.0109, 0.0107,
        0.0022, 0.0057, 0.0421, 0.0104, 0.0829, 0.0550, 0.0106, 0.0043, 0.0082,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4456, 0.0230, 0.0073, 0.0067, 0.0210, 0.0392, 0.0140, 0.0091, 0.0637,
        0.0142, 0.0104, 0.0060, 0.0039, 0.0169, 0.1268, 0.0275, 0.0144, 0.1139,
        0.0151, 0.0075, 0.0138, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4824, 0.0243, 0.0190, 0.0075, 0.0206, 0.0313, 0.0213, 0.0157, 0.0674,
        0.0127, 0.0111, 0.0022, 0.0042, 0.0115, 0.0336, 0.0462, 0.0302, 0.1133,
        0.0228, 0.0062, 0.0163, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4790, 0.0276, 0.0113, 0.0097, 0.0343, 0.0422, 0.0268, 0.0180, 0.0881,
        0.0209, 0.0139, 0.0071, 0.0045, 0.0139, 0.0399, 0.0514, 0.0366, 0.0396,
        0.0120, 0.0232, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3741, 0.0095, 0.0141, 0.0334, 0.0092, 0.0242, 0.0042, 0.0128, 0.0089,
        0.0107, 0.0045, 0.0300, 0.0791, 0.0108, 0.0105, 0.0074, 0.0133, 0.0149,
        0.0058, 0.0127, 0.0645, 0.0066, 0.0040, 0.0077, 0.0164, 0.0135, 0.0088,
        0.0240, 0.1406, 0.0078, 0.0046, 0.0115], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4222, 0.0118, 0.0189, 0.0254, 0.0117, 0.0313, 0.0045, 0.0133, 0.0078,
        0.0086, 0.0046, 0.0363, 0.0947, 0.0159, 0.0119, 0.0091, 0.0137, 0.0220,
        0.0042, 0.0151, 0.0839, 0.0058, 0.0040, 0.0072, 0.0118, 0.0190, 0.0508,
        0.0120, 0.0084, 0.0047, 0.0094, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4528, 0.0079, 0.0129, 0.0267, 0.0115, 0.0226, 0.0049, 0.0129, 0.0096,
        0.0109, 0.0075, 0.0364, 0.0966, 0.0112, 0.0074, 0.0104, 0.0129, 0.0206,
        0.0079, 0.0092, 0.0657, 0.0070, 0.0040, 0.0100, 0.0165, 0.0150, 0.0586,
        0.0138, 0.0054, 0.0111, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3404, 0.1292, 0.0098, 0.0318, 0.0178, 0.0201, 0.0587, 0.0018, 0.0152,
        0.0052, 0.0115, 0.0132, 0.0169, 0.0087, 0.0014, 0.0121, 0.1244, 0.0164,
        0.1190, 0.0191, 0.0083, 0.0189, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4836, 0.1140, 0.0163, 0.0284, 0.0181, 0.0102, 0.0891, 0.0033, 0.0144,
        0.0031, 0.0123, 0.0097, 0.0237, 0.0082, 0.0029, 0.0100, 0.0887, 0.0151,
        0.0110, 0.0233, 0.0054, 0.0092, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3731, 0.0778, 0.0103, 0.0167, 0.0097, 0.0071, 0.0633, 0.0025, 0.0133,
        0.0039, 0.0112, 0.0102, 0.0162, 0.0119, 0.0016, 0.0085, 0.0740, 0.0145,
        0.0666, 0.0155, 0.1087, 0.0084, 0.0101, 0.0176, 0.0274, 0.0061, 0.0138,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4845, 0.0150, 0.0038, 0.0180, 0.0674, 0.0056, 0.0396, 0.0102, 0.0089,
        0.0021, 0.0065, 0.0166, 0.0109, 0.0039, 0.0125, 0.1427, 0.0551, 0.0279,
        0.0119, 0.0176, 0.0082, 0.0123, 0.0034, 0.0152, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4954, 0.0132, 0.0040, 0.0148, 0.0620, 0.0073, 0.0441, 0.0100, 0.0100,
        0.0040, 0.0077, 0.0193, 0.0066, 0.0189, 0.0178, 0.0188, 0.0219, 0.0154,
        0.0144, 0.0871, 0.0573, 0.0209, 0.0094, 0.0198, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #1300: [tensor([0.4760, 0.0959, 0.0056, 0.0134, 0.0045, 0.0142, 0.0116, 0.0134, 0.0180,
        0.0028, 0.0078, 0.1698, 0.0124, 0.0222, 0.0528, 0.0240, 0.0264, 0.0127,
        0.0164, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4389, 0.1244, 0.0051, 0.0190, 0.0043, 0.0184, 0.0176, 0.0119, 0.0181,
        0.0051, 0.0096, 0.1093, 0.0227, 0.0271, 0.0112, 0.0252, 0.0239, 0.0231,
        0.0202, 0.0443, 0.0103, 0.0103, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3567, 0.2115, 0.0090, 0.0152, 0.0084, 0.0110, 0.0174, 0.0134, 0.0177,
        0.0074, 0.0085, 0.0881, 0.0319, 0.1018, 0.0294, 0.0393, 0.0133, 0.0200,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5060, 0.1463, 0.0121, 0.0159, 0.0159, 0.0149, 0.0223, 0.0246, 0.0184,
        0.0081, 0.0110, 0.0337, 0.1218, 0.0203, 0.0286, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4683, 0.1669, 0.0131, 0.0175, 0.0103, 0.0181, 0.0223, 0.0172, 0.0293,
        0.0111, 0.0154, 0.0994, 0.0258, 0.0236, 0.0277, 0.0340, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4728, 0.1557, 0.0103, 0.0111, 0.0080, 0.0125, 0.0122, 0.0119, 0.0125,
        0.0027, 0.0100, 0.1417, 0.0112, 0.0160, 0.0106, 0.0233, 0.0187, 0.0129,
        0.0242, 0.0066, 0.0151, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4631, 0.0882, 0.0096, 0.0116, 0.0068, 0.0158, 0.0138, 0.0126, 0.0172,
        0.0024, 0.0103, 0.1442, 0.0120, 0.0164, 0.0132, 0.0797, 0.0270, 0.0247,
        0.0141, 0.0172, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4598, 0.1300, 0.0130, 0.0191, 0.0083, 0.0153, 0.0181, 0.0141, 0.0152,
        0.0054, 0.0070, 0.0786, 0.0192, 0.1572, 0.0104, 0.0089, 0.0205, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4879, 0.0976, 0.0065, 0.0118, 0.0058, 0.0174, 0.0146, 0.0144, 0.0154,
        0.0033, 0.0104, 0.1462, 0.0132, 0.0166, 0.0112, 0.0317, 0.0281, 0.0178,
        0.0264, 0.0076, 0.0162, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3664, 0.0036, 0.0024, 0.0046, 0.0032, 0.0043, 0.0030, 0.0045, 0.0075,
        0.0167, 0.0039, 0.0013, 0.0041, 0.0018, 0.0060, 0.0415, 0.0045, 0.0036,
        0.0010, 0.0015, 0.0009, 0.0027, 0.0017, 0.0043, 0.0433, 0.0037, 0.0043,
        0.0037, 0.0209, 0.0004, 0.0022, 0.0077, 0.0054, 0.0007, 0.0030, 0.1552,
        0.0064, 0.0064, 0.0049, 0.0051, 0.0931, 0.0083, 0.0084, 0.0041, 0.0075,
        0.0060, 0.0042, 0.0093, 0.0269, 0.0077, 0.0030, 0.0109, 0.0262, 0.0093,
        0.0022, 0.0044], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3483, 0.0063, 0.0060, 0.0071, 0.0061, 0.0064, 0.0050, 0.0050, 0.0069,
        0.0186, 0.0046, 0.0025, 0.0058, 0.0040, 0.0089, 0.0532, 0.0066, 0.0051,
        0.0015, 0.0015, 0.0007, 0.0050, 0.0035, 0.0062, 0.0832, 0.0043, 0.0079,
        0.0054, 0.0231, 0.0031, 0.0025, 0.0086, 0.0072, 0.0007, 0.0039, 0.0687,
        0.0066, 0.0158, 0.0354, 0.0076, 0.0238, 0.0159, 0.0145, 0.0062, 0.1013,
        0.0025, 0.0168, 0.0033, 0.0070, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([3.7701e-01, 4.3887e-03, 9.4980e-03, 7.3199e-03, 6.0131e-03, 5.5377e-03,
        4.1628e-03, 5.7547e-03, 9.5795e-03, 2.2979e-02, 5.9248e-03, 4.1669e-03,
        6.0365e-03, 7.1608e-03, 9.4689e-03, 9.8607e-02, 9.8425e-03, 4.9334e-03,
        3.7098e-03, 3.1204e-03, 2.0031e-03, 5.6997e-03, 2.9614e-03, 6.1023e-03,
        1.1922e-01, 1.0264e-02, 5.5883e-03, 6.1955e-03, 3.1659e-02, 1.7880e-03,
        3.3070e-03, 9.9092e-03, 7.6056e-03, 3.3492e-04, 4.2161e-03, 2.0938e-03,
        7.7907e-02, 1.2107e-02, 1.4427e-02, 3.5746e-02, 4.8658e-03, 8.9579e-03,
        6.5814e-03, 7.3487e-03, 1.9062e-03, 5.9902e-03, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1350: [tensor([0.2921, 0.0220, 0.0113, 0.0111, 0.0087, 0.0064, 0.0104, 0.0077, 0.0095,
        0.0092, 0.0032, 0.0081, 0.0299, 0.0172, 0.0318, 0.0121, 0.3513, 0.0277,
        0.0311, 0.0666, 0.0106, 0.0063, 0.0159, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5140, 0.0467, 0.0222, 0.0168, 0.0183, 0.0121, 0.0145, 0.0143, 0.0143,
        0.0140, 0.0042, 0.0118, 0.0665, 0.0289, 0.0593, 0.0333, 0.0406, 0.0260,
        0.0160, 0.0263, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2507, 0.0234, 0.0164, 0.0111, 0.0093, 0.0089, 0.0122, 0.0111, 0.0095,
        0.0072, 0.0012, 0.0097, 0.0531, 0.0183, 0.0362, 0.0143, 0.4722, 0.0138,
        0.0095, 0.0118, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5741, 0.0500, 0.0316, 0.0171, 0.0191, 0.0127, 0.0192, 0.0153, 0.0203,
        0.0080, 0.0052, 0.0141, 0.0934, 0.0283, 0.0452, 0.0139, 0.0097, 0.0228,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3148, 0.0192, 0.0149, 0.0101, 0.0099, 0.0068, 0.0124, 0.0081, 0.0120,
        0.0054, 0.0023, 0.0076, 0.0630, 0.0122, 0.0420, 0.0158, 0.0129, 0.4018,
        0.0101, 0.0070, 0.0118, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5457, 0.0466, 0.0216, 0.0246, 0.0185, 0.0159, 0.0163, 0.0156, 0.0217,
        0.0094, 0.0040, 0.0129, 0.0562, 0.0218, 0.0518, 0.0550, 0.0310, 0.0141,
        0.0170, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5832, 0.0457, 0.0321, 0.0143, 0.0178, 0.0177, 0.0145, 0.0225, 0.0204,
        0.0082, 0.0019, 0.0151, 0.0479, 0.0360, 0.0463, 0.0314, 0.0156, 0.0094,
        0.0201, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4222, 0.0816, 0.0147, 0.0540, 0.0195, 0.0168, 0.0129, 0.0102, 0.0073,
        0.0121, 0.0166, 0.0289, 0.0133, 0.0029, 0.0019, 0.0080, 0.1142, 0.0217,
        0.0872, 0.0320, 0.0082, 0.0034, 0.0104, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3662, 0.0559, 0.0083, 0.0537, 0.0153, 0.0099, 0.0078, 0.0053, 0.0032,
        0.0078, 0.0075, 0.0234, 0.0094, 0.0023, 0.0010, 0.0071, 0.1672, 0.0145,
        0.0467, 0.0186, 0.0158, 0.0210, 0.0087, 0.0135, 0.0206, 0.0585, 0.0146,
        0.0043, 0.0120], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3916, 0.0806, 0.0113, 0.0694, 0.0174, 0.0112, 0.0119, 0.0065, 0.0038,
        0.0101, 0.0141, 0.0374, 0.0139, 0.0042, 0.0013, 0.0098, 0.0694, 0.0193,
        0.0610, 0.0150, 0.0125, 0.0886, 0.0216, 0.0054, 0.0125, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3921, 0.0727, 0.0108, 0.0095, 0.0272, 0.0792, 0.0087, 0.0101, 0.0100,
        0.0046, 0.0068, 0.0132, 0.0024, 0.0078, 0.0524, 0.0150, 0.1652, 0.0242,
        0.0607, 0.0114, 0.0063, 0.0098, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3340, 0.0879, 0.0134, 0.0069, 0.0226, 0.0463, 0.0088, 0.0063, 0.0094,
        0.0045, 0.0036, 0.0091, 0.0040, 0.0083, 0.1111, 0.0226, 0.0137, 0.0890,
        0.0265, 0.0892, 0.0396, 0.0227, 0.0088, 0.0116, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1400: [tensor([3.7315e-01, 7.1247e-02, 1.2516e-02, 1.5412e-02, 8.0186e-03, 4.9812e-03,
        2.0182e-02, 6.4169e-03, 1.0115e-02, 5.9196e-03, 3.6133e-04, 6.9992e-03,
        1.2056e-02, 5.8591e-02, 2.0706e-02, 8.8624e-02, 1.0886e-02, 1.9844e-02,
        2.5520e-02, 1.9954e-01, 1.2969e-02, 4.6428e-03, 1.1297e-02, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.4680,  0.1137,  0.0151,  0.0173,  0.0094,  0.0068,  0.0251,  0.0116,
         0.0112,  0.0062, -0.0005,  0.0072,  0.1940,  0.0298,  0.0292,  0.0183,
         0.0185,  0.0180,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3009, 0.0553, 0.0132, 0.0091, 0.0038, 0.0084, 0.0237, 0.0461, 0.0039,
        0.0040, 0.0030, 0.0057, 0.0065, 0.0062, 0.0016, 0.0057, 0.3155, 0.0102,
        0.0103, 0.0046, 0.0072, 0.0131, 0.0077, 0.0089, 0.0058, 0.0494, 0.0193,
        0.0149, 0.0103, 0.0148, 0.0039, 0.0069], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3441, 0.0517, 0.0104, 0.0128, 0.0061, 0.0104, 0.0264, 0.0287, 0.0050,
        0.0035, 0.0013, 0.0052, 0.0072, 0.0055, 0.0007, 0.0057, 0.3376, 0.0133,
        0.0597, 0.0085, 0.0116, 0.0065, 0.0240, 0.0054, 0.0085, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2757, 0.0689, 0.0112, 0.0117, 0.0078, 0.0115, 0.0328, 0.0392, 0.0077,
        0.0068, 0.0039, 0.0082, 0.0121, 0.0070, 0.0023, 0.0097, 0.3141, 0.0166,
        0.0984, 0.0187, 0.0078, 0.0076, 0.0061, 0.0143, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3903, 0.1070, 0.0138, 0.0673, 0.0037, 0.0053, 0.0145, 0.0110, 0.0155,
        0.0064, 0.0088, 0.0640, 0.0170, 0.0149, 0.2220, 0.0091, 0.0119, 0.0174,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.5124, 0.1359, 0.0148, 0.0730, 0.0099, 0.0037, 0.0177, 0.0117, 0.0176,
        0.0058, 0.0107, 0.0888, 0.0210, 0.0196, 0.0232, 0.0108, 0.0234, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.5249, 0.0670, 0.0122, 0.0495, 0.0062, 0.0025, 0.0149, 0.0115, 0.0142,
        0.0045, 0.0070, 0.0560, 0.0157, 0.0113, 0.0203, 0.0263, 0.1046, 0.0159,
        0.0179, 0.0069, 0.0105, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4511, 0.0074, 0.0153, 0.0012, 0.0140, 0.0062, 0.0367, 0.0114, 0.0040,
        0.0074, 0.1144, 0.0067, 0.0703, 0.0267, 0.0179, 0.0722, 0.0297, 0.0688,
        0.0238, 0.0046, 0.0102, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.5902, 0.0116, 0.0231, 0.0076, 0.0287, 0.0119, 0.0702, 0.0209, 0.0061,
        0.0135, 0.0262, 0.0193, 0.0335, 0.0107, 0.0396, 0.0344, 0.0224, 0.0143,
        0.0160, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4402, 0.0054, 0.0246, 0.0026, 0.0207, 0.0087, 0.0738, 0.0137, 0.0055,
        0.0127, 0.1623, 0.0139, 0.0155, 0.1038, 0.0167, 0.0196, 0.0369, 0.0065,
        0.0171, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.5295, 0.0081, 0.0230, 0.0066, 0.0197, 0.0093, 0.0500, 0.0203, 0.0073,
        0.0182, 0.0259, 0.0126, 0.0243, 0.1616, 0.0491, 0.0129, 0.0216, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #1450: [tensor([0.3459, 0.0047, 0.0034, 0.0039, 0.0087, 0.0083, 0.0425, 0.0026, 0.0074,
        0.0088, 0.0079, 0.0091, 0.0076, 0.0089, 0.0077, 0.0160, 0.1564, 0.0089,
        0.0270, 0.0088, 0.0092, 0.0050, 0.0088, 0.0062, 0.0153, 0.0095, 0.0087,
        0.0690, 0.1604, 0.0062, 0.0071, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 3.7531e-01,  1.1672e-02,  5.9731e-03,  5.9099e-03,  9.9326e-03,
         7.3950e-03,  4.3024e-02,  2.6334e-03,  8.6092e-03,  1.0223e-02,
         6.7558e-03,  6.6634e-03,  7.7385e-03,  7.8665e-03,  8.4045e-03,
         1.3063e-02,  1.0307e-01,  9.7421e-03,  4.2365e-02,  5.3431e-03,
         1.1634e-02,  5.5991e-03,  1.1664e-02,  5.5605e-03,  1.4159e-01,
         8.6837e-03,  6.4028e-02,  2.7640e-02,  1.1954e-02, -3.5170e-05,
         7.8594e-03,  4.0754e-03,  7.9799e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4058, 0.0073, 0.0071, 0.0060, 0.0119, 0.0113, 0.0470, 0.0020, 0.0127,
        0.0101, 0.0117, 0.0095, 0.0084, 0.0112, 0.0147, 0.0181, 0.2336, 0.0118,
        0.0401, 0.0082, 0.0135, 0.0089, 0.0134, 0.0067, 0.0048, 0.0377, 0.0123,
        0.0042, 0.0102, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3393, 0.0074, 0.0061, 0.0036, 0.0090, 0.0044, 0.0303, 0.0016, 0.0062,
        0.0101, 0.0085, 0.0068, 0.0049, 0.0065, 0.0090, 0.0142, 0.0966, 0.0052,
        0.0191, 0.0045, 0.0095, 0.0049, 0.0083, 0.0070, 0.1670, 0.0120, 0.0075,
        0.0523, 0.0068, 0.0424, 0.0736, 0.0061, 0.0033, 0.0063, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3298, 0.0084, 0.0044, 0.0059, 0.0132, 0.0068, 0.0349, 0.0034, 0.0101,
        0.0084, 0.0099, 0.0081, 0.0065, 0.0076, 0.0114, 0.0137, 0.1120, 0.0073,
        0.0339, 0.0068, 0.0125, 0.0061, 0.0118, 0.0055, 0.1904, 0.0211, 0.0087,
        0.0826, 0.0088, 0.0019, 0.0082, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2422, 0.0064, 0.0058, 0.0037, 0.0066, 0.0038, 0.0283, 0.0017, 0.0064,
        0.0048, 0.0092, 0.0044, 0.0034, 0.0053, 0.0070, 0.0082, 0.1684, 0.0056,
        0.0188, 0.0052, 0.0091, 0.0055, 0.0087, 0.0062, 0.2658, 0.0061, 0.0594,
        0.0067, 0.0737, 0.0065, 0.0031, 0.0041, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3650, 0.0072, 0.0038, 0.0048, 0.0142, 0.0093, 0.0344, 0.0031, 0.0118,
        0.0079, 0.0128, 0.0056, 0.0064, 0.0110, 0.0129, 0.0133, 0.1198, 0.0101,
        0.0218, 0.0075, 0.0118, 0.0075, 0.0100, 0.0050, 0.0449, 0.0119, 0.1058,
        0.0093, 0.0198, 0.0066, 0.0146, 0.0455, 0.0115, 0.0026, 0.0104, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3367, 0.0068, 0.0043, 0.0041, 0.0080, 0.0067, 0.0787, 0.0017, 0.0095,
        0.0071, 0.0085, 0.0054, 0.0051, 0.0100, 0.0091, 0.0135, 0.1206, 0.0079,
        0.0223, 0.0058, 0.0095, 0.0061, 0.0115, 0.0039, 0.1680, 0.0202, 0.0077,
        0.0845, 0.0047, 0.0042, 0.0081, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3791, 0.0063, 0.0042, 0.0036, 0.0079, 0.0038, 0.0427, 0.0022, 0.0076,
        0.0076, 0.0060, 0.0056, 0.0060, 0.0084, 0.0100, 0.0085, 0.1108, 0.0079,
        0.0191, 0.0028, 0.0102, 0.0074, 0.0086, 0.0051, 0.1671, 0.0082, 0.0055,
        0.0124, 0.0104, 0.0095, 0.0050, 0.0125, 0.0086, 0.0060, 0.0128, 0.0186,
        0.0117, 0.0103, 0.0065, 0.0055, 0.0021, 0.0057], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3881, 0.0089, 0.0050, 0.0045, 0.0109, 0.0110, 0.0622, 0.0032, 0.0106,
        0.0135, 0.0167, 0.0098, 0.0107, 0.0122, 0.0156, 0.0178, 0.1964, 0.0100,
        0.0499, 0.0069, 0.0120, 0.0092, 0.0176, 0.0080, 0.0163, 0.0131, 0.0179,
        0.0087, 0.0062, 0.0032, 0.0124, 0.0115, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3717, 0.0100, 0.0090, 0.0091, 0.0100, 0.0102, 0.0425, 0.0046, 0.0105,
        0.0117, 0.0150, 0.0078, 0.0060, 0.0089, 0.0174, 0.0204, 0.1763, 0.0094,
        0.0404, 0.0085, 0.0134, 0.0081, 0.0203, 0.0072, 0.0098, 0.0105, 0.0138,
        0.0607, 0.0155, 0.0166, 0.0149, 0.0100, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3180, 0.0064, 0.0035, 0.0029, 0.0074, 0.0053, 0.0274, 0.0007, 0.0054,
        0.0059, 0.0062, 0.0046, 0.0054, 0.0047, 0.0075, 0.0129, 0.0651, 0.0061,
        0.0174, 0.0048, 0.0079, 0.0072, 0.0068, 0.0037, 0.1026, 0.0101, 0.0063,
        0.0054, 0.0791, 0.0067, 0.0122, 0.0346, 0.0080, 0.0132, 0.1324, 0.0078,
        0.0147, 0.0124, 0.0043, 0.0066, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #1500: [tensor([0.4254, 0.0708, 0.0233, 0.0106, 0.0161, 0.0105, 0.0155, 0.0119, 0.0565,
        0.0172, 0.0036, 0.0116, 0.0576, 0.0096, 0.0309, 0.1399, 0.0531, 0.0160,
        0.0085, 0.0113, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4334, 0.0739, 0.0278, 0.0118, 0.0184, 0.0104, 0.0152, 0.0122, 0.0604,
        0.0309, 0.0015, 0.0115, 0.0756, 0.0216, 0.0261, 0.0655, 0.0271, 0.0307,
        0.0214, 0.0083, 0.0162, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3202, 0.1002, 0.0193, 0.0136, 0.0642, 0.0086, 0.0065, 0.0120, 0.0080,
        0.0051, 0.0091, 0.0310, 0.1521, 0.2013, 0.0302, 0.0077, 0.0108, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4410, 0.1392, 0.0210, 0.0130, 0.0565, 0.0161, 0.0026, 0.0127, 0.0119,
        0.0027, 0.0080, 0.0679, 0.0264, 0.0265, 0.0255, 0.0820, 0.0192, 0.0075,
        0.0204, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4504, 0.1303, 0.0246, 0.0138, 0.0797, 0.0124, 0.0031, 0.0134, 0.0150,
        0.0058, 0.0101, 0.0816, 0.0353, 0.0330, 0.0306, 0.0218, 0.0152, 0.0241,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2930, 0.0518, 0.0120, 0.0113, 0.0130, 0.0041, 0.0259, 0.0458, 0.0072,
        0.0104, 0.0008, 0.0047, 0.0126, 0.0219, 0.0081, 0.0137, 0.1577, 0.0073,
        0.0111, 0.0111, 0.0072, 0.0051, 0.2191, 0.0100, 0.0216, 0.0022, 0.0113],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3455, 0.0530, 0.0237, 0.0159, 0.0284, 0.0046, 0.0359, 0.0758, 0.0130,
        0.0193, 0.0037, 0.0097, 0.0283, 0.0416, 0.0307, 0.0257, 0.1123, 0.1050,
        0.0085, 0.0080, 0.0114, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 2.8973e-01,  8.8691e-02,  1.7261e-02,  1.5982e-02,  2.5101e-02,
         5.7391e-03,  3.6400e-02,  5.8979e-02,  8.5819e-03,  1.6691e-02,
        -5.7623e-05,  5.9085e-03,  1.6399e-02,  2.6425e-02,  1.1680e-02,
         2.9150e-02,  2.9797e-01,  1.2051e-02,  1.9383e-02,  6.8350e-03,
         1.0986e-02,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4359, 0.1240, 0.0239, 0.0155, 0.0517, 0.0903, 0.0139, 0.0119, 0.0220,
        0.0297, 0.0126, 0.0030, 0.0121, 0.0332, 0.0666, 0.0347, 0.0190, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4058, 0.1049, 0.0189, 0.0124, 0.0375, 0.0705, 0.0124, 0.0120, 0.0323,
        0.0269, 0.0172, 0.0022, 0.0132, 0.1746, 0.0152, 0.0247, 0.0194, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3250, 0.1396, 0.0248, 0.0164, 0.0445, 0.0788, 0.0100, 0.0124, 0.0190,
        0.0337, 0.0128, 0.0037, 0.0151, 0.1680, 0.0061, 0.0188, 0.0461, 0.0254,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4893, 0.0826, 0.0134, 0.0104, 0.0101, 0.0070, 0.0150, 0.0100, 0.0161,
        0.0058, 0.0071, 0.0056, 0.0087, 0.0132, 0.0018, 0.0079, 0.0199, 0.0231,
        0.0249, 0.0221, 0.0381, 0.0072, 0.0591, 0.0680, 0.0153, 0.0083, 0.0102],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1550: [tensor([0.2851, 0.0851, 0.0148, 0.0106, 0.0162, 0.0117, 0.0093, 0.0059, 0.0103,
        0.0222, 0.0004, 0.0073, 0.0163, 0.0773, 0.0144, 0.0120, 0.3707, 0.0200,
        0.0103, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5095, 0.0711, 0.0117, 0.0150, 0.0194, 0.0122, 0.0130, 0.0052, 0.0126,
        0.0217, 0.0019, 0.0069, 0.0590, 0.0312, 0.0855, 0.0425, 0.0110, 0.0266,
        0.0168, 0.0105, 0.0167, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3442, 0.0524, 0.0188, 0.0144, 0.0158, 0.0101, 0.0109, 0.0065, 0.0132,
        0.0192, 0.0013, 0.0096, 0.2523, 0.0099, 0.0846, 0.0260, 0.0085, 0.0221,
        0.0309, 0.0202, 0.0115, 0.0037, 0.0137, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3529, 0.1171, 0.0195, 0.0189, 0.0152, 0.0093, 0.0131, 0.0077, 0.0146,
        0.0187, 0.0013, 0.0112, 0.1548, 0.0131, 0.0861, 0.0228, 0.0188, 0.0317,
        0.0177, 0.0094, 0.0191, 0.0073, 0.0196, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.3342,  0.1347,  0.0188,  0.0175,  0.0235,  0.0138,  0.0164,  0.0066,
         0.0208,  0.0311, -0.0005,  0.0161,  0.2547,  0.0292,  0.0427,  0.0095,
         0.0300,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4661, 0.0915, 0.0176, 0.0188, 0.0202, 0.0132, 0.0157, 0.0074, 0.0152,
        0.0270, 0.0012, 0.0088, 0.0716, 0.0237, 0.1177, 0.0272, 0.0185, 0.0108,
        0.0086, 0.0191, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3066, 0.0416, 0.0043, 0.0045, 0.0095, 0.0032, 0.0049, 0.0036, 0.0659,
        0.0044, 0.0072, 0.0061, 0.0063, 0.0214, 0.0515, 0.0039, 0.0073, 0.0081,
        0.0008, 0.0048, 0.0413, 0.0063, 0.0571, 0.0036, 0.0627, 0.2407, 0.0077,
        0.0056, 0.0093, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4831, 0.0540, 0.0073, 0.0051, 0.0134, 0.0040, 0.0060, 0.0072, 0.0857,
        0.0088, 0.0094, 0.0065, 0.0093, 0.0242, 0.0801, 0.0031, 0.0149, 0.0062,
        0.0034, 0.0051, 0.0479, 0.0067, 0.0114, 0.0208, 0.0268, 0.0094, 0.0081,
        0.0190, 0.0045, 0.0087], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4045, 0.0422, 0.0037, 0.0011, 0.0180, 0.0051, 0.0071, 0.0065, 0.0808,
        0.0113, 0.0107, 0.0082, 0.0103, 0.0248, 0.0656, 0.0044, 0.0164, 0.0105,
        0.0021, 0.0058, 0.0514, 0.0119, 0.1128, 0.0643, 0.0059, 0.0047, 0.0100,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4116, 0.1020, 0.0069, 0.0190, 0.0091, 0.0114, 0.0102, 0.0090, 0.0232,
        0.0075, 0.0634, 0.0137, 0.0076, 0.0123, 0.0144, 0.0163, 0.0377, 0.0244,
        0.0440, 0.1045, 0.0260, 0.0078, 0.0182, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3663, 0.0943, 0.0118, 0.0335, 0.0129, 0.0107, 0.0107, 0.0144, 0.0259,
        0.0099, 0.0867, 0.0242, 0.0060, 0.0092, 0.0106, 0.0219, 0.0864, 0.1169,
        0.0230, 0.0106, 0.0141, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3353, 0.0891, 0.0090, 0.0235, 0.0073, 0.0096, 0.0127, 0.0102, 0.0285,
        0.0053, 0.0560, 0.0189, 0.0043, 0.0073, 0.0681, 0.0159, 0.0285, 0.0201,
        0.0393, 0.0363, 0.1231, 0.0152, 0.0166, 0.0047, 0.0152, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1600: [tensor([0.3228, 0.1051, 0.0207, 0.0354, 0.0340, 0.0530, 0.0860, 0.0224, 0.0050,
        0.0059, 0.0107, 0.1746, 0.0169, 0.0420, 0.0485, 0.0170, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4411, 0.0150, 0.0083, 0.0642, 0.0126, 0.0271, 0.0404, 0.0102, 0.0037,
        0.0135, 0.1214, 0.0227, 0.0156, 0.0129, 0.1526, 0.0139, 0.0104, 0.0144,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4634, 0.0110, 0.0173, 0.0799, 0.0208, 0.0534, 0.0426, 0.0091, 0.0080,
        0.0120, 0.0149, 0.0263, 0.0184, 0.0294, 0.0332, 0.1097, 0.0259, 0.0129,
        0.0119, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3024, 0.0114, 0.0147, 0.0917, 0.0138, 0.0283, 0.0542, 0.0119, 0.0072,
        0.0161, 0.1789, 0.0167, 0.0310, 0.0887, 0.0791, 0.0208, 0.0127, 0.0203,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4163, 0.0108, 0.0111, 0.0078, 0.0159, 0.0166, 0.0115, 0.0439, 0.0093,
        0.0032, 0.0057, 0.1110, 0.0195, 0.0132, 0.0647, 0.0228, 0.0286, 0.1065,
        0.0093, 0.0135, 0.0343, 0.0111, 0.0134, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.6161, 0.0227, 0.0227, 0.0192, 0.0268, 0.0198, 0.0155, 0.0551, 0.0160,
        0.0041, 0.0150, 0.0393, 0.0326, 0.0254, 0.0260, 0.0155, 0.0281, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3994, 0.0140, 0.0190, 0.0120, 0.0206, 0.0219, 0.0145, 0.0428, 0.0082,
        0.0028, 0.0071, 0.1754, 0.0265, 0.0216, 0.0896, 0.0202, 0.0424, 0.0221,
        0.0184, 0.0217, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3462, 0.1341, 0.0108, 0.0167, 0.0125, 0.0273, 0.0102, 0.0103, 0.0109,
        0.0145, 0.0089, 0.0099, 0.0148, 0.0113, 0.0218, 0.0574, 0.0137, 0.0088,
        0.0121, 0.1017, 0.0137, 0.0721, 0.0148, 0.0154, 0.0096, 0.0201],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3665, 0.0786, 0.0141, 0.0087, 0.0135, 0.0250, 0.0122, 0.0130, 0.0093,
        0.0111, 0.0126, 0.0095, 0.0125, 0.0038, 0.0221, 0.0477, 0.0190, 0.0061,
        0.0132, 0.0886, 0.0176, 0.1468, 0.0204, 0.0078, 0.0204, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4634, 0.0731, 0.0067, 0.0107, 0.0104, 0.0206, 0.0080, 0.0116, 0.0044,
        0.0130, 0.0071, 0.0105, 0.0163, 0.0095, 0.0144, 0.0422, 0.0178, 0.0041,
        0.0097, 0.0670, 0.0192, 0.1280, 0.0113, 0.0065, 0.0146, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2852, 0.0462, 0.0107, 0.0052, 0.0324, 0.0109, 0.0099, 0.0223, 0.0278,
        0.0080, 0.0060, 0.0049, 0.0920, 0.0094, 0.0085, 0.0038, 0.0084, 0.0547,
        0.0092, 0.0603, 0.0102, 0.0178, 0.2264, 0.0142, 0.0053, 0.0103],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3781, 0.1037, 0.0084, 0.0082, 0.0381, 0.0105, 0.0107, 0.0331, 0.0411,
        0.0105, 0.0084, 0.0074, 0.0650, 0.0101, 0.0068, 0.0039, 0.0121, 0.0702,
        0.0110, 0.0116, 0.1068, 0.0120, 0.0137, 0.0075, 0.0112, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1650: [tensor([0.2900, 0.0675, 0.0099, 0.0054, 0.0067, 0.0115, 0.0106, 0.0366, 0.0067,
        0.0356, 0.0705, 0.0139, 0.0086, 0.0411, 0.0516, 0.0065, 0.0056, 0.0050,
        0.0060, 0.0030, 0.0060, 0.0088, 0.0178, 0.0343, 0.0146, 0.0647, 0.1378,
        0.0128, 0.0046, 0.0064, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2972, 0.0093, 0.0072, 0.0267, 0.0053, 0.0014, 0.0566, 0.0039, 0.0087,
        0.0394, 0.0248, 0.0056, 0.0089, 0.0652, 0.0116, 0.0054, 0.0180, 0.0109,
        0.0082, 0.0036, 0.0288, 0.0051, 0.0158, 0.0352, 0.0144, 0.0041, 0.0050,
        0.0107, 0.0108, 0.0211, 0.0098, 0.0116, 0.0135, 0.0041, 0.1618, 0.0108,
        0.0111, 0.0085], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4031, 0.0062, 0.0068, 0.0190, 0.0062, 0.0008, 0.0317, 0.0044, 0.0089,
        0.0287, 0.0297, 0.0032, 0.0093, 0.0865, 0.0106, 0.0073, 0.0110, 0.0079,
        0.0083, 0.0027, 0.0310, 0.0049, 0.0094, 0.0203, 0.0131, 0.0025, 0.0057,
        0.0121, 0.0097, 0.0225, 0.0059, 0.0121, 0.0060, 0.1284, 0.0084, 0.0089,
        0.0070, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3446, 0.0078, 0.0099, 0.0167, 0.0055, 0.0006, 0.0467, 0.0044, 0.0099,
        0.0322, 0.0216, 0.0048, 0.0145, 0.1030, 0.0101, 0.0068, 0.0173, 0.0104,
        0.0101, 0.0022, 0.0212, 0.0070, 0.0140, 0.0282, 0.0226, 0.0033, 0.0064,
        0.0093, 0.0103, 0.0263, 0.0098, 0.0062, 0.1270, 0.0072, 0.0120, 0.0101,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3355, 0.0619, 0.0104, 0.0201, 0.0910, 0.0074, 0.0078, 0.0054, 0.0093,
        0.0458, 0.0087, 0.0070, 0.0117, 0.0079, 0.0100, 0.0087, 0.0713, 0.0066,
        0.0028, 0.0053, 0.0492, 0.0128, 0.1051, 0.0170, 0.0081, 0.0111, 0.0193,
        0.0161, 0.0116, 0.0050, 0.0101, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2615, 0.1109, 0.0158, 0.0287, 0.1101, 0.0085, 0.0098, 0.0082, 0.0130,
        0.0562, 0.0117, 0.0094, 0.0171, 0.0080, 0.0077, 0.0073, 0.1134, 0.0092,
        0.0047, 0.0096, 0.0668, 0.0188, 0.0228, 0.0133, 0.0280, 0.0098, 0.0098,
        0.0101, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3748, 0.0399, 0.0082, 0.0177, 0.0358, 0.0053, 0.0072, 0.0034, 0.0074,
        0.0359, 0.0075, 0.0040, 0.0095, 0.0063, 0.0052, 0.0050, 0.0548, 0.0068,
        0.0010, 0.0054, 0.0149, 0.0853, 0.1933, 0.0096, 0.0061, 0.0123, 0.0083,
        0.0170, 0.0040, 0.0080, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2742, 0.1226, 0.0282, 0.0046, 0.0931, 0.0138, 0.0183, 0.0072, 0.0113,
        0.0046, 0.0098, 0.0777, 0.0273, 0.0539, 0.0170, 0.0229, 0.1600, 0.0189,
        0.0143, 0.0202, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3892, 0.0876, 0.0159, 0.0076, 0.0753, 0.0128, 0.0139, 0.0041, 0.0115,
        0.0036, 0.0086, 0.1200, 0.0139, 0.1008, 0.0219, 0.0252, 0.0349, 0.0203,
        0.0205, 0.0121, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3149, 0.0617, 0.0130, 0.0112, 0.0424, 0.0116, 0.0136, 0.0016, 0.0091,
        0.0038, 0.0084, 0.0265, 0.1240, 0.1934, 0.0127, 0.0112, 0.1025, 0.0278,
        0.0104, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4551, 0.0093, 0.0080, 0.0108, 0.0108, 0.0050, 0.0095, 0.0049, 0.0130,
        0.0034, 0.0084, 0.0055, 0.0132, 0.0725, 0.0023, 0.0134, 0.0030, 0.0052,
        0.0128, 0.0130, 0.0106, 0.0132, 0.0078, 0.0159, 0.0133, 0.0168, 0.0137,
        0.0078, 0.0239, 0.0082, 0.0229, 0.1272, 0.0044, 0.0208, 0.0068, 0.0075,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3582, 0.0108, 0.0074, 0.0120, 0.0188, 0.0050, 0.0075, 0.0078, 0.0141,
        0.0045, 0.0110, 0.0050, 0.0148, 0.0943, 0.0058, 0.0269, 0.0050, 0.0110,
        0.0238, 0.0321, 0.0166, 0.0125, 0.0095, 0.0218, 0.2268, 0.0057, 0.0162,
        0.0058, 0.0095, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1700: [tensor([0.4127, 0.1179, 0.0315, 0.0025, 0.0124, 0.0238, 0.0215, 0.0104, 0.0054,
        0.0152, 0.0808, 0.0286, 0.0444, 0.0267, 0.0340, 0.0802, 0.0199, 0.0120,
        0.0200, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.5790, 0.0355, 0.0172, 0.0403, 0.0308, 0.0560, 0.0206, 0.0245, 0.0084,
        0.0203, 0.0386, 0.0121, 0.0302, 0.0678, 0.0186, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.5817, 0.0371, 0.0175, 0.0465, 0.0366, 0.0343, 0.0177, 0.0381, 0.0099,
        0.0204, 0.0455, 0.0266, 0.0582, 0.0298, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.5093, 0.0511, 0.0190, 0.0674, 0.0366, 0.0542, 0.0159, 0.0318, 0.0145,
        0.0221, 0.0366, 0.0226, 0.0256, 0.0637, 0.0297, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([4.8704e-01, 7.7599e-03, 8.8067e-03, 3.6838e-03, 5.4283e-03, 5.6674e-03,
        5.7840e-03, 3.2618e-02, 1.3199e-02, 4.9636e-03, 5.0942e-03, 3.7703e-03,
        2.0526e-03, 4.0937e-02, 1.6086e-03, 7.2565e-03, 9.4217e-03, 5.0564e-03,
        5.5985e-03, 7.2757e-02, 3.6689e-03, 2.3741e-03, 1.9512e-03, 5.0001e-03,
        4.1953e-03, 6.2186e-03, 3.2625e-02, 7.9552e-03, 5.1221e-02, 2.5457e-02,
        1.0001e-03, 7.6540e-03, 2.3960e-04, 4.9280e-03, 9.5677e-03, 1.1144e-02,
        1.1158e-02, 6.7074e-03, 3.9201e-03, 5.8840e-03, 6.6299e-03, 3.7307e-02,
        1.4436e-02, 2.8722e-03, 7.3813e-03, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4446, 0.0053, 0.0057, 0.0041, 0.0045, 0.0034, 0.0059, 0.0237, 0.0099,
        0.0046, 0.0018, 0.0035, 0.0027, 0.0414, 0.0019, 0.0049, 0.0104, 0.0037,
        0.0048, 0.0594, 0.0013, 0.0019, 0.0036, 0.0054, 0.0031, 0.0038, 0.0245,
        0.0079, 0.0232, 0.0215, 0.0010, 0.0054, 0.0009, 0.0031, 0.0070, 0.0089,
        0.0065, 0.0076, 0.0037, 0.0089, 0.0051, 0.0068, 0.0129, 0.0061, 0.1429,
        0.0036, 0.0060, 0.0039, 0.0064, 0.0055, 0.0055], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2791, 0.0069, 0.0100, 0.0045, 0.0100, 0.0085, 0.0088, 0.0425, 0.0132,
        0.0072, 0.0056, 0.0057, 0.0053, 0.0661, 0.0025, 0.0074, 0.0162, 0.0047,
        0.0093, 0.0751, 0.0055, 0.0013, 0.0041, 0.0080, 0.0095, 0.0056, 0.0369,
        0.0147, 0.0519, 0.0264, 0.0005, 0.0133, 0.0028, 0.0053, 0.0488, 0.0143,
        0.0465, 0.0166, 0.0212, 0.0409, 0.0026, 0.0189, 0.0074, 0.0083, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3960, 0.0584, 0.0085, 0.0483, 0.0090, 0.0065, 0.0180, 0.0325, 0.0045,
        0.0126, 0.0037, 0.0032, 0.0100, 0.1061, 0.0142, 0.1002, 0.0209, 0.1208,
        0.0097, 0.0058, 0.0113, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3194, 0.0668, 0.0130, 0.0456, 0.0126, 0.0079, 0.0214, 0.0614, 0.0061,
        0.0156, 0.0068, 0.0033, 0.0099, 0.0929, 0.0138, 0.0130, 0.2608, 0.0105,
        0.0059, 0.0131, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2796, 0.0538, 0.0086, 0.0444, 0.0079, 0.0065, 0.0184, 0.0482, 0.0034,
        0.0123, 0.0032, 0.0031, 0.0066, 0.1496, 0.0103, 0.1548, 0.0222, 0.0541,
        0.0124, 0.0221, 0.0430, 0.0035, 0.0157, 0.0066, 0.0029, 0.0068, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3045, 0.0571, 0.0121, 0.0097, 0.0388, 0.0350, 0.0131, 0.0095, 0.0892,
        0.0066, 0.0010, 0.0100, 0.2116, 0.0229, 0.0136, 0.1321, 0.0147, 0.0034,
        0.0151, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3206, 0.0732, 0.0127, 0.0125, 0.0351, 0.0277, 0.0105, 0.0155, 0.0888,
        0.0078, 0.0014, 0.0084, 0.2088, 0.0168, 0.1201, 0.0157, 0.0076, 0.0166,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #1750: [tensor([0.3449, 0.0218, 0.0031, 0.0257, 0.0477, 0.0019, 0.0063, 0.0059, 0.0112,
        0.0125, 0.0033, 0.0448, 0.0027, 0.0082, 0.0034, 0.0240, 0.0050, 0.0013,
        0.0043, 0.0319, 0.0048, 0.0444, 0.0102, 0.0107, 0.2240, 0.0054, 0.0093,
        0.0049, 0.0363, 0.0124, 0.0132, 0.0070, 0.0074], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3143, 0.0762, 0.0066, 0.0503, 0.0740, 0.0030, 0.0130, 0.0086, 0.0189,
        0.0126, 0.0091, 0.0733, 0.0045, 0.0210, 0.0115, 0.0483, 0.0093, 0.0041,
        0.0079, 0.0602, 0.0070, 0.0209, 0.0974, 0.0141, 0.0113, 0.0089, 0.0136,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2840, 0.0291, 0.0036, 0.0298, 0.0371, 0.0023, 0.0065, 0.0042, 0.0098,
        0.0082, 0.0039, 0.0271, 0.0018, 0.0052, 0.0035, 0.0183, 0.0054, 0.0021,
        0.0052, 0.1131, 0.0058, 0.0388, 0.1429, 0.0093, 0.0097, 0.0791, 0.0127,
        0.0127, 0.0072, 0.0583, 0.0034, 0.0129, 0.0071], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3254, 0.0386, 0.0092, 0.0759, 0.0029, 0.0056, 0.0213, 0.0625, 0.0055,
        0.0197, 0.0064, 0.0668, 0.0103, 0.0039, 0.0082, 0.1053, 0.0155, 0.1457,
        0.0359, 0.0144, 0.0086, 0.0123, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2935, 0.0258, 0.0051, 0.0486, 0.0026, 0.0053, 0.0156, 0.0360, 0.0046,
        0.0143, 0.0045, 0.0589, 0.0063, 0.0024, 0.0056, 0.0448, 0.0151, 0.0614,
        0.0126, 0.3104, 0.0122, 0.0045, 0.0100, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4249, 0.0468, 0.0101, 0.0549, 0.0051, 0.0040, 0.0226, 0.0704, 0.0029,
        0.0248, 0.0084, 0.1060, 0.0075, 0.0050, 0.0078, 0.0624, 0.0176, 0.0823,
        0.0174, 0.0055, 0.0138, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4970, 0.0665, 0.0069, 0.0433, 0.0061, 0.0083, 0.0115, 0.0080, 0.0069,
        0.0376, 0.0040, 0.0177, 0.0017, 0.0082, 0.0488, 0.0121, 0.0107, 0.0155,
        0.0143, 0.0168, 0.0146, 0.0130, 0.0891, 0.0249, 0.0049, 0.0117, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4170, 0.0887, 0.0133, 0.0551, 0.0072, 0.0101, 0.0067, 0.0078, 0.0073,
        0.0447, 0.0041, 0.0104, 0.0053, 0.0119, 0.1567, 0.0128, 0.0139, 0.0109,
        0.0652, 0.0107, 0.0218, 0.0036, 0.0148, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4652, 0.0822, 0.0065, 0.0716, 0.0120, 0.0087, 0.0099, 0.0114, 0.0093,
        0.0521, 0.0037, 0.0215, 0.0032, 0.0112, 0.0645, 0.0112, 0.0457, 0.0159,
        0.0158, 0.0163, 0.0159, 0.0209, 0.0109, 0.0145, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2884, 0.0597, 0.0145, 0.0080, 0.0026, 0.0028, 0.0322, 0.0067, 0.0160,
        0.0189, 0.0385, 0.0083, 0.0023, 0.0087, 0.2078, 0.0102, 0.1627, 0.0074,
        0.0149, 0.0623, 0.0093, 0.0054, 0.0124, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2957, 0.0904, 0.0154, 0.0080, 0.0036, 0.0018, 0.0339, 0.0087, 0.0123,
        0.0161, 0.0371, 0.0156, 0.0039, 0.0090, 0.1328, 0.0108, 0.1124, 0.0931,
        0.0716, 0.0066, 0.0093, 0.0118, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3581, 0.0937, 0.0130, 0.0101, 0.0014, 0.0044, 0.0330, 0.0077, 0.0162,
        0.0212, 0.0414, 0.0104, 0.0042, 0.0087, 0.2096, 0.0080, 0.1155, 0.0130,
        0.0125, 0.0070, 0.0110, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #1800: [tensor([0.3757, 0.1242, 0.0087, 0.0104, 0.0101, 0.0071, 0.0106, 0.0103, 0.0189,
        0.0423, 0.0044, 0.0045, 0.0105, 0.0184, 0.0095, 0.0318, 0.2690, 0.0132,
        0.0056, 0.0147, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5010, 0.0714, 0.0094, 0.0071, 0.0082, 0.0035, 0.0081, 0.0077, 0.0155,
        0.0448, 0.0085, 0.0026, 0.0100, 0.0127, 0.0086, 0.0182, 0.0313, 0.2028,
        0.0085, 0.0065, 0.0137, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5128, 0.1262, 0.0180, 0.0171, 0.0198, 0.0083, 0.0143, 0.0201, 0.0322,
        0.0778, 0.0097, 0.0020, 0.0131, 0.0266, 0.0154, 0.0272, 0.0331, 0.0114,
        0.0149, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3492, 0.0076, 0.0148, 0.0175, 0.0373, 0.0552, 0.0082, 0.0072, 0.1059,
        0.0075, 0.0349, 0.0064, 0.0046, 0.0023, 0.0071, 0.0596, 0.0121, 0.0774,
        0.0129, 0.0130, 0.1236, 0.0209, 0.0058, 0.0091, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3668, 0.0093, 0.0143, 0.0365, 0.0304, 0.0579, 0.0081, 0.0106, 0.0393,
        0.0051, 0.0313, 0.0100, 0.0042, 0.0013, 0.0066, 0.0639, 0.0280, 0.0536,
        0.0110, 0.0129, 0.1267, 0.0204, 0.0149, 0.0089, 0.0075, 0.0051, 0.0061,
        0.0092, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([3.9306e-01, 8.4823e-03, 1.6793e-02, 2.5090e-02, 3.3440e-02, 4.6949e-02,
        7.5730e-03, 7.8145e-03, 8.1686e-02, 6.9117e-03, 2.3246e-02, 5.7116e-03,
        3.5241e-03, 2.0651e-04, 6.3272e-03, 5.3240e-02, 2.1915e-02, 1.7701e-02,
        1.4253e-02, 1.4800e-02, 1.8547e-02, 9.4087e-02, 6.9569e-03, 1.3397e-02,
        4.9715e-02, 1.0392e-02, 3.4870e-03, 5.2048e-03, 9.4923e-03, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 2.9947e-01,  7.9384e-03,  9.6027e-03,  3.9040e-02,  5.5854e-02,
         2.3053e-03,  4.5904e-03,  8.3983e-03,  7.0740e-02,  5.7229e-03,
         4.7329e-03,  4.7307e-02,  4.4403e-03,  7.3710e-03, -2.3029e-04,
         4.1790e-03,  6.8304e-02,  1.4339e-02,  4.2468e-02,  2.0536e-01,
         8.2359e-03,  7.9667e-03,  3.4818e-02,  1.7278e-02,  1.3648e-02,
         5.6289e-03,  1.0039e-02,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3685, 0.0134, 0.0122, 0.0646, 0.0873, 0.0049, 0.0084, 0.0122, 0.0808,
        0.0074, 0.0063, 0.0832, 0.0047, 0.0143, 0.0021, 0.0086, 0.0472, 0.0436,
        0.0229, 0.0269, 0.0493, 0.0100, 0.0077, 0.0134, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3726, 0.0098, 0.0100, 0.0410, 0.0862, 0.0026, 0.0061, 0.0094, 0.0508,
        0.0068, 0.0052, 0.0554, 0.0044, 0.0100, 0.0014, 0.0074, 0.0684, 0.0166,
        0.0372, 0.0195, 0.0595, 0.0851, 0.0169, 0.0050, 0.0127, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3606, 0.0455, 0.0066, 0.0060, 0.0463, 0.0060, 0.0085, 0.0055, 0.0634,
        0.0041, 0.0057, 0.0087, 0.0281, 0.0489, 0.0048, 0.0137, 0.0024, 0.0070,
        0.0686, 0.0069, 0.0113, 0.0646, 0.1467, 0.0172, 0.0044, 0.0084, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2915, 0.0906, 0.0081, 0.0096, 0.0796, 0.0063, 0.0058, 0.0052, 0.0742,
        0.0048, 0.0104, 0.0076, 0.0378, 0.1707, 0.0064, 0.0158, 0.0050, 0.0093,
        0.1112, 0.0118, 0.0125, 0.0062, 0.0066, 0.0131, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3718, 0.0487, 0.0040, 0.0073, 0.0451, 0.0065, 0.0054, 0.0047, 0.0478,
        0.0038, 0.0049, 0.0091, 0.0257, 0.0469, 0.0031, 0.0109, 0.0031, 0.0059,
        0.0385, 0.0087, 0.0093, 0.0228, 0.0085, 0.0124, 0.0769, 0.0409, 0.0105,
        0.0055, 0.0141, 0.0335, 0.0066, 0.0063, 0.0140, 0.0085, 0.0066, 0.0087,
        0.0053, 0.0079], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1850: [tensor([0.3319, 0.0408, 0.0045, 0.0077, 0.0049, 0.0075, 0.0204, 0.0073, 0.0056,
        0.0113, 0.0033, 0.0025, 0.0070, 0.0040, 0.0210, 0.0584, 0.0040, 0.0048,
        0.0046, 0.0051, 0.0038, 0.0257, 0.0020, 0.0013, 0.0041, 0.0930, 0.0048,
        0.0113, 0.0087, 0.0069, 0.0098, 0.0084, 0.0096, 0.0080, 0.1394, 0.0048,
        0.0072, 0.0103, 0.0071, 0.0361, 0.0101, 0.0146, 0.0104, 0.0062, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4655, 0.0415, 0.0071, 0.0065, 0.0055, 0.0079, 0.0316, 0.0083, 0.0090,
        0.0096, 0.0030, 0.0027, 0.0102, 0.0064, 0.0169, 0.0678, 0.0041, 0.0072,
        0.0046, 0.0044, 0.0045, 0.0335, 0.0025, 0.0012, 0.0059, 0.0433, 0.0089,
        0.0078, 0.0109, 0.0094, 0.0172, 0.0077, 0.0128, 0.0437, 0.0102, 0.0090,
        0.0079, 0.0097, 0.0043, 0.0075, 0.0037, 0.0105, 0.0077, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3581, 0.0825, 0.0061, 0.0077, 0.0057, 0.0096, 0.0340, 0.0127, 0.0082,
        0.0135, 0.0062, 0.0062, 0.0124, 0.0102, 0.0406, 0.0920, 0.0063, 0.0058,
        0.0095, 0.0114, 0.0055, 0.0376, 0.0040, 0.0031, 0.0080, 0.1071, 0.0211,
        0.0335, 0.0151, 0.0056, 0.0071, 0.0136, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3132, 0.0511, 0.0094, 0.0071, 0.0056, 0.0095, 0.0521, 0.0070, 0.0098,
        0.0109, 0.0052, 0.0041, 0.0139, 0.0108, 0.0336, 0.1072, 0.0069, 0.0053,
        0.0088, 0.0074, 0.0086, 0.0436, 0.0034, 0.0022, 0.0048, 0.1335, 0.0176,
        0.0869, 0.0062, 0.0021, 0.0123, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4363, 0.0409, 0.0052, 0.0059, 0.0049, 0.0070, 0.0280, 0.0084, 0.0083,
        0.0096, 0.0017, 0.0041, 0.0076, 0.0046, 0.0199, 0.0700, 0.0056, 0.0033,
        0.0064, 0.0069, 0.0069, 0.0242, 0.0026, 0.0012, 0.0040, 0.0423, 0.0073,
        0.0099, 0.0082, 0.0068, 0.0057, 0.0050, 0.0093, 0.0060, 0.0132, 0.0508,
        0.0063, 0.0048, 0.0089, 0.0067, 0.0455, 0.0076, 0.0239, 0.0085, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3662, 0.0435, 0.0087, 0.0074, 0.0042, 0.0086, 0.0340, 0.0075, 0.0099,
        0.0096, 0.0053, 0.0037, 0.0107, 0.0081, 0.0396, 0.1139, 0.0073, 0.0068,
        0.0079, 0.0083, 0.0081, 0.0334, 0.0047, 0.0022, 0.0052, 0.1286, 0.0207,
        0.0205, 0.0125, 0.0189, 0.0092, 0.0091, 0.0067, 0.0089, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3264, 0.0482, 0.0057, 0.0063, 0.0059, 0.0068, 0.0286, 0.0048, 0.0055,
        0.0083, 0.0024, 0.0038, 0.0085, 0.0069, 0.0198, 0.0852, 0.0034, 0.0039,
        0.0050, 0.0079, 0.0051, 0.0276, 0.0027, 0.0015, 0.0047, 0.1402, 0.0108,
        0.0552, 0.0131, 0.1194, 0.0153, 0.0045, 0.0068, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2866, 0.0508, 0.0049, 0.0053, 0.0051, 0.0068, 0.0198, 0.0045, 0.0067,
        0.0082, 0.0027, 0.0038, 0.0066, 0.0069, 0.0253, 0.0954, 0.0048, 0.0040,
        0.0063, 0.0042, 0.0046, 0.0272, 0.0030, 0.0014, 0.0035, 0.0953, 0.0116,
        0.0608, 0.1488, 0.0106, 0.0099, 0.0117, 0.0097, 0.0123, 0.0086, 0.0095,
        0.0061, 0.0063, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3541, 0.0596, 0.0068, 0.0046, 0.0042, 0.0072, 0.0243, 0.0075, 0.0074,
        0.0109, 0.0051, 0.0034, 0.0085, 0.0072, 0.0299, 0.1118, 0.0050, 0.0049,
        0.0059, 0.0061, 0.0060, 0.0376, 0.0024, 0.0006, 0.0051, 0.1448, 0.0108,
        0.0065, 0.0132, 0.0492, 0.0051, 0.0105, 0.0089, 0.0083, 0.0053, 0.0114,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3360, 0.0593, 0.0071, 0.0042, 0.0045, 0.0087, 0.0372, 0.0112, 0.0095,
        0.0138, 0.0038, 0.0061, 0.0111, 0.0083, 0.0292, 0.0981, 0.0088, 0.0035,
        0.0067, 0.0086, 0.0077, 0.0420, 0.0027, 0.0038, 0.0073, 0.1110, 0.0148,
        0.0863, 0.0170, 0.0165, 0.0065, 0.0087, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2686, 0.0250, 0.0027, 0.0037, 0.0021, 0.0045, 0.0159, 0.0041, 0.0046,
        0.0064, 0.0021, 0.0020, 0.0048, 0.0028, 0.0149, 0.0408, 0.0028, 0.0038,
        0.0044, 0.0048, 0.0042, 0.0200, 0.0023, 0.0010, 0.0029, 0.1010, 0.0043,
        0.0056, 0.0066, 0.0080, 0.0096, 0.0057, 0.0059, 0.0061, 0.1370, 0.0041,
        0.0092, 0.0083, 0.0047, 0.0242, 0.0058, 0.0122, 0.0060, 0.0063, 0.0766,
        0.0042, 0.0068, 0.0085, 0.0307, 0.0304, 0.0032, 0.0023, 0.0062, 0.0034,
        0.0058], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2797, 0.0269, 0.0044, 0.0041, 0.0037, 0.0047, 0.0275, 0.0042, 0.0065,
        0.0055, 0.0035, 0.0026, 0.0079, 0.0057, 0.0181, 0.0619, 0.0032, 0.0032,
        0.0062, 0.0067, 0.0034, 0.0232, 0.0017, 0.0019, 0.0043, 0.0750, 0.0051,
        0.0075, 0.0060, 0.0063, 0.0111, 0.1239, 0.0057, 0.0513, 0.1599, 0.0208,
        0.0067, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #1900: [tensor([0.5267, 0.0153, 0.0291, 0.0276, 0.0308, 0.0202, 0.0609, 0.0203, 0.0035,
        0.0183, 0.0222, 0.0463, 0.0271, 0.0303, 0.0232, 0.0592, 0.0104, 0.0285,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3817, 0.0145, 0.0077, 0.0113, 0.0143, 0.0171, 0.0516, 0.0116, 0.0065,
        0.0110, 0.0424, 0.0187, 0.0132, 0.0171, 0.1145, 0.2241, 0.0297, 0.0056,
        0.0075, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3739, 0.0810, 0.0033, 0.0145, 0.0106, 0.0303, 0.0681, 0.0048, 0.0047,
        0.0061, 0.0075, 0.0183, 0.0034, 0.0074, 0.0131, 0.0204, 0.0389, 0.0068,
        0.0052, 0.1389, 0.0068, 0.0221, 0.0058, 0.0144, 0.0005, 0.0081, 0.0011,
        0.0440, 0.0297, 0.0108, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4509, 0.0648, 0.0034, 0.0131, 0.0072, 0.0241, 0.0431, 0.0039, 0.0057,
        0.0047, 0.0053, 0.0125, 0.0055, 0.0071, 0.0058, 0.0184, 0.0246, 0.0086,
        0.0050, 0.0960, 0.0027, 0.0158, 0.0096, 0.0133, 0.0017, 0.0033, 0.0254,
        0.0876, 0.0250, 0.0060, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([3.5187e-01, 7.9957e-02, 3.0634e-04, 1.4849e-02, 1.2868e-02, 3.0772e-02,
        8.0435e-02, 3.6108e-03, 5.0378e-03, 6.1592e-03, 9.0936e-03, 1.1993e-02,
        5.8553e-03, 9.0172e-03, 7.7217e-03, 1.7286e-02, 2.4533e-02, 8.1901e-03,
        2.7337e-03, 1.8652e-01, 5.1436e-03, 2.1213e-02, 1.0821e-02, 1.5275e-02,
        1.1030e-03, 8.4763e-03, 2.7376e-02, 2.7273e-02, 1.4510e-02, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3474, 0.0437, 0.0091, 0.0345, 0.0066, 0.0119, 0.0457, 0.0109, 0.0033,
        0.0075, 0.0041, 0.0401, 0.0071, 0.0038, 0.0055, 0.0082, 0.0130, 0.0039,
        0.0055, 0.0067, 0.0040, 0.0047, 0.0086, 0.0865, 0.0124, 0.0042, 0.0030,
        0.0076, 0.0024, 0.0042, 0.1404, 0.0113, 0.0558, 0.0048, 0.0142, 0.0053,
        0.0040, 0.0081, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3183, 0.0346, 0.0087, 0.0299, 0.0065, 0.0102, 0.0388, 0.0076, 0.0023,
        0.0058, 0.0042, 0.0435, 0.0047, 0.0041, 0.0025, 0.0064, 0.0172, 0.0018,
        0.0057, 0.0067, 0.0042, 0.0057, 0.0099, 0.0764, 0.0151, 0.0052, 0.0022,
        0.0072, 0.0021, 0.0040, 0.0667, 0.0107, 0.0186, 0.1570, 0.0132, 0.0188,
        0.0115, 0.0034, 0.0085, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3615, 0.0585, 0.0090, 0.0249, 0.0055, 0.0134, 0.0338, 0.0105, 0.0019,
        0.0091, 0.0062, 0.0539, 0.0065, 0.0042, 0.0073, 0.0072, 0.0172, 0.0033,
        0.0052, 0.0072, 0.0031, 0.0062, 0.0106, 0.0745, 0.0153, 0.0046, 0.0031,
        0.0065, 0.0026, 0.0038, 0.0378, 0.0073, 0.0124, 0.0440, 0.0189, 0.0055,
        0.0069, 0.0142, 0.0485, 0.0160, 0.0025, 0.0094], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3815, 0.0344, 0.0072, 0.0317, 0.0080, 0.0094, 0.0434, 0.0077, 0.0036,
        0.0093, 0.0061, 0.0402, 0.0053, 0.0016, 0.0067, 0.0051, 0.0132, 0.0014,
        0.0061, 0.0048, 0.0027, 0.0050, 0.0099, 0.0742, 0.0107, 0.0038, 0.0031,
        0.0089, 0.0019, 0.0038, 0.0143, 0.0040, 0.0062, 0.0102, 0.0260, 0.0167,
        0.0906, 0.0112, 0.0484, 0.0107, 0.0043, 0.0067], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2984, 0.0810, 0.0136, 0.0221, 0.0058, 0.0117, 0.0392, 0.0098, 0.0031,
        0.0066, 0.0041, 0.0393, 0.0064, 0.0026, 0.0066, 0.0084, 0.0162, 0.0027,
        0.0044, 0.0069, 0.0033, 0.0079, 0.0100, 0.0861, 0.0128, 0.0035, 0.0036,
        0.0049, 0.0044, 0.0031, 0.0999, 0.0108, 0.0455, 0.0105, 0.0831, 0.0072,
        0.0062, 0.0083, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3170, 0.0466, 0.0099, 0.0245, 0.0054, 0.0093, 0.0290, 0.0073, 0.0026,
        0.0053, 0.0042, 0.0243, 0.0035, 0.0035, 0.0047, 0.0049, 0.0111, 0.0015,
        0.0050, 0.0036, 0.0023, 0.0032, 0.0087, 0.0441, 0.0158, 0.0032, 0.0034,
        0.0065, 0.0008, 0.0040, 0.0900, 0.0088, 0.0400, 0.0057, 0.0615, 0.0045,
        0.1566, 0.0082, 0.0039, 0.0055, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2270, 0.0588, 0.0086, 0.0350, 0.0051, 0.0098, 0.0381, 0.0087, 0.0028,
        0.0052, 0.0043, 0.0352, 0.0047, 0.0050, 0.0034, 0.0061, 0.0105, 0.0020,
        0.0046, 0.0065, 0.0027, 0.0044, 0.0083, 0.0407, 0.0129, 0.0032, 0.0026,
        0.0065, 0.0016, 0.0032, 0.0281, 0.0099, 0.0770, 0.0085, 0.0441, 0.0102,
        0.2278, 0.0081, 0.0082, 0.0039, 0.0066, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #1950: [tensor([0.4287, 0.0480, 0.0091, 0.0063, 0.0162, 0.0076, 0.0894, 0.0137, 0.0165,
        0.0437, 0.0324, 0.0055, 0.0039, 0.0100, 0.0102, 0.0240, 0.0679, 0.0165,
        0.0121, 0.0549, 0.0603, 0.0127, 0.0103, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2716, 0.0951, 0.0060, 0.0087, 0.0148, 0.0093, 0.0821, 0.0122, 0.0198,
        0.0486, 0.0359, 0.0095, 0.0034, 0.0088, 0.0196, 0.1492, 0.0161, 0.0879,
        0.0491, 0.0235, 0.0200, 0.0088, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2355, 0.0512, 0.0044, 0.0066, 0.0088, 0.0099, 0.0840, 0.0096, 0.0105,
        0.0483, 0.0266, 0.0038, 0.0036, 0.0056, 0.0940, 0.0140, 0.1102, 0.0094,
        0.0138, 0.1990, 0.0124, 0.0165, 0.0073, 0.0046, 0.0105],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3727, 0.0722, 0.0096, 0.0114, 0.0269, 0.0087, 0.0034, 0.0058, 0.0879,
        0.0097, 0.0009, 0.0062, 0.1314, 0.0165, 0.0167, 0.0781, 0.0163, 0.0093,
        0.0123, 0.0143, 0.0091, 0.0592, 0.0046, 0.0050, 0.0118],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 3.2835e-01,  6.8171e-02,  1.3106e-02,  1.7537e-02,  5.0461e-02,
         1.4002e-02,  5.5650e-03,  7.5293e-03,  6.7331e-02,  1.2784e-02,
        -2.5008e-04,  6.9400e-03,  1.4564e-01,  1.5501e-02,  2.8308e-02,
         1.3049e-01,  1.8685e-02,  1.8754e-02,  3.2203e-02,  4.7138e-03,
         1.3685e-02,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2600, 0.0581, 0.0159, 0.0142, 0.0383, 0.0112, 0.0050, 0.0026, 0.0820,
        0.0100, 0.0025, 0.0091, 0.1513, 0.0163, 0.0223, 0.1188, 0.0244, 0.0150,
        0.0115, 0.0134, 0.0949, 0.0103, 0.0034, 0.0095, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2922, 0.0165, 0.0053, 0.0032, 0.0099, 0.0370, 0.0547, 0.0172, 0.0137,
        0.0028, 0.0095, 0.0189, 0.0279, 0.0562, 0.0102, 0.0179, 0.3331, 0.0328,
        0.0193, 0.0058, 0.0158, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4247, 0.0204, 0.0090, 0.0068, 0.0127, 0.0476, 0.1487, 0.0146, 0.0139,
        0.0028, 0.0090, 0.0944, 0.0378, 0.0146, 0.0140, 0.0145, 0.0198, 0.0044,
        0.0161, 0.0240, 0.0299, 0.0051, 0.0149, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4139, 0.0236, 0.0094, 0.0135, 0.0159, 0.0447, 0.1763, 0.0238, 0.0136,
        0.0049, 0.0116, 0.0807, 0.0224, 0.0167, 0.0299, 0.0604, 0.0091, 0.0294,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2633, 0.0372, 0.0120, 0.0734, 0.0294, 0.0734, 0.0065, 0.0083, 0.0041,
        0.0110, 0.0410, 0.0178, 0.1822, 0.0133, 0.0713, 0.1085, 0.0069, 0.0161,
        0.0079, 0.0163, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3030, 0.0262, 0.0089, 0.0483, 0.0182, 0.0396, 0.0027, 0.0073, 0.0025,
        0.0067, 0.0285, 0.0116, 0.0573, 0.0267, 0.1168, 0.0139, 0.0140, 0.0468,
        0.0130, 0.0074, 0.0041, 0.1782, 0.0038, 0.0035, 0.0109],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2462, 0.0423, 0.0215, 0.0720, 0.0310, 0.0768, 0.0045, 0.0109, 0.0044,
        0.0096, 0.0602, 0.0244, 0.0694, 0.0393, 0.2123, 0.0259, 0.0252, 0.0082,
        0.0159, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2000: [tensor([0.4599, 0.0210, 0.0197, 0.0568, 0.0287, 0.0844, 0.0195, 0.0082, 0.0209,
        0.0204, 0.0071, 0.0149, 0.0257, 0.0474, 0.0863, 0.0393, 0.0174, 0.0225,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.5186, 0.0222, 0.0208, 0.0562, 0.0195, 0.0761, 0.0199, 0.0114, 0.0229,
        0.0160, 0.0030, 0.0171, 0.0293, 0.0392, 0.0643, 0.0212, 0.0131, 0.0291,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3991, 0.0993, 0.0141, 0.0283, 0.0361, 0.0106, 0.0172, 0.0439, 0.0143,
        0.0480, 0.0731, 0.0105, 0.0042, 0.0094, 0.0156, 0.0192, 0.0245, 0.0569,
        0.0168, 0.0134, 0.0087, 0.0197, 0.0169, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3572, 0.0499, 0.0191, 0.0173, 0.0203, 0.0086, 0.0098, 0.0334, 0.0066,
        0.0443, 0.0607, 0.0113, 0.0045, 0.0068, 0.0115, 0.0187, 0.0168, 0.0946,
        0.0150, 0.0485, 0.0910, 0.0041, 0.0146, 0.0242, 0.0112, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3353, 0.0844, 0.0191, 0.0286, 0.0413, 0.0129, 0.0078, 0.0474, 0.0207,
        0.0520, 0.0901, 0.0127, 0.0063, 0.0138, 0.0235, 0.0215, 0.0230, 0.1173,
        0.0255, 0.0169, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4569, 0.0094, 0.0078, 0.0045, 0.0096, 0.0087, 0.0133, 0.0061, 0.0111,
        0.0238, 0.0051, 0.0110, 0.0079, 0.0103, 0.0071, 0.0057, 0.0068, 0.0108,
        0.0749, 0.0097, 0.0048, 0.0010, 0.0063, 0.0177, 0.0149, 0.0254, 0.0741,
        0.0196, 0.0213, 0.0118, 0.0111, 0.0105, 0.0105, 0.0065, 0.0269, 0.0137,
        0.0081, 0.0063, 0.0091, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4228, 0.0099, 0.0154, 0.0087, 0.0159, 0.0099, 0.0150, 0.0092, 0.0111,
        0.0233, 0.0090, 0.0145, 0.0136, 0.0126, 0.0079, 0.0100, 0.0096, 0.0183,
        0.1080, 0.0086, 0.0093, 0.0028, 0.0080, 0.0123, 0.0213, 0.0752, 0.0395,
        0.0245, 0.0128, 0.0205, 0.0070, 0.0137, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.4774, 0.0127, 0.0088, 0.0055, 0.0118, 0.0113, 0.0097, 0.0094, 0.0115,
        0.0167, 0.0073, 0.0120, 0.0124, 0.0103, 0.0064, 0.0076, 0.0074, 0.0247,
        0.1519, 0.0096, 0.0080, 0.0020, 0.0082, 0.0183, 0.0117, 0.0105, 0.0188,
        0.0195, 0.0176, 0.0177, 0.0126, 0.0133, 0.0064, 0.0110, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([3.0799e-01, 2.3995e-02, 5.6511e-03, 3.7162e-03, 3.2877e-03, 4.1058e-03,
        2.0318e-02, 2.4262e-02, 5.4445e-03, 8.3896e-03, 3.6885e-03, 4.0581e-03,
        4.2550e-02, 1.3259e-03, 5.4684e-03, 2.9554e-02, 6.0642e-03, 3.6093e-03,
        5.0552e-03, 5.3944e-03, 4.6096e-03, 6.9939e-03, 7.5085e-02, 2.8127e-03,
        4.1502e-02, 6.8010e-02, 2.3445e-03, 5.3639e-03, 2.7517e-03, 1.2656e-04,
        4.6066e-03, 3.9484e-03, 4.1499e-03, 2.2771e-03, 8.4201e-02, 4.3716e-03,
        2.8694e-04, 4.4769e-03, 5.3448e-02, 5.6113e-03, 1.8575e-03, 8.7771e-02,
        8.0632e-03, 5.2658e-03, 1.8654e-03, 4.2695e-03, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3325, 0.0450, 0.0057, 0.0028, 0.0028, 0.0037, 0.0230, 0.0324, 0.0048,
        0.0117, 0.0056, 0.0042, 0.0347, 0.0019, 0.0061, 0.0392, 0.0056, 0.0057,
        0.0051, 0.0092, 0.0050, 0.0065, 0.0691, 0.0033, 0.0273, 0.0504, 0.0013,
        0.0044, 0.0024, 0.0006, 0.0040, 0.0047, 0.0037, 0.0024, 0.0738, 0.0061,
        0.0012, 0.0041, 0.0569, 0.0068, 0.0019, 0.0098, 0.0225, 0.0108, 0.0027,
        0.0064, 0.0134, 0.0058, 0.0038, 0.0072], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([3.4833e-01, 3.5286e-02, 6.4136e-03, 3.2753e-03, 2.9896e-03, 3.4090e-03,
        1.8085e-02, 2.4276e-02, 5.3933e-03, 7.8632e-03, 2.6908e-03, 4.5068e-03,
        5.4045e-02, 2.2225e-03, 7.5309e-03, 2.7271e-02, 4.9289e-03, 5.4342e-03,
        4.5702e-03, 6.6848e-03, 3.9702e-03, 7.8538e-03, 4.9043e-02, 2.6042e-03,
        2.9433e-02, 5.4876e-02, 8.5938e-04, 3.9401e-03, 2.0087e-03, 3.3072e-04,
        3.3534e-03, 2.1839e-03, 3.6445e-03, 1.4883e-03, 5.3398e-02, 5.8754e-03,
        3.1345e-04, 4.0809e-03, 6.8299e-02, 5.7056e-03, 1.5053e-03, 8.7115e-03,
        6.3657e-03, 9.6151e-03, 7.1171e-02, 8.7148e-03, 6.7453e-03, 2.2130e-03,
        6.4941e-03, 0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4551, 0.0135, 0.0186, 0.0257, 0.0720, 0.1054, 0.0206, 0.0114, 0.0209,
        0.0169, 0.0244, 0.0290, 0.0367, 0.0149, 0.0898, 0.0229, 0.0222, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #2050: [tensor([0.3554, 0.0333, 0.0099, 0.0066, 0.0069, 0.0099, 0.0039, 0.0051, 0.0690,
        0.0102, 0.0077, 0.0067, 0.0058, 0.0048, 0.0396, 0.0091, 0.0479, 0.0080,
        0.0141, 0.1018, 0.0045, 0.0107, 0.0018, 0.0142, 0.0137, 0.0030, 0.0099,
        0.0053, 0.0025, 0.0129, 0.0110, 0.0022, 0.0048, 0.0381, 0.0132, 0.0702,
        0.0092, 0.0065, 0.0050, 0.0059, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2936, 0.0492, 0.0088, 0.0063, 0.0049, 0.0101, 0.0023, 0.0055, 0.0582,
        0.0102, 0.0074, 0.0053, 0.0058, 0.0016, 0.0324, 0.0104, 0.0467, 0.0094,
        0.0125, 0.0679, 0.0035, 0.0078, 0.0028, 0.0176, 0.0093, 0.0026, 0.0074,
        0.0029, 0.0027, 0.0129, 0.0109, 0.0028, 0.0041, 0.0459, 0.0112, 0.1329,
        0.0159, 0.0358, 0.0088, 0.0046, 0.0035, 0.0056], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3505, 0.0438, 0.0101, 0.0046, 0.0420, 0.0054, 0.0030, 0.0070, 0.0234,
        0.0808, 0.0077, 0.0063, 0.0056, 0.0111, 0.0068, 0.0182, 0.1083, 0.0070,
        0.0021, 0.0051, 0.1131, 0.0083, 0.0132, 0.0847, 0.0123, 0.0054, 0.0064,
        0.0077, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3475, 0.0474, 0.0102, 0.0073, 0.0306, 0.0028, 0.0034, 0.0078, 0.0165,
        0.0747, 0.0081, 0.0058, 0.0092, 0.0080, 0.0082, 0.0184, 0.1186, 0.0063,
        0.0004, 0.0049, 0.0488, 0.0093, 0.0144, 0.0994, 0.0083, 0.0051, 0.0162,
        0.0047, 0.0149, 0.0250, 0.0088, 0.0029, 0.0062, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2711, 0.0476, 0.0131, 0.0051, 0.0552, 0.0049, 0.0032, 0.0066, 0.0201,
        0.0648, 0.0098, 0.0050, 0.0078, 0.0134, 0.0070, 0.0206, 0.0895, 0.0072,
        0.0027, 0.0074, 0.1002, 0.0139, 0.0192, 0.1409, 0.0296, 0.0092, 0.0106,
        0.0042, 0.0102, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2571, 0.0443, 0.0129, 0.0369, 0.0073, 0.0101, 0.0063, 0.0248, 0.0075,
        0.0135, 0.0045, 0.0275, 0.0099, 0.0097, 0.0053, 0.0013, 0.0111, 0.1065,
        0.0112, 0.0767, 0.0118, 0.0767, 0.1801, 0.0103, 0.0192, 0.0060, 0.0114,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2371, 0.0344, 0.0091, 0.0344, 0.0077, 0.0120, 0.0074, 0.0425, 0.0079,
        0.0136, 0.0038, 0.0298, 0.0116, 0.0074, 0.0076, 0.0025, 0.0070, 0.0932,
        0.0136, 0.0815, 0.0129, 0.0413, 0.2504, 0.0158, 0.0053, 0.0050, 0.0052,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3305, 0.0337, 0.0103, 0.0311, 0.0073, 0.0069, 0.0056, 0.0219, 0.0069,
        0.0125, 0.0026, 0.0240, 0.0097, 0.0060, 0.0060, 0.0031, 0.0084, 0.1870,
        0.0121, 0.0500, 0.0136, 0.0342, 0.1455, 0.0093, 0.0090, 0.0046, 0.0083,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2304, 0.0515, 0.0069, 0.0291, 0.0546, 0.0056, 0.0028, 0.0182, 0.0077,
        0.0240, 0.0061, 0.0156, 0.0523, 0.0036, 0.0038, 0.0009, 0.0057, 0.1187,
        0.0100, 0.0540, 0.0085, 0.0368, 0.2308, 0.0071, 0.0071, 0.0083, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2525, 0.0360, 0.0098, 0.0345, 0.0596, 0.0050, 0.0027, 0.0147, 0.0107,
        0.0201, 0.0064, 0.0243, 0.0680, 0.0049, 0.0048, 0.0039, 0.0083, 0.1267,
        0.0141, 0.0654, 0.0119, 0.0310, 0.1596, 0.0085, 0.0079, 0.0089, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1989, 0.0362, 0.0071, 0.0303, 0.0463, 0.0034, 0.0026, 0.0163, 0.0080,
        0.0199, 0.0049, 0.0161, 0.0359, 0.0045, 0.0035, 0.0019, 0.0071, 0.0669,
        0.0114, 0.0786, 0.0094, 0.0361, 0.1417, 0.0063, 0.0050, 0.0117, 0.1748,
        0.0082, 0.0072, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2702, 0.0701, 0.0121, 0.0127, 0.0764, 0.0052, 0.0112, 0.0110, 0.0186,
        0.0045, 0.0062, 0.1041, 0.0176, 0.1056, 0.0190, 0.0151, 0.0180, 0.1977,
        0.0112, 0.0137, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #2100: [tensor([0.4389, 0.0118, 0.0022, 0.0095, 0.0129, 0.0139, 0.0133, 0.0106, 0.0151,
        0.0164, 0.0233, 0.0181, 0.0068, 0.0191, 0.0766, 0.0236, 0.0048, 0.0093,
        0.0606, 0.0308, 0.0470, 0.0112, 0.0899, 0.0160, 0.0066, 0.0118, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3096, 0.0367, 0.0070, 0.0327, 0.0076, 0.0237, 0.0078, 0.0057, 0.0054,
        0.0103, 0.0034, 0.0027, 0.0441, 0.0120, 0.0045, 0.0024, 0.0100, 0.0050,
        0.0330, 0.0068, 0.0006, 0.0050, 0.1787, 0.0119, 0.0107, 0.0165, 0.0560,
        0.0142, 0.0099, 0.0127, 0.0846, 0.0193, 0.0040, 0.0056],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([3.8636e-01, 6.9572e-02, 1.1770e-02, 5.6640e-02, 1.4615e-02, 6.4885e-02,
        1.4287e-02, 4.2480e-03, 8.2945e-03, 1.4770e-02, 3.6626e-03, 3.6082e-03,
        9.8404e-02, 1.0673e-02, 9.8279e-03, 4.5633e-03, 2.4849e-02, 4.7878e-03,
        5.7118e-02, 1.3308e-02, 5.7706e-05, 5.9573e-03, 7.9847e-03, 1.6805e-02,
        4.3808e-02, 2.1350e-02, 1.0575e-02, 5.4729e-03, 1.1751e-02, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3465, 0.0498, 0.0115, 0.0302, 0.0099, 0.0492, 0.0100, 0.0057, 0.0072,
        0.0123, 0.0014, 0.0048, 0.0722, 0.0111, 0.0065, 0.0025, 0.0144, 0.0073,
        0.0501, 0.0088, 0.0019, 0.0059, 0.0090, 0.0104, 0.0511, 0.0072, 0.1420,
        0.0159, 0.0153, 0.0099, 0.0061, 0.0045, 0.0090, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4224, 0.0862, 0.0109, 0.0191, 0.0097, 0.0094, 0.0325, 0.0038, 0.0051,
        0.0163, 0.0367, 0.0048, 0.0043, 0.0090, 0.0569, 0.0268, 0.0441, 0.0194,
        0.0484, 0.0088, 0.0178, 0.0817, 0.0066, 0.0076, 0.0117, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3348, 0.0832, 0.0070, 0.0246, 0.0138, 0.0088, 0.0309, 0.0080, 0.0112,
        0.0087, 0.0426, 0.0041, 0.0039, 0.0100, 0.0725, 0.0352, 0.0918, 0.0236,
        0.0704, 0.0831, 0.0074, 0.0044, 0.0200, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4895, 0.0616, 0.0126, 0.0183, 0.0121, 0.0081, 0.0261, 0.0075, 0.0065,
        0.0167, 0.0411, 0.0018, 0.0048, 0.0080, 0.0551, 0.0292, 0.0720, 0.0241,
        0.0360, 0.0180, 0.0213, 0.0076, 0.0078, 0.0143, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2810, 0.0098, 0.0091, 0.0675, 0.0037, 0.0080, 0.0635, 0.0099, 0.0378,
        0.0033, 0.0156, 0.0025, 0.0074, 0.1230, 0.0070, 0.0984, 0.0089, 0.0145,
        0.1185, 0.0259, 0.0435, 0.0016, 0.0220, 0.0060, 0.0116, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3053, 0.0077, 0.0084, 0.0436, 0.0021, 0.0035, 0.0515, 0.0087, 0.0321,
        0.0015, 0.0112, 0.0019, 0.0071, 0.1133, 0.0122, 0.0124, 0.1111, 0.0063,
        0.0112, 0.1252, 0.0108, 0.0695, 0.0060, 0.0271, 0.0030, 0.0074, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3486, 0.0111, 0.0112, 0.0503, 0.0038, 0.0052, 0.0559, 0.0110, 0.0416,
        0.0041, 0.0144, 0.0031, 0.0097, 0.1119, 0.0112, 0.0782, 0.0055, 0.0131,
        0.1097, 0.0159, 0.0384, 0.0035, 0.0277, 0.0054, 0.0095, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3976, 0.0185, 0.0252, 0.0217, 0.0145, 0.0161, 0.0151, 0.0216, 0.0280,
        0.0032, 0.0139, 0.2343, 0.0284, 0.0435, 0.0501, 0.0259, 0.0125, 0.0301,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5125, 0.0246, 0.0311, 0.0251, 0.0230, 0.0361, 0.0226, 0.0336, 0.0314,
        0.0093, 0.0204, 0.0646, 0.0497, 0.0751, 0.0126, 0.0281, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2150: [tensor([0.3608, 0.0193, 0.0212, 0.0726, 0.0293, 0.0420, 0.0625, 0.0138, 0.0057,
        0.0184, 0.1408, 0.0178, 0.0414, 0.0454, 0.0811, 0.0127, 0.0152, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3049, 0.0079, 0.0106, 0.0533, 0.0296, 0.0249, 0.0386, 0.0126, 0.0031,
        0.0083, 0.1287, 0.0068, 0.0203, 0.2311, 0.0178, 0.0215, 0.0197, 0.0077,
        0.0175, 0.0175, 0.0039, 0.0137, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2896, 0.0495, 0.0058, 0.0396, 0.0114, 0.0041, 0.0631, 0.0111, 0.0158,
        0.0033, 0.0038, 0.0772, 0.0130, 0.0754, 0.0077, 0.0113, 0.2723, 0.0130,
        0.0205, 0.0048, 0.0076, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1881, 0.0458, 0.0113, 0.0560, 0.0126, 0.0058, 0.0774, 0.0086, 0.0174,
        0.0024, 0.0068, 0.1059, 0.0144, 0.0730, 0.0118, 0.0323, 0.2903, 0.0107,
        0.0125, 0.0066, 0.0102, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3102, 0.0602, 0.0104, 0.0548, 0.0101, 0.0069, 0.0426, 0.0104, 0.0150,
        0.0037, 0.0062, 0.0766, 0.0159, 0.0833, 0.0084, 0.0157, 0.0101, 0.0902,
        0.0146, 0.0102, 0.0856, 0.0183, 0.0294, 0.0034, 0.0079, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2201, 0.0056, 0.0583, 0.0854, 0.0036, 0.0068, 0.0564, 0.0029, 0.0079,
        0.0040, 0.0078, 0.0052, 0.0131, 0.0042, 0.0147, 0.0053, 0.0119, 0.0062,
        0.0298, 0.1071, 0.0027, 0.0015, 0.0056, 0.0433, 0.0117, 0.0614, 0.0491,
        0.1496, 0.0073, 0.0031, 0.0085], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2501, 0.0061, 0.0545, 0.0686, 0.0016, 0.0086, 0.0409, 0.0033, 0.0052,
        0.0035, 0.0050, 0.0065, 0.0188, 0.0048, 0.0175, 0.0089, 0.0116, 0.0071,
        0.0409, 0.0657, 0.0047, 0.0039, 0.0046, 0.0351, 0.0089, 0.0928, 0.1960,
        0.0091, 0.0062, 0.0094, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2257, 0.0041, 0.0608, 0.0698, 0.0022, 0.0076, 0.0577, 0.0024, 0.0088,
        0.0046, 0.0060, 0.0059, 0.0157, 0.0044, 0.0158, 0.0054, 0.0137, 0.0099,
        0.0293, 0.0842, 0.0049, 0.0022, 0.0057, 0.0387, 0.0117, 0.0563, 0.0545,
        0.1549, 0.0227, 0.0042, 0.0102], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3463, 0.0085, 0.0829, 0.1348, 0.0115, 0.0074, 0.0047, 0.0174, 0.0117,
        0.0352, 0.0734, 0.0070, 0.0056, 0.0020, 0.0075, 0.0485, 0.0886, 0.0469,
        0.0137, 0.0320, 0.0144, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2114, 0.0074, 0.1504, 0.0937, 0.0089, 0.0071, 0.0067, 0.0132, 0.0098,
        0.0244, 0.0597, 0.0074, 0.0063, 0.0014, 0.0066, 0.0318, 0.1216, 0.2127,
        0.0090, 0.0103, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3147, 0.0060, 0.0842, 0.1261, 0.0093, 0.0078, 0.0073, 0.0138, 0.0161,
        0.0206, 0.0805, 0.0079, 0.0044, 0.0041, 0.0074, 0.0400, 0.2008, 0.0177,
        0.0120, 0.0081, 0.0113, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3731, 0.0759, 0.0092, 0.0086, 0.0091, 0.0100, 0.0112, 0.0192, 0.0141,
        0.0089, 0.0137, 0.0110, 0.0196, 0.0021, 0.0064, 0.0640, 0.0154, 0.0484,
        0.1445, 0.0130, 0.0123, 0.0226, 0.0294, 0.0088, 0.0204, 0.0076, 0.0216,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #2200: [tensor([0.3852, 0.0487, 0.0840, 0.0345, 0.0243, 0.0508, 0.0335, 0.0150, 0.0305,
        0.0264, 0.0265, 0.1111, 0.0724, 0.0195, 0.0376, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3212, 0.0134, 0.0259, 0.0135, 0.0068, 0.0148, 0.0140, 0.0069, 0.0116,
        0.0118, 0.0223, 0.0525, 0.0708, 0.3301, 0.0214, 0.0309, 0.0133, 0.0189,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2689, 0.0421, 0.0087, 0.0337, 0.0080, 0.0062, 0.0064, 0.0047, 0.0069,
        0.0140, 0.0286, 0.0081, 0.0300, 0.0065, 0.0131, 0.0841, 0.0219, 0.0055,
        0.0023, 0.0059, 0.0057, 0.0021, 0.0046, 0.0766, 0.0130, 0.0101, 0.2062,
        0.0293, 0.0078, 0.0095, 0.0150, 0.0046, 0.0102, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2357, 0.0782, 0.0121, 0.0442, 0.0103, 0.0100, 0.0117, 0.0057, 0.0109,
        0.0211, 0.0344, 0.0106, 0.0373, 0.0081, 0.0149, 0.1005, 0.0286, 0.0089,
        0.0034, 0.0080, 0.0060, 0.0014, 0.0084, 0.1868, 0.0155, 0.0076, 0.0143,
        0.0128, 0.0196, 0.0206, 0.0037, 0.0090, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2669, 0.0391, 0.0070, 0.0407, 0.0098, 0.0068, 0.0070, 0.0052, 0.0087,
        0.0176, 0.0233, 0.0074, 0.0357, 0.0066, 0.0148, 0.0800, 0.0201, 0.0061,
        0.0034, 0.0079, 0.0041, 0.0021, 0.0046, 0.1905, 0.0098, 0.0096, 0.0064,
        0.0137, 0.0103, 0.0095, 0.0174, 0.0075, 0.0143, 0.0393, 0.0338, 0.0035,
        0.0095], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3025, 0.0941, 0.0129, 0.0235, 0.0136, 0.0277, 0.0342, 0.0534, 0.0095,
        0.0096, 0.0842, 0.0101, 0.0050, 0.0090, 0.0746, 0.0287, 0.0195, 0.0828,
        0.0368, 0.0325, 0.0251, 0.0108, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3927, 0.0761, 0.0107, 0.0250, 0.0144, 0.0226, 0.0382, 0.0529, 0.0128,
        0.0060, 0.0551, 0.0093, 0.0035, 0.0102, 0.0628, 0.0211, 0.0209, 0.1212,
        0.0162, 0.0141, 0.0142, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3316, 0.0926, 0.0103, 0.0274, 0.0169, 0.0187, 0.0470, 0.0727, 0.0101,
        0.0088, 0.0898, 0.0076, 0.0043, 0.0113, 0.0717, 0.0226, 0.0198, 0.0870,
        0.0333, 0.0165, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2295, 0.0796, 0.0107, 0.0088, 0.0190, 0.0396, 0.0156, 0.0084, 0.0778,
        0.0085, 0.0079, 0.0032, 0.0066, 0.1682, 0.0172, 0.0150, 0.0884, 0.1620,
        0.0194, 0.0145, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2202, 0.0474, 0.0144, 0.0153, 0.0246, 0.0374, 0.0083, 0.0078, 0.0782,
        0.0117, 0.0116, 0.0026, 0.0073, 0.1689, 0.0136, 0.0215, 0.0697, 0.2134,
        0.0151, 0.0110, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2550, 0.0409, 0.0104, 0.0109, 0.0379, 0.0344, 0.0115, 0.0065, 0.0697,
        0.0099, 0.0099, 0.0019, 0.0077, 0.1340, 0.0126, 0.0189, 0.0981, 0.1949,
        0.0080, 0.0177, 0.0093, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3399, 0.0096, 0.0047, 0.0090, 0.0133, 0.0094, 0.0052, 0.0117, 0.0370,
        0.0045, 0.0029, 0.0083, 0.0442, 0.0209, 0.0458, 0.0220, 0.3435, 0.0232,
        0.0165, 0.0079, 0.0061, 0.0143, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2250: [tensor([0.3528, 0.0198, 0.0081, 0.0196, 0.0091, 0.0183, 0.0043, 0.0119, 0.2364,
        0.0302, 0.0079, 0.0652, 0.0838, 0.0170, 0.0267, 0.0128, 0.0377, 0.0146,
        0.0238, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3878, 0.0114, 0.0164, 0.0045, 0.0920, 0.0096, 0.0135, 0.0045, 0.0134,
        0.0055, 0.0511, 0.0098, 0.0309, 0.0182, 0.0021, 0.0094, 0.0169, 0.0072,
        0.0147, 0.0099, 0.1867, 0.0194, 0.0320, 0.0195, 0.0135, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4540, 0.0113, 0.0178, 0.0037, 0.1061, 0.0109, 0.0130, 0.0097, 0.0107,
        0.0091, 0.1027, 0.0101, 0.0220, 0.0216, 0.0009, 0.0101, 0.0212, 0.0138,
        0.0525, 0.0239, 0.0146, 0.0023, 0.0226, 0.0145, 0.0206, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3754, 0.0115, 0.0141, 0.0047, 0.0775, 0.0170, 0.0114, 0.0042, 0.0097,
        0.0088, 0.0926, 0.0119, 0.0205, 0.0142, 0.0038, 0.0125, 0.0365, 0.0603,
        0.0256, 0.0109, 0.1396, 0.0250, 0.0125, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4166, 0.0140, 0.0302, 0.0071, 0.0531, 0.0063, 0.0284, 0.1176, 0.0153,
        0.0143, 0.0020, 0.0181, 0.0212, 0.0740, 0.0286, 0.0658, 0.0317, 0.0136,
        0.0139, 0.0280, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4310, 0.0158, 0.0320, 0.0161, 0.0676, 0.0046, 0.0305, 0.0901, 0.0174,
        0.0101, 0.0011, 0.0133, 0.0922, 0.0118, 0.0991, 0.0176, 0.0146, 0.0077,
        0.0102, 0.0170, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([2.8185e-01, 1.5457e-02, 2.2567e-02, 1.1751e-02, 5.1948e-02, 3.0545e-03,
        2.4596e-02, 5.0649e-02, 1.2058e-02, 1.1088e-02, 6.6129e-05, 8.8974e-03,
        7.6308e-02, 1.4483e-02, 1.6524e-02, 1.6102e-02, 3.1771e-01, 1.7429e-02,
        2.9267e-02, 6.5510e-03, 1.1642e-02, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1802, 0.0247, 0.0050, 0.0242, 0.0072, 0.0011, 0.0052, 0.0120, 0.0188,
        0.0059, 0.0068, 0.0145, 0.0036, 0.0027, 0.0030, 0.0055, 0.0158, 0.0078,
        0.0022, 0.0396, 0.0051, 0.0041, 0.0062, 0.0180, 0.0066, 0.0046, 0.2313,
        0.0082, 0.0060, 0.0044, 0.0662, 0.0073, 0.0043, 0.0041, 0.1324, 0.0083,
        0.0042, 0.0055, 0.0075, 0.0124, 0.0070, 0.0044, 0.0057, 0.0367, 0.0048,
        0.0022, 0.0069], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2860, 0.0783, 0.0086, 0.0268, 0.0093, 0.0020, 0.0075, 0.0229, 0.0250,
        0.0091, 0.0110, 0.0259, 0.0050, 0.0033, 0.0039, 0.0073, 0.0163, 0.0124,
        0.0032, 0.0622, 0.0072, 0.0071, 0.0070, 0.0286, 0.0079, 0.0045, 0.1471,
        0.0124, 0.0041, 0.0124, 0.0169, 0.0088, 0.0065, 0.0312, 0.0526, 0.0093,
        0.0036, 0.0066, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2887, 0.0289, 0.0076, 0.0377, 0.0100, 0.0019, 0.0066, 0.0202, 0.0225,
        0.0109, 0.0081, 0.0216, 0.0048, 0.0044, 0.0044, 0.0071, 0.0205, 0.0160,
        0.0036, 0.0686, 0.0079, 0.0072, 0.0101, 0.0246, 0.0082, 0.0060, 0.0083,
        0.0225, 0.0049, 0.0063, 0.1141, 0.0120, 0.0151, 0.0490, 0.0119, 0.0174,
        0.0617, 0.0093, 0.0027, 0.0067, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3783, 0.0181, 0.0400, 0.0034, 0.0841, 0.0134, 0.0145, 0.0104, 0.0167,
        0.0078, 0.0026, 0.0119, 0.0228, 0.1259, 0.0091, 0.1682, 0.0122, 0.0271,
        0.0140, 0.0086, 0.0112, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4515, 0.0139, 0.0542, 0.0054, 0.1115, 0.0126, 0.0231, 0.0108, 0.0187,
        0.0132, 0.0031, 0.0074, 0.0183, 0.0184, 0.0173, 0.0501, 0.0223, 0.0435,
        0.0242, 0.0238, 0.0264, 0.0062, 0.0063, 0.0177, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2300: [tensor([0.3732, 0.0103, 0.0109, 0.0489, 0.0104, 0.0097, 0.0222, 0.0129, 0.0060,
        0.0132, 0.0135, 0.0093, 0.1366, 0.0161, 0.0201, 0.0062, 0.0154, 0.0120,
        0.0018, 0.0095, 0.0777, 0.0115, 0.0201, 0.0541, 0.0206, 0.0074, 0.0257,
        0.0089, 0.0159, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2780, 0.0881, 0.0169, 0.0296, 0.0799, 0.0115, 0.0126, 0.0190, 0.0160,
        0.0099, 0.0035, 0.0111, 0.0652, 0.0241, 0.0121, 0.2030, 0.0357, 0.0274,
        0.0206, 0.0123, 0.0062, 0.0172, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3363, 0.0718, 0.0233, 0.0399, 0.0942, 0.0080, 0.0144, 0.0116, 0.0192,
        0.0112, 0.0024, 0.0125, 0.1673, 0.0140, 0.0181, 0.0180, 0.0465, 0.0302,
        0.0200, 0.0226, 0.0072, 0.0113, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2380, 0.1028, 0.0215, 0.0322, 0.0944, 0.0111, 0.0139, 0.0153, 0.0162,
        0.0125, 0.0030, 0.0124, 0.2861, 0.0102, 0.0165, 0.0289, 0.0221, 0.0109,
        0.0152, 0.0138, 0.0067, 0.0164, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3521, 0.0961, 0.0149, 0.0159, 0.1140, 0.0130, 0.0120, 0.0212, 0.0811,
        0.0102, 0.0052, 0.0081, 0.1346, 0.0164, 0.0172, 0.0297, 0.0170, 0.0222,
        0.0062, 0.0128, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2165, 0.0726, 0.0113, 0.0103, 0.0479, 0.0082, 0.0085, 0.0161, 0.0674,
        0.0086, 0.0063, 0.0092, 0.1743, 0.0142, 0.0128, 0.0521, 0.2155, 0.0160,
        0.0169, 0.0059, 0.0095, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2309, 0.0657, 0.0105, 0.0113, 0.0847, 0.0078, 0.0126, 0.0185, 0.0658,
        0.0122, 0.0054, 0.0073, 0.1208, 0.0146, 0.0136, 0.2180, 0.0181, 0.0196,
        0.0275, 0.0102, 0.0100, 0.0044, 0.0104, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3467, 0.0119, 0.0175, 0.0032, 0.0058, 0.0106, 0.0779, 0.0046, 0.0171,
        0.0816, 0.0069, 0.0051, 0.0086, 0.0157, 0.0240, 0.0132, 0.3028, 0.0155,
        0.0092, 0.0119, 0.0104, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3565, 0.0133, 0.0204, 0.0043, 0.0107, 0.0109, 0.0958, 0.0088, 0.0199,
        0.0818, 0.0073, 0.0012, 0.0119, 0.1859, 0.0195, 0.0367, 0.0255, 0.0365,
        0.0183, 0.0143, 0.0056, 0.0148, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3613, 0.0112, 0.0167, 0.0032, 0.0094, 0.0128, 0.1016, 0.0048, 0.0210,
        0.0702, 0.0058, 0.0033, 0.0135, 0.0125, 0.0208, 0.0127, 0.0325, 0.0118,
        0.2162, 0.0234, 0.0144, 0.0029, 0.0179, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2363, 0.0476, 0.0032, 0.0046, 0.0116, 0.0017, 0.0090, 0.0120, 0.0061,
        0.0295, 0.0438, 0.0108, 0.0139, 0.0110, 0.0028, 0.0153, 0.0080, 0.0096,
        0.0101, 0.0024, 0.0047, 0.1562, 0.0080, 0.0086, 0.0191, 0.0166, 0.0263,
        0.0078, 0.0126, 0.0195, 0.0330, 0.1546, 0.0129, 0.0151, 0.0066, 0.0090],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3789, 0.0596, 0.0041, 0.0068, 0.0179, 0.0024, 0.0089, 0.0140, 0.0075,
        0.0543, 0.0393, 0.0114, 0.0166, 0.0168, 0.0011, 0.0110, 0.0100, 0.0095,
        0.0152, 0.0004, 0.0049, 0.1260, 0.0127, 0.0290, 0.0209, 0.0327, 0.0208,
        0.0120, 0.0130, 0.0192, 0.0080, 0.0047, 0.0104, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2350: [tensor([3.1239e-01, 1.0457e-02, 2.0709e-02, 3.0154e-02, 1.9754e-02, 5.1814e-02,
        6.7488e-03, 1.4803e-02, 9.3550e-03, 1.0998e-02, 1.1697e-02, 1.7097e-02,
        2.5832e-01, 1.7114e-02, 1.2533e-04, 1.1066e-02, 6.3104e-02, 2.5121e-02,
        4.6354e-02, 2.1101e-02, 1.4248e-02, 5.2172e-03, 2.2248e-02, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3739, 0.0201, 0.0200, 0.0433, 0.0280, 0.1335, 0.0372, 0.0152, 0.0015,
        0.0145, 0.0816, 0.0326, 0.1097, 0.0498, 0.0095, 0.0296, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3821, 0.0229, 0.0322, 0.0232, 0.0328, 0.1325, 0.0316, 0.0212, 0.0101,
        0.0208, 0.1075, 0.0254, 0.0765, 0.0240, 0.0157, 0.0416, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4385, 0.0172, 0.0333, 0.0268, 0.0322, 0.1082, 0.0340, 0.0146, 0.0091,
        0.0176, 0.1102, 0.0269, 0.0814, 0.0190, 0.0124, 0.0187, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4136, 0.1133, 0.0125, 0.0222, 0.1266, 0.0116, 0.0086, 0.0221, 0.0060,
        0.0164, 0.0259, 0.1035, 0.0280, 0.0309, 0.0353, 0.0236, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4172, 0.0982, 0.0170, 0.0174, 0.1809, 0.0076, 0.0090, 0.0193, 0.0116,
        0.0143, 0.0338, 0.1210, 0.0277, 0.0250, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3335, 0.1228, 0.0211, 0.0256, 0.1700, 0.0122, 0.0086, 0.0189, 0.0082,
        0.0159, 0.0289, 0.1506, 0.0451, 0.0193, 0.0192, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3019, 0.0571, 0.0143, 0.0100, 0.0332, 0.0247, 0.0133, 0.0171, 0.0113,
        0.0127, 0.0103, 0.0112, 0.0062, 0.0056, 0.0131, 0.1500, 0.0090, 0.0089,
        0.0159, 0.0063, 0.0007, 0.0071, 0.0554, 0.0121, 0.1515, 0.0213, 0.0060,
        0.0136, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3216, 0.0906, 0.0207, 0.0101, 0.0316, 0.0323, 0.0117, 0.0132, 0.0114,
        0.0169, 0.0121, 0.0080, 0.0067, 0.0073, 0.0156, 0.0907, 0.0089, 0.0101,
        0.0133, 0.0091, 0.0022, 0.0086, 0.0689, 0.0090, 0.1362, 0.0104, 0.0055,
        0.0172, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2609, 0.0719, 0.0136, 0.0064, 0.0346, 0.0260, 0.0100, 0.0114, 0.0088,
        0.0107, 0.0079, 0.0070, 0.0052, 0.0037, 0.0117, 0.0756, 0.0104, 0.0061,
        0.0113, 0.0046, 0.0017, 0.0069, 0.0395, 0.0102, 0.1253, 0.0051, 0.0070,
        0.0099, 0.1449, 0.0275, 0.0070, 0.0068, 0.0105, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3368, 0.0626, 0.0055, 0.0077, 0.0054, 0.0097, 0.0105, 0.0051, 0.0040,
        0.0422, 0.0045, 0.0307, 0.0704, 0.0072, 0.0137, 0.0059, 0.0080, 0.0101,
        0.0085, 0.0291, 0.0096, 0.0153, 0.0034, 0.0075, 0.1685, 0.0096, 0.0084,
        0.0260, 0.0163, 0.0213, 0.0141, 0.0095, 0.0045, 0.0087],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2763, 0.0594, 0.0055, 0.0086, 0.0070, 0.0077, 0.0068, 0.0056, 0.0041,
        0.0458, 0.0076, 0.0266, 0.0509, 0.0089, 0.0111, 0.0061, 0.0056, 0.0082,
        0.0126, 0.0240, 0.0062, 0.0160, 0.0020, 0.0054, 0.2946, 0.0082, 0.0113,
        0.0131, 0.0087, 0.0198, 0.0070, 0.0076, 0.0043, 0.0077],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2400: [tensor([0.2722, 0.1173, 0.0144, 0.0157, 0.0118, 0.0114, 0.0977, 0.0078, 0.0157,
        0.0087, 0.0099, 0.0108, 0.0028, 0.0115, 0.1430, 0.0274, 0.1763, 0.0175,
        0.0094, 0.0185, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3322, 0.0894, 0.0153, 0.0090, 0.0066, 0.0076, 0.0561, 0.0048, 0.0152,
        0.0095, 0.0076, 0.0082, 0.0037, 0.0074, 0.1929, 0.0157, 0.0169, 0.0142,
        0.1408, 0.0123, 0.0172, 0.0038, 0.0137, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3260, 0.0476, 0.0107, 0.0077, 0.0078, 0.0053, 0.0940, 0.0037, 0.0145,
        0.0095, 0.0068, 0.0053, 0.0028, 0.0073, 0.1058, 0.0162, 0.1092, 0.0145,
        0.0096, 0.1493, 0.0086, 0.0137, 0.0068, 0.0056, 0.0118],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2127, 0.0862, 0.0143, 0.0127, 0.0087, 0.0068, 0.0440, 0.0046, 0.0152,
        0.0071, 0.0042, 0.0076, 0.0038, 0.0079, 0.1286, 0.0163, 0.1491, 0.0131,
        0.0094, 0.2049, 0.0198, 0.0071, 0.0161, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2417, 0.0765, 0.0118, 0.0120, 0.0116, 0.0096, 0.0537, 0.0083, 0.0173,
        0.0109, 0.0070, 0.0106, 0.0036, 0.0084, 0.1076, 0.0240, 0.1750, 0.0160,
        0.1540, 0.0081, 0.0197, 0.0020, 0.0107, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3008, 0.0960, 0.0261, 0.0124, 0.0125, 0.0142, 0.0986, 0.0066, 0.0193,
        0.0102, 0.0109, 0.0088, 0.0086, 0.0131, 0.1786, 0.0231, 0.0171, 0.0234,
        0.0745, 0.0146, 0.0104, 0.0046, 0.0156, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3112, 0.0791, 0.0160, 0.0140, 0.0128, 0.0116, 0.0634, 0.0065, 0.0157,
        0.0117, 0.0102, 0.0075, 0.0082, 0.0073, 0.0876, 0.0225, 0.1937, 0.0319,
        0.0181, 0.0177, 0.0135, 0.0160, 0.0065, 0.0172, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3575, 0.0873, 0.0232, 0.0201, 0.0152, 0.0132, 0.1058, 0.0061, 0.0210,
        0.0104, 0.0060, 0.0086, 0.0037, 0.0091, 0.2256, 0.0230, 0.0366, 0.0067,
        0.0211, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2524, 0.1146, 0.0179, 0.0116, 0.0106, 0.0068, 0.0854, 0.0057, 0.0222,
        0.0127, 0.0074, 0.0084, 0.0008, 0.0103, 0.1572, 0.0273, 0.1685, 0.0200,
        0.0098, 0.0312, 0.0073, 0.0121, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3968, 0.0149, 0.0189, 0.0301, 0.0160, 0.0507, 0.0101, 0.0077, 0.0118,
        0.0160, 0.0073, 0.0476, 0.0135, 0.0021, 0.0092, 0.0821, 0.0348, 0.1439,
        0.0242, 0.0226, 0.0140, 0.0073, 0.0182, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3069, 0.0127, 0.0133, 0.0222, 0.0121, 0.0399, 0.0101, 0.0099, 0.0114,
        0.0121, 0.0077, 0.0427, 0.0120, 0.0022, 0.0091, 0.0691, 0.0233, 0.0983,
        0.0175, 0.2229, 0.0218, 0.0059, 0.0168, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3386, 0.0112, 0.0105, 0.0210, 0.0105, 0.0300, 0.0077, 0.0096, 0.0095,
        0.0127, 0.0087, 0.0412, 0.0173, 0.0036, 0.0068, 0.2094, 0.0341, 0.0963,
        0.0602, 0.0115, 0.0127, 0.0159, 0.0077, 0.0134, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2450: [tensor([0.1894, 0.0185, 0.0310, 0.0091, 0.0167, 0.0168, 0.0290, 0.0148, 0.0174,
        0.0291, 0.0622, 0.0050, 0.0244, 0.0171, 0.0092, 0.2036, 0.0123, 0.0227,
        0.0099, 0.0196, 0.0069, 0.0119, 0.0240, 0.0393, 0.0542, 0.0272, 0.0250,
        0.0188, 0.0144, 0.0207, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3171, 0.0121, 0.0128, 0.0033, 0.0087, 0.0114, 0.0128, 0.0075, 0.0194,
        0.0146, 0.0348, 0.0064, 0.0116, 0.0152, 0.0070, 0.0982, 0.0072, 0.0129,
        0.0055, 0.0093, 0.0023, 0.0079, 0.0174, 0.0206, 0.1979, 0.0069, 0.0119,
        0.0607, 0.0292, 0.0047, 0.0127], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2051, 0.0074, 0.0132, 0.0077, 0.0114, 0.0079, 0.0147, 0.0066, 0.0100,
        0.0758, 0.0074, 0.0141, 0.0024, 0.0079, 0.0156, 0.0281, 0.0523, 0.0573,
        0.0537, 0.0097, 0.0253, 0.3224, 0.0246, 0.0061, 0.0130, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2696, 0.0140, 0.0163, 0.0084, 0.0141, 0.0138, 0.0154, 0.0102, 0.0108,
        0.1135, 0.0061, 0.0216, 0.0063, 0.0105, 0.0199, 0.0719, 0.0333, 0.2738,
        0.0153, 0.0269, 0.0095, 0.0188, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3289, 0.0152, 0.0233, 0.0060, 0.0113, 0.0203, 0.0213, 0.0106, 0.0122,
        0.1204, 0.0083, 0.0194, 0.0059, 0.0129, 0.0068, 0.0336, 0.0863, 0.0356,
        0.0165, 0.0441, 0.0889, 0.0377, 0.0131, 0.0213, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2848, 0.0086, 0.0160, 0.0041, 0.0073, 0.0026, 0.0151, 0.0141, 0.0126,
        0.0131, 0.0439, 0.0038, 0.0116, 0.0045, 0.0066, 0.1702, 0.0174, 0.0128,
        0.1144, 0.0097, 0.0286, 0.0165, 0.0209, 0.1188, 0.0221, 0.0067, 0.0133,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3130, 0.0132, 0.0269, 0.0103, 0.0164, 0.0063, 0.0283, 0.0337, 0.0150,
        0.0214, 0.0744, 0.0076, 0.0217, 0.0043, 0.0104, 0.0875, 0.0349, 0.0553,
        0.0759, 0.0271, 0.0110, 0.0146, 0.0253, 0.0364, 0.0077, 0.0214, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3654, 0.0127, 0.0221, 0.0069, 0.0096, 0.0058, 0.0209, 0.0153, 0.0167,
        0.0218, 0.0521, 0.0082, 0.0248, 0.0036, 0.0054, 0.0146, 0.0236, 0.0126,
        0.0113, 0.0245, 0.0348, 0.0337, 0.0045, 0.1668, 0.0125, 0.0119, 0.0350,
        0.0085, 0.0145, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3047, 0.0694, 0.0138, 0.0070, 0.0128, 0.0075, 0.0138, 0.0099, 0.0129,
        0.0154, 0.0009, 0.0127, 0.0158, 0.1231, 0.3275, 0.0325, 0.0204, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3009, 0.1033, 0.0177, 0.0096, 0.0166, 0.0090, 0.0133, 0.0110, 0.0176,
        0.0271, 0.0013, 0.0118, 0.0136, 0.1088, 0.2255, 0.0591, 0.0071, 0.0321,
        0.0145, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.3915,  0.1380,  0.0266,  0.0122,  0.0264,  0.0129,  0.0188,  0.0096,
         0.0217,  0.0344, -0.0018,  0.0172,  0.0156,  0.1249,  0.0647,  0.0076,
         0.0539,  0.0221,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1749, 0.1662, 0.0130, 0.0157, 0.0073, 0.0143, 0.0340, 0.0074, 0.0121,
        0.0047, 0.0035, 0.0024, 0.0096, 0.0710, 0.0161, 0.1566, 0.0232, 0.2369,
        0.0123, 0.0045, 0.0144, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #2500: [tensor([0.2615, 0.0830, 0.0189, 0.0127, 0.0158, 0.0085, 0.0276, 0.0148, 0.0132,
        0.0417, 0.0915, 0.0035, 0.0059, 0.0095, 0.1622, 0.0148, 0.0221, 0.0161,
        0.0435, 0.0211, 0.0639, 0.0242, 0.0076, 0.0165, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3413, 0.0997, 0.0243, 0.0155, 0.0186, 0.0056, 0.0325, 0.0110, 0.0130,
        0.0594, 0.0819, 0.0038, 0.0039, 0.0126, 0.0974, 0.0184, 0.0205, 0.0775,
        0.0270, 0.0126, 0.0078, 0.0156, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2480, 0.1495, 0.0235, 0.0099, 0.0240, 0.0070, 0.0335, 0.0122, 0.0169,
        0.0760, 0.1208, 0.0046, 0.0035, 0.0117, 0.0925, 0.0221, 0.0191, 0.0810,
        0.0140, 0.0123, 0.0178, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2731, 0.0394, 0.0025, 0.0150, 0.0082, 0.0215, 0.0390, 0.0064, 0.0054,
        0.0087, 0.0058, 0.0090, 0.0499, 0.0104, 0.0070, 0.1885, 0.0102, 0.0028,
        0.0059, 0.0651, 0.0119, 0.1205, 0.0242, 0.0129, 0.0220, 0.0204, 0.0067,
        0.0077], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 2.0243e-01,  4.1350e-02, -1.1016e-04,  1.4797e-02,  1.1965e-02,
         3.7852e-02,  6.1504e-02,  1.0039e-02,  4.9614e-03,  9.5153e-03,
         4.7684e-03,  1.0407e-02,  8.7060e-02,  1.2683e-02,  1.1243e-02,
         1.0636e-01,  1.0597e-02,  4.5410e-03,  8.5025e-03,  5.5085e-02,
         1.3025e-02,  1.3007e-01,  1.2860e-02,  1.1528e-02,  9.1114e-02,
         1.7781e-02,  3.7864e-03,  1.4064e-02], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.1920,  0.0775, -0.0002,  0.0153,  0.0087,  0.0329,  0.0783,  0.0071,
         0.0058,  0.0076,  0.0058,  0.0092,  0.0841,  0.0153,  0.0057,  0.1434,
         0.0111,  0.0036,  0.0082,  0.0597,  0.0189,  0.0782,  0.0151,  0.0788,
         0.0269,  0.0106,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2912, 0.0860, 0.0063, 0.0185, 0.0069, 0.0101, 0.0055, 0.0077, 0.0132,
        0.0060, 0.0106, 0.0047, 0.1091, 0.0024, 0.0011, 0.0126, 0.0035, 0.0093,
        0.0428, 0.0868, 0.1964, 0.0090, 0.0217, 0.0171, 0.0087, 0.0130, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 3.5887e-01,  9.3431e-02,  1.0787e-02,  2.2274e-02,  1.5494e-02,
         1.3189e-02,  8.6547e-03,  9.9429e-03,  2.1375e-02,  8.4312e-03,
         7.1715e-03,  3.6127e-03,  8.6888e-02,  4.0560e-03, -9.5517e-05,
         1.9177e-02,  6.1178e-03,  1.4290e-02,  1.6978e-02,  3.5125e-02,
         8.0902e-02,  1.5156e-02,  6.0156e-02,  2.5444e-02,  4.9366e-02,
         1.3022e-02,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.3279,  0.0943,  0.0197,  0.0299,  0.0148,  0.0167,  0.0113,  0.0139,
         0.0278,  0.0084,  0.0121,  0.0060,  0.1126,  0.0029, -0.0005,  0.0189,
         0.0069,  0.0158,  0.0264,  0.0664,  0.0228,  0.0121,  0.0157,  0.0666,
         0.0247,  0.0063,  0.0186,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([3.0769e-01, 6.5772e-02, 8.3720e-03, 1.3977e-02, 6.2681e-02, 1.1236e-02,
        9.6758e-02, 1.4024e-02, 1.1643e-02, 2.0723e-02, 1.0866e-02, 1.0835e-02,
        7.1356e-03, 1.1753e-02, 3.0759e-04, 1.1842e-02, 1.2214e-01, 1.5957e-02,
        2.1560e-02, 8.0241e-02, 1.4975e-02, 1.9733e-02, 1.5088e-02, 1.7553e-02,
        8.9324e-03, 1.8204e-02, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([2.9560e-01, 4.9403e-02, 3.8473e-03, 1.1012e-02, 4.7386e-02, 6.9807e-03,
        9.2618e-02, 1.1679e-02, 1.1934e-02, 2.1961e-02, 8.1325e-03, 1.1640e-02,
        7.1308e-03, 1.2826e-02, 1.6257e-04, 1.2177e-02, 8.0686e-02, 2.3939e-02,
        1.5410e-02, 2.1856e-01, 1.4002e-02, 2.0292e-02, 9.2258e-03, 1.3402e-02,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2538, 0.1037, 0.0054, 0.0094, 0.0614, 0.0094, 0.0695, 0.0137, 0.0126,
        0.0142, 0.0105, 0.0116, 0.0081, 0.0162, 0.0024, 0.0112, 0.1154, 0.0300,
        0.0484, 0.0161, 0.1439, 0.0068, 0.0103, 0.0161, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2550: [tensor([0.2854, 0.1317, 0.0156, 0.0288, 0.0155, 0.0037, 0.1246, 0.0108, 0.0186,
        0.0059, 0.0085, 0.0563, 0.1764, 0.0216, 0.0143, 0.0374, 0.0269, 0.0179,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2882, 0.0292, 0.0199, 0.0237, 0.0104, 0.0320, 0.1685, 0.0366, 0.0086,
        0.0263, 0.0282, 0.0380, 0.0444, 0.0557, 0.0393, 0.0515, 0.0626, 0.0367,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2410, 0.0339, 0.0159, 0.0326, 0.0182, 0.0295, 0.2122, 0.0311, 0.0125,
        0.0299, 0.0749, 0.0491, 0.1534, 0.0298, 0.0358, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4089, 0.0257, 0.0203, 0.0211, 0.0160, 0.0244, 0.2148, 0.0306, 0.0089,
        0.0207, 0.0298, 0.0299, 0.0639, 0.0357, 0.0252, 0.0242, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2227, 0.0585, 0.0143, 0.0146, 0.1024, 0.0088, 0.0081, 0.0157, 0.0086,
        0.0639, 0.0016, 0.0142, 0.0122, 0.0280, 0.0067, 0.0022, 0.0103, 0.2674,
        0.0259, 0.0910, 0.0115, 0.0114, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.1768,  0.0673,  0.0085,  0.0090,  0.0685,  0.0074,  0.0101,  0.0148,
         0.0127,  0.0669,  0.0030,  0.0107,  0.0107,  0.0438,  0.0055, -0.0007,
         0.0086,  0.1577,  0.0201,  0.0657,  0.0122,  0.1949,  0.0122,  0.0123,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1946, 0.0590, 0.0172, 0.0121, 0.0780, 0.0123, 0.0082, 0.0197, 0.0063,
        0.0923, 0.0041, 0.0145, 0.0132, 0.0631, 0.0059, 0.0024, 0.0093, 0.2481,
        0.0185, 0.0986, 0.0121, 0.0103, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2513, 0.0097, 0.0115, 0.0175, 0.0410, 0.0085, 0.0164, 0.0081, 0.0063,
        0.0102, 0.0112, 0.0033, 0.0138, 0.0122, 0.0202, 0.0126, 0.1514, 0.0142,
        0.0121, 0.0265, 0.0328, 0.0867, 0.0085, 0.0787, 0.0667, 0.0149, 0.0277,
        0.0100, 0.0158], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1578, 0.0145, 0.0122, 0.0310, 0.0488, 0.0115, 0.0260, 0.0103, 0.0080,
        0.0154, 0.0217, 0.0073, 0.0180, 0.0151, 0.0127, 0.0207, 0.2171, 0.1136,
        0.0252, 0.0339, 0.0221, 0.0297, 0.0405, 0.0193, 0.0197, 0.0192, 0.0094,
        0.0193, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.4278, 0.0243, 0.0275, 0.0423, 0.0703, 0.0238, 0.0443, 0.0197, 0.0161,
        0.0166, 0.0359, 0.0094, 0.0291, 0.0286, 0.0324, 0.0378, 0.0617, 0.0172,
        0.0355, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2135, 0.0243, 0.0714, 0.0155, 0.0234, 0.0200, 0.0836, 0.0235, 0.0092,
        0.0154, 0.0819, 0.0488, 0.0733, 0.0345, 0.0169, 0.0489, 0.1366, 0.0378,
        0.0213, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3018, 0.0208, 0.0492, 0.0148, 0.0284, 0.0194, 0.0697, 0.0181, 0.0081,
        0.0144, 0.0697, 0.0078, 0.0115, 0.0311, 0.0267, 0.2005, 0.0447, 0.0136,
        0.0265, 0.0232, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2600: [tensor([0.2409, 0.0235, 0.0239, 0.0080, 0.0106, 0.0280, 0.0072, 0.0052, 0.0070,
        0.0288, 0.0099, 0.0037, 0.0086, 0.0048, 0.0030, 0.0073, 0.0109, 0.0196,
        0.0047, 0.0124, 0.0038, 0.0072, 0.0038, 0.0045, 0.0031, 0.0321, 0.0024,
        0.0099, 0.0140, 0.0055, 0.0069, 0.0082, 0.0110, 0.0020, 0.0274, 0.0295,
        0.0098, 0.0014, 0.0024, 0.0050, 0.0464, 0.0106, 0.1389, 0.0072, 0.0195,
        0.0984, 0.0150, 0.0058, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.2635, 0.0257, 0.0205, 0.0099, 0.0107, 0.0449, 0.0089, 0.0057, 0.0079,
        0.0271, 0.0080, 0.0021, 0.0069, 0.0061, 0.0015, 0.0084, 0.0129, 0.0249,
        0.0050, 0.0124, 0.0049, 0.0089, 0.0029, 0.0048, 0.0034, 0.0360, 0.0007,
        0.0089, 0.0110, 0.0026, 0.0078, 0.0061, 0.0126, 0.0017, 0.0390, 0.0222,
        0.0079, 0.0028, 0.0028, 0.0049, 0.0420, 0.0098, 0.1938, 0.0122, 0.0067,
        0.0096, 0.0088, 0.0053, 0.0069], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3215, 0.0165, 0.0288, 0.0634, 0.0146, 0.0205, 0.0205, 0.0345, 0.0299,
        0.0424, 0.0202, 0.0025, 0.0135, 0.0235, 0.0267, 0.1049, 0.0399, 0.0298,
        0.0237, 0.0450, 0.0235, 0.0342, 0.0201, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3132, 0.0139, 0.0250, 0.0561, 0.0132, 0.0144, 0.0180, 0.0277, 0.0176,
        0.0242, 0.0380, 0.0027, 0.0188, 0.0185, 0.0208, 0.1026, 0.0436, 0.0231,
        0.0182, 0.0209, 0.0194, 0.0281, 0.0642, 0.0362, 0.0215, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.3049, 0.0179, 0.0339, 0.0574, 0.0269, 0.0260, 0.0183, 0.0352, 0.0219,
        0.0327, 0.0262, 0.0078, 0.0158, 0.0211, 0.0292, 0.0718, 0.0533, 0.0313,
        0.0276, 0.0794, 0.0364, 0.0251, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1545, 0.0567, 0.0178, 0.0162, 0.0133, 0.0055, 0.0090, 0.0513, 0.0069,
        0.0463, 0.0081, 0.0030, 0.0088, 0.1568, 0.0210, 0.0992, 0.0217, 0.0201,
        0.1717, 0.0169, 0.0094, 0.0502, 0.0162, 0.0075, 0.0120, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1890, 0.0615, 0.0153, 0.0110, 0.0151, 0.0080, 0.0099, 0.0854, 0.0104,
        0.0694, 0.0072, 0.0031, 0.0078, 0.1793, 0.0161, 0.0782, 0.1488, 0.0580,
        0.0104, 0.0046, 0.0115, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1722, 0.0503, 0.0117, 0.0110, 0.0125, 0.0056, 0.0084, 0.0372, 0.0082,
        0.0607, 0.0055, 0.0021, 0.0064, 0.1316, 0.0103, 0.0706, 0.0101, 0.0305,
        0.0106, 0.1769, 0.0058, 0.0727, 0.0625, 0.0155, 0.0020, 0.0092, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.4325,  0.0473, -0.0012,  0.0367,  0.0628,  0.0948,  0.0187,  0.0304,
         0.0896,  0.0316,  0.0378,  0.0405,  0.0760,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.5049, 0.0417, 0.0261, 0.0392, 0.0615, 0.0810, 0.0217, 0.0284, 0.0655,
        0.0415, 0.0334, 0.0550, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.5021, 0.0326, 0.0158, 0.0250, 0.0595, 0.0724, 0.0199, 0.0450, 0.0570,
        0.0285, 0.0458, 0.0320, 0.0645, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1975, 0.0877, 0.0046, 0.0126, 0.0225, 0.0097, 0.0189, 0.0105, 0.0065,
        0.0107, 0.1554, 0.0080, 0.1192, 0.0176, 0.0140, 0.0903, 0.1419, 0.0098,
        0.0337, 0.0103, 0.0187, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #2650: [tensor([0.2164, 0.1632, 0.0076, 0.0050, 0.0370, 0.0206, 0.0109, 0.0242, 0.1249,
        0.0197, 0.0269, 0.0089, 0.0138, 0.0056, 0.0119, 0.0873, 0.0354, 0.0804,
        0.0271, 0.0225, 0.0189, 0.0103, 0.0216, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2241, 0.0551, 0.0024, 0.0016, 0.0143, 0.0107, 0.0080, 0.0112, 0.1334,
        0.0109, 0.0221, 0.0058, 0.0130, 0.0046, 0.0074, 0.2244, 0.0075, 0.0345,
        0.0226, 0.1153, 0.0299, 0.0059, 0.0160, 0.0085, 0.0109],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2063, 0.1339, 0.0074, 0.0037, 0.0256, 0.0229, 0.0079, 0.0235, 0.2013,
        0.0212, 0.0354, 0.0055, 0.0160, 0.0070, 0.0163, 0.0358, 0.1121, 0.0631,
        0.0269, 0.0120, 0.0161, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1215, 0.1220, 0.0290, 0.0371, 0.0106, 0.0098, 0.0130, 0.0165, 0.0211,
        0.0130, 0.0054, 0.0187, 0.2620, 0.0247, 0.0376, 0.0213, 0.0397, 0.0423,
        0.0817, 0.0415, 0.0084, 0.0229, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2808, 0.1627, 0.0193, 0.0251, 0.0084, 0.0071, 0.0070, 0.0114, 0.0221,
        0.0118, 0.0027, 0.0097, 0.2538, 0.0304, 0.0056, 0.0121, 0.0249, 0.0291,
        0.0146, 0.0279, 0.0154, 0.0058, 0.0122, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.3024, 0.0922, 0.0222, 0.0368, 0.0074, 0.0069, 0.0082, 0.0147, 0.0195,
        0.0099, 0.0026, 0.0130, 0.0294, 0.0381, 0.0205, 0.0119, 0.0196, 0.0166,
        0.2448, 0.0223, 0.0356, 0.0047, 0.0208, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2458, 0.0956, 0.0151, 0.0057, 0.0126, 0.0260, 0.0922, 0.0134, 0.0815,
        0.1099, 0.0150, 0.0141, 0.0541, 0.0142, 0.0058, 0.0114, 0.0793, 0.0619,
        0.0177, 0.0133, 0.0153, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2702, 0.1157, 0.0100, 0.0083, 0.0132, 0.0182, 0.0850, 0.0102, 0.0646,
        0.0811, 0.0079, 0.0078, 0.0524, 0.0141, 0.0029, 0.0090, 0.0991, 0.0114,
        0.0962, 0.0090, 0.0138, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1222, 0.1277, 0.0102, 0.0072, 0.0139, 0.0186, 0.0717, 0.0132, 0.0506,
        0.1526, 0.0155, 0.0068, 0.0682, 0.0127, 0.0038, 0.0115, 0.0612, 0.1747,
        0.0189, 0.0228, 0.0163, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2823, 0.0422, 0.0057, 0.0837, 0.0128, 0.0335, 0.0064, 0.0035, 0.0503,
        0.0100, 0.0040, 0.0113, 0.0846, 0.0061, 0.0246, 0.0847, 0.0271, 0.0513,
        0.0720, 0.0074, 0.0218, 0.0194, 0.0224, 0.0113, 0.0214],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1206, 0.0373, 0.0062, 0.0429, 0.0100, 0.0268, 0.0040, 0.0039, 0.0346,
        0.0113, 0.0014, 0.0098, 0.1048, 0.0081, 0.0618, 0.0169, 0.4798, 0.0076,
        0.0124, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2918, 0.0563, 0.0072, 0.0891, 0.0130, 0.0536, 0.0059, 0.0035, 0.0560,
        0.0158, 0.0027, 0.0097, 0.1029, 0.0099, 0.0998, 0.0169, 0.0270, 0.0310,
        0.0319, 0.0204, 0.0086, 0.0193, 0.0097, 0.0181, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2700: [tensor([0.1585, 0.0568, 0.0124, 0.0427, 0.0065, 0.0056, 0.0320, 0.0071, 0.0169,
        0.0351, 0.0049, 0.0121, 0.0071, 0.0068, 0.0084, 0.0071, 0.0045, 0.0122,
        0.0087, 0.1020, 0.0087, 0.0107, 0.0153, 0.0243, 0.0280, 0.1644, 0.0103,
        0.0023, 0.0095, 0.0124, 0.0325, 0.0112, 0.0165, 0.0620, 0.0346, 0.0100,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 2.0580e-01,  6.4355e-02,  8.1817e-03,  5.8967e-02,  3.5301e-03,
         5.2466e-03,  3.5075e-02,  6.0424e-03,  1.5145e-02,  3.6738e-02,
         3.5151e-03,  1.4237e-02,  7.7493e-03,  7.6196e-03,  6.6239e-03,
         3.4823e-03,  4.7072e-03,  1.2872e-02,  6.7712e-03,  6.3096e-02,
         7.5877e-03,  7.2309e-03,  1.6611e-02,  1.6197e-02,  2.8137e-02,
         1.1811e-01,  5.9385e-03, -1.3307e-04,  7.0052e-03,  1.2535e-01,
         1.1510e-02,  3.9040e-02,  1.0054e-02,  4.4070e-03,  1.7550e-02,
         4.1054e-03,  1.1282e-02,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1421, 0.0587, 0.0225, 0.0481, 0.0053, 0.0054, 0.0464, 0.0078, 0.0168,
        0.0345, 0.0045, 0.0104, 0.0082, 0.0072, 0.0087, 0.0052, 0.0064, 0.0144,
        0.0114, 0.0659, 0.0124, 0.0086, 0.0181, 0.0147, 0.0432, 0.0868, 0.0041,
        0.0016, 0.0068, 0.0146, 0.0534, 0.1865, 0.0112, 0.0084, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1644, -0.0671, -0.0095, -0.0336, -0.0060, -0.0050, -0.0376, -0.0044,
        -0.0111, -0.0287, -0.0045, -0.0082, -0.0062, -0.0073, -0.0067, -0.0045,
        -0.0063, -0.0140, -0.0072, -0.1100, -0.0066, -0.0077, -0.0104, -0.0139,
        -0.0347, -0.0802, -0.0037, -0.0009, -0.0074, -0.0529, -0.0135, -0.0345,
        -0.0082, -0.0175, -0.1262, -0.0126, -0.0107, -0.0062, -0.0100,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1645, 0.0370, 0.0096, 0.0352, 0.0054, 0.0054, 0.0316, 0.0060, 0.0096,
        0.0256, 0.0041, 0.0128, 0.0076, 0.0032, 0.0046, 0.0050, 0.0047, 0.0114,
        0.0084, 0.0679, 0.0044, 0.0049, 0.0097, 0.0168, 0.0338, 0.0688, 0.0044,
        0.0031, 0.0061, 0.0352, 0.0108, 0.0111, 0.0610, 0.0055, 0.0106, 0.0146,
        0.2105, 0.0197, 0.0026, 0.0071, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1673, 0.0414, 0.0092, 0.0345, 0.0029, 0.0060, 0.0331, 0.0051, 0.0127,
        0.0275, 0.0039, 0.0134, 0.0055, 0.0051, 0.0067, 0.0060, 0.0044, 0.0102,
        0.0074, 0.0899, 0.0074, 0.0069, 0.0117, 0.0225, 0.0362, 0.0646, 0.0060,
        0.0021, 0.0076, 0.0413, 0.0145, 0.0358, 0.0071, 0.1661, 0.0069, 0.0131,
        0.0056, 0.0051, 0.0131, 0.0084, 0.0096, 0.0044, 0.0118],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1707, -0.0556, -0.0116, -0.0399, -0.0048, -0.0086, -0.0465, -0.0063,
        -0.0173, -0.0316, -0.0051, -0.0172, -0.0082, -0.0075, -0.0104, -0.0051,
        -0.0077, -0.0129, -0.0094, -0.1381, -0.0108, -0.0083, -0.0114, -0.0157,
        -0.0438, -0.0820, -0.0088, -0.0042, -0.0072, -0.0307, -0.0270, -0.0267,
        -0.0118, -0.0615, -0.0085, -0.0099, -0.0069, -0.0099,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1468, 0.0622, 0.0115, 0.0412, 0.0063, 0.0082, 0.0332, 0.0074, 0.0135,
        0.0361, 0.0073, 0.0199, 0.0081, 0.0071, 0.0077, 0.0085, 0.0063, 0.0151,
        0.0086, 0.0759, 0.0100, 0.0127, 0.0210, 0.0182, 0.0379, 0.0972, 0.0089,
        0.0022, 0.0073, 0.1226, 0.0132, 0.0116, 0.0689, 0.0127, 0.0116, 0.0131,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2318, 0.0610, 0.0098, 0.0309, 0.0042, 0.0054, 0.0300, 0.0069, 0.0147,
        0.0394, 0.0043, 0.0169, 0.0106, 0.0055, 0.0072, 0.0044, 0.0072, 0.0098,
        0.0091, 0.0873, 0.0087, 0.0087, 0.0168, 0.0178, 0.0312, 0.0782, 0.0052,
        0.0042, 0.0078, 0.1234, 0.0142, 0.0414, 0.0051, 0.0191, 0.0093, 0.0123,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1512, -0.0372, -0.0086, -0.0258, -0.0015, -0.0066, -0.0183, -0.0059,
        -0.0099, -0.0247, -0.0038, -0.0109, -0.0073, -0.0043, -0.0064, -0.0033,
        -0.0028, -0.0092, -0.0058, -0.0880, -0.0055, -0.0077, -0.0101, -0.0099,
        -0.0280, -0.1361, -0.0040, -0.0017, -0.0041, -0.0162, -0.0328, -0.0133,
        -0.0061, -0.0301, -0.2400, -0.0166, -0.0065,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1259, 0.1383, 0.0213, 0.0312, 0.1104, 0.0237, 0.0190, 0.0095, 0.0192,
        0.0238, 0.0346, 0.0717, 0.0317, 0.0266, 0.1786, 0.0278, 0.0609, 0.0222,
        0.0237, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2998, 0.1452, 0.0266, 0.0504, 0.0914, 0.0313, 0.0324, 0.0119, 0.0209,
        0.0315, 0.0325, 0.0707, 0.0546, 0.0490, 0.0168, 0.0349, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2750: [tensor([0.1331, 0.0572, 0.0091, 0.0090, 0.0743, 0.0067, 0.0041, 0.0244, 0.0146,
        0.0780, 0.0078, 0.0070, 0.0076, 0.0072, 0.0120, 0.0221, 0.0146, 0.0139,
        0.0022, 0.0026, 0.0065, 0.1581, 0.0118, 0.0071, 0.2806, 0.0120, 0.0079,
        0.0086, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0176, -0.0726, -0.0106, -0.0106, -0.0922, -0.0074, -0.0077, -0.0288,
        -0.0226, -0.1182, -0.0109, -0.0083, -0.0076, -0.0085, -0.0173, -0.0217,
        -0.0161, -0.0153, -0.0053, -0.0033, -0.0063, -0.1556, -0.0144, -0.0127,
        -0.0286, -0.0222, -0.0858, -0.0168, -0.0723, -0.0577, -0.0087, -0.0066,
        -0.0096,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-9.8026e-02, -2.7983e-02, -7.2253e-03, -6.3254e-03, -3.6847e-02,
        -6.3781e-03, -2.5243e-03, -6.9824e-03, -7.5013e-03, -7.9026e-03,
        -4.8385e-03, -3.6781e-02, -2.2193e-03, -5.5588e-03, -5.4703e-03,
        -8.7512e-02, -9.1601e-03, -1.1791e-02, -2.9000e-03, -9.5569e-03,
        -4.2649e-03, -8.0571e-04, -1.7389e-03, -1.0778e-02, -7.5605e-05,
        -4.9485e-03, -3.0040e-01, -8.1918e-03, -9.0828e-03, -9.2043e-02,
        -5.8009e-03, -3.3015e-03, -8.7529e-02, -5.3048e-03, -1.5896e-02,
        -4.1696e-03, -1.3488e-02, -8.6567e-03, -5.3463e-03, -6.5521e-03,
        -1.5118e-02, -5.5378e-03, -7.4865e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1168, -0.0604, -0.0146, -0.0094, -0.0871, -0.0092, -0.0069, -0.0125,
        -0.0142, -0.0101, -0.0055, -0.0738, -0.0087, -0.0063, -0.0101, -0.1561,
        -0.0153, -0.0258, -0.0054, -0.0101, -0.0084, -0.0037, -0.0055, -0.0164,
        -0.0046, -0.0068, -0.0383, -0.0730, -0.0206, -0.0083, -0.0778, -0.0148,
        -0.0112, -0.0037, -0.0250, -0.0101, -0.0135,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([1.7957e-01, 5.2041e-02, 1.1132e-02, 7.8263e-03, 4.4314e-02, 8.0571e-03,
        3.5509e-03, 8.7810e-03, 7.0666e-03, 1.1701e-02, 4.6356e-03, 5.9480e-02,
        4.4898e-03, 6.1742e-03, 8.4739e-03, 7.0620e-02, 1.1618e-02, 1.6297e-02,
        2.4686e-03, 1.5236e-02, 8.0479e-03, 1.5916e-03, 5.4803e-03, 1.0517e-02,
        1.4360e-05, 6.0373e-03, 3.3778e-01, 8.7839e-03, 2.2989e-02, 1.3881e-02,
        1.5241e-02, 5.8971e-03, 1.5900e-02, 3.2879e-03, 1.1018e-02, 0.0000e+00,
        0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00, 0.0000e+00,
        0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2188, -0.0770, -0.0172, -0.0089, -0.0992, -0.0108, -0.0050, -0.0153,
        -0.0157, -0.0127, -0.0090, -0.0782, -0.0066, -0.0094, -0.0122, -0.1440,
        -0.0170, -0.0219, -0.0051, -0.0188, -0.0123, -0.0018, -0.0076, -0.0156,
        -0.0027, -0.0102, -0.0181, -0.0165, -0.0197, -0.0172, -0.0117, -0.0168,
        -0.0190, -0.0067, -0.0213,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1740, 0.0482, 0.0070, 0.0078, 0.0422, 0.0059, 0.0033, 0.0093, 0.0086,
        0.0076, 0.0051, 0.0400, 0.0038, 0.0055, 0.0088, 0.0529, 0.0101, 0.0111,
        0.0028, 0.0100, 0.0054, 0.0019, 0.0041, 0.0090, 0.0018, 0.0056, 0.1885,
        0.0107, 0.1025, 0.0092, 0.0086, 0.1408, 0.0065, 0.0086, 0.0049, 0.0157,
        0.0045, 0.0076, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1986, 0.0528, 0.0124, 0.0099, 0.0552, 0.0074, 0.0028, 0.0115, 0.0096,
        0.0105, 0.0040, 0.0649, 0.0074, 0.0049, 0.0109, 0.1178, 0.0093, 0.0172,
        0.0032, 0.0110, 0.0085, 0.0011, 0.0054, 0.0132, 0.0021, 0.0068, 0.0806,
        0.0142, 0.0128, 0.0497, 0.0125, 0.0118, 0.0049, 0.0079, 0.0649, 0.0241,
        0.0152, 0.0115, 0.0126, 0.0085, 0.0104, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2228, -0.0584, -0.0129, -0.0089, -0.0785, -0.0091, -0.0071, -0.0128,
        -0.0124, -0.0101, -0.0069, -0.0554, -0.0039, -0.0085, -0.0095, -0.1436,
        -0.0186, -0.0194, -0.0034, -0.0145, -0.0067, -0.0008, -0.0057, -0.0144,
        -0.0034, -0.0083, -0.0266, -0.0257, -0.1639, -0.0139, -0.0044, -0.0094,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.0857, 0.0646, 0.0116, 0.0098, 0.0418, 0.0092, 0.0042, 0.0107, 0.0083,
        0.0073, 0.0054, 0.0608, 0.0032, 0.0062, 0.0090, 0.0913, 0.0115, 0.0158,
        0.0034, 0.0111, 0.0103, 0.0036, 0.0049, 0.0123, 0.0021, 0.0069, 0.3318,
        0.0075, 0.0068, 0.0754, 0.0267, 0.0228, 0.0089, 0.0091, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1536, 0.0694, 0.0098, 0.0065, 0.0612, 0.0052, 0.0032, 0.0102, 0.0059,
        0.0112, 0.0055, 0.0316, 0.0036, 0.0055, 0.0073, 0.0670, 0.0148, 0.0191,
        0.0050, 0.0109, 0.0077, 0.0009, 0.0059, 0.0138, 0.0006, 0.0058, 0.3243,
        0.0167, 0.0703, 0.0159, 0.0176, 0.0044, 0.0098, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1169, 0.0356, 0.0049, 0.0063, 0.0460, 0.0047, 0.0034, 0.0068, 0.0066,
        0.0067, 0.0041, 0.0266, 0.0030, 0.0043, 0.0080, 0.0651, 0.0071, 0.0128,
        0.0019, 0.0087, 0.0039, 0.0020, 0.0030, 0.0079, 0.0010, 0.0050, 0.1257,
        0.0087, 0.0140, 0.0037, 0.0122, 0.0092, 0.0766, 0.0057, 0.0140, 0.2864,
        0.0045, 0.0052, 0.0087, 0.0136, 0.0024, 0.0073, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2800: [tensor([0.0823, 0.0123, 0.0270, 0.0788, 0.0106, 0.0035, 0.0206, 0.0153, 0.1314,
        0.0222, 0.0091, 0.0050, 0.0119, 0.0165, 0.0231, 0.1263, 0.0277, 0.0088,
        0.0273, 0.0251, 0.2510, 0.0013, 0.0166, 0.0229, 0.0067, 0.0166, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1796, 0.0115, 0.0085, 0.0489, 0.0081, 0.0047, 0.0131, 0.0138, 0.0763,
        0.0131, 0.0082, 0.0036, 0.0100, 0.0164, 0.0194, 0.1083, 0.0133, 0.0211,
        0.0149, 0.3534, 0.0150, 0.0151, 0.0094, 0.0143, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.0718, 0.0325, 0.2793, 0.0230, 0.0266, 0.0158, 0.0195, 0.0064, 0.0188,
        0.1477, 0.0316, 0.1305, 0.0463, 0.0200, 0.0417, 0.0322, 0.0226, 0.0335,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0994, -0.0378, -0.2345, -0.0181, -0.0269, -0.0126, -0.0299, -0.0087,
        -0.0186, -0.1768, -0.0338, -0.1728, -0.0329, -0.0506, -0.0151, -0.0314,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1769, 0.0183, 0.1136, 0.0105, 0.0149, 0.0098, 0.0138, 0.0046, 0.0107,
        0.0658, 0.0160, 0.0817, 0.1568, 0.0263, 0.0281, 0.2198, 0.0140, 0.0080,
        0.0106, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0865, -0.0585, -0.0176, -0.0039, -0.0074, -0.0071, -0.0050, -0.0142,
        -0.0069, -0.0638, -0.0094, -0.0120, -0.0459, -0.0396, -0.0155, -0.0055,
        -0.0044, -0.0094, -0.0106, -0.0061, -0.0102, -0.0070, -0.0374, -0.0150,
        -0.0229, -0.0090, -0.0115, -0.0040, -0.0081, -0.2042, -0.0105, -0.0228,
        -0.1624, -0.0213, -0.0074, -0.0171], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1335, 0.0878, 0.0116, 0.0033, 0.0074, 0.0062, 0.0036, 0.0119, 0.0062,
        0.0959, 0.0058, 0.0078, 0.0459, 0.0373, 0.0134, 0.0042, 0.0050, 0.0083,
        0.0066, 0.0045, 0.0092, 0.0049, 0.0343, 0.0096, 0.0247, 0.0062, 0.0062,
        0.0032, 0.0067, 0.1483, 0.0111, 0.0146, 0.1851, 0.0067, 0.0123, 0.0104],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1752, 0.0374, 0.0271, 0.0045, 0.0071, 0.0073, 0.0037, 0.0113, 0.0054,
        0.0826, 0.0061, 0.0104, 0.0453, 0.0403, 0.0155, 0.0045, 0.0046, 0.0067,
        0.0083, 0.0045, 0.0105, 0.0079, 0.0341, 0.0111, 0.0186, 0.0098, 0.0060,
        0.0035, 0.0055, 0.1179, 0.0091, 0.0172, 0.0882, 0.1250, 0.0169, 0.0110],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1573, -0.0265, -0.0235, -0.0334, -0.0140, -0.0153, -0.0167, -0.0231,
        -0.0187, -0.0287, -0.0213, -0.0089, -0.0211, -0.1661, -0.0293, -0.3286,
        -0.0202, -0.0190, -0.0283,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1730, 0.0243, 0.0199, 0.0196, 0.0098, 0.0090, 0.0196, 0.0157, 0.0180,
        0.0186, 0.0155, 0.0078, 0.0137, 0.1365, 0.0133, 0.3002, 0.0567, 0.0174,
        0.0280, 0.0493, 0.0162, 0.0180, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2365, -0.0267, -0.0198, -0.0243, -0.0172, -0.0122, -0.0258, -0.0218,
        -0.0080, -0.0175, -0.0181, -0.0100, -0.0200, -0.1500, -0.0295, -0.2533,
        -0.0593, -0.0147, -0.0352,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1383, 0.1825, 0.0443, 0.0290, 0.0186, 0.1445, 0.0176, 0.0264, 0.0118,
        0.0191, 0.0310, 0.2579, 0.0455, 0.0335, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2850: [tensor([-0.1345, -0.1296, -0.0116, -0.0152, -0.0101, -0.0594, -0.0084, -0.0255,
        -0.0058, -0.0082, -0.0661, -0.0180, -0.0617, -0.0118, -0.0255, -0.3314,
        -0.0306, -0.0320, -0.0144,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1993, -0.2337, -0.0248, -0.0267, -0.0369, -0.1021, -0.0177, -0.0403,
        -0.0163, -0.0272, -0.0624, -0.1054, -0.0508, -0.0347, -0.0217,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1885, 0.0045, 0.0131, 0.0136, 0.0158, 0.0295, 0.0053, 0.0032, 0.0551,
        0.0072, 0.0142, 0.0064, 0.0024, 0.0113, 0.0267, 0.0069, 0.0641, 0.0380,
        0.0139, 0.0224, 0.0732, 0.0050, 0.0015, 0.0076, 0.0066, 0.0343, 0.0523,
        0.0092, 0.0029, 0.0066, 0.0142, 0.0113, 0.0170, 0.1009, 0.0214, 0.0103,
        0.0587, 0.0127, 0.0120], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1544, -0.0054, -0.0153, -0.0099, -0.0149, -0.0280, -0.0044, -0.0050,
        -0.0468, -0.0116, -0.0161, -0.0072, -0.0047, -0.0074, -0.0359, -0.0069,
        -0.0725, -0.0367, -0.0182, -0.0222, -0.0744, -0.0049, -0.0021, -0.0085,
        -0.0107, -0.0290, -0.0406, -0.0072, -0.0045, -0.0071, -0.0075, -0.0123,
        -0.0899, -0.0138, -0.0582, -0.0785, -0.0156, -0.0115,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2521, -0.0056, -0.0138, -0.0136, -0.0157, -0.0205, -0.0070, -0.0037,
        -0.0416, -0.0108, -0.0157, -0.0068, -0.0036, -0.0089, -0.0383, -0.0138,
        -0.0811, -0.0393, -0.0158, -0.0259, -0.0522, -0.0044, -0.0020, -0.0066,
        -0.0087, -0.0312, -0.0516, -0.0129, -0.0045, -0.0074, -0.0151, -0.0241,
        -0.0161, -0.0431, -0.0236, -0.0187, -0.0263, -0.0059, -0.0121],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1381, -0.0626, -0.0074, -0.0440, -0.0865, -0.0049, -0.0063, -0.0070,
        -0.0412, -0.0082, -0.0171, -0.0148, -0.0131, -0.0067, -0.0110, -0.0047,
        -0.0845, -0.0044, -0.0009, -0.0044, -0.0080, -0.0682, -0.0101, -0.0778,
        -0.0189, -0.2000, -0.0219, -0.0104, -0.0076, -0.0095,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.5229e-01, -1.0423e-01, -9.4857e-03, -6.3959e-02, -8.8905e-02,
        -4.9733e-03, -5.2208e-03, -7.1483e-03, -5.6205e-02, -9.2642e-03,
        -1.9494e-02, -1.5585e-02, -1.6742e-02, -6.5161e-03, -1.5302e-02,
        -7.0012e-03, -1.0030e-01, -5.0004e-03,  5.7670e-05, -5.0275e-03,
        -7.7674e-03, -8.7693e-02, -2.5024e-02, -2.2624e-02, -1.2798e-02,
        -1.1320e-01, -1.2820e-02, -9.1599e-03, -1.6214e-02,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1539, -0.0808, -0.0097, -0.0474, -0.0896, -0.0052, -0.0045, -0.0045,
        -0.0330, -0.0070, -0.0169, -0.0144, -0.0148, -0.0136, -0.0136, -0.0057,
        -0.0860, -0.0051, -0.0030, -0.0026, -0.0070, -0.0092, -0.0426, -0.0612,
        -0.0252, -0.0574, -0.0223, -0.0910, -0.0200, -0.0222, -0.0116, -0.0066,
        -0.0125,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1667, -0.1151, -0.0160, -0.0157, -0.0060, -0.0473, -0.0192, -0.0391,
        -0.0537, -0.0174, -0.0164, -0.0144, -0.0149, -0.0100, -0.0012, -0.0063,
        -0.0134, -0.3433, -0.0118, -0.0353, -0.0223, -0.0036, -0.0109,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1648, 0.1035, 0.0211, 0.0134, 0.0037, 0.0548, 0.0181, 0.0367, 0.0454,
        0.0133, 0.0201, 0.0170, 0.0208, 0.0232, 0.0058, 0.0058, 0.0114, 0.2386,
        0.0103, 0.0340, 0.0248, 0.0026, 0.0841, 0.0101, 0.0166, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1669, 0.0984, 0.0164, 0.0126, 0.0058, 0.0393, 0.0166, 0.0497, 0.0337,
        0.0155, 0.0201, 0.0147, 0.0189, 0.0179, 0.0053, 0.0044, 0.0121, 0.0215,
        0.0396, 0.2987, 0.0116, 0.0232, 0.0168, 0.0286, 0.0115, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1785, -0.0146, -0.0202, -0.0208, -0.0094, -0.0149, -0.0447, -0.0100,
        -0.0177, -0.0570, -0.0083, -0.0176, -0.0451, -0.0183, -0.0100, -0.0571,
        -0.0328, -0.0150, -0.0536, -0.0254, -0.0083, -0.0045, -0.0105, -0.1212,
        -0.0133, -0.0246, -0.0178, -0.0262, -0.0070, -0.0174, -0.0242, -0.0401,
        -0.0138,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #2900: [tensor([0.2189, 0.1727, 0.0237, 0.0210, 0.0206, 0.0100, 0.0361, 0.0727, 0.0148,
        0.0312, 0.0141, 0.0166, 0.0880, 0.0297, 0.0073, 0.0114, 0.0715, 0.0247,
        0.0268, 0.0327, 0.0417, 0.0136, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1397, 0.2691, 0.0165, 0.0347, 0.0235, 0.0103, 0.0412, 0.0716, 0.0220,
        0.0313, 0.0165, 0.0135, 0.0983, 0.0306, 0.0048, 0.0193, 0.0544, 0.0143,
        0.0138, 0.0271, 0.0256, 0.0218, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1866, -0.0699, -0.0098, -0.0088, -0.0098, -0.0041, -0.0140, -0.0249,
        -0.0102, -0.0146, -0.0051, -0.0071, -0.0315, -0.0139, -0.0016, -0.0093,
        -0.3529, -0.0215, -0.0089, -0.0113, -0.0451, -0.0114, -0.0234, -0.0116,
        -0.0639, -0.0108, -0.0068, -0.0112,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.0690, 0.0299, 0.0042, 0.0051, 0.0052, 0.0031, 0.0089, 0.0207, 0.0079,
        0.0075, 0.0038, 0.0031, 0.0202, 0.0064, 0.0009, 0.0049, 0.3493, 0.0086,
        0.0086, 0.0103, 0.0156, 0.0973, 0.0139, 0.0360, 0.2316, 0.0157, 0.0036,
        0.0086, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0856, -0.0698, -0.0063, -0.0105, -0.0087, -0.0034, -0.0133, -0.0317,
        -0.0093, -0.0066, -0.0062, -0.0057, -0.0370, -0.0161, -0.0016, -0.0082,
        -0.0935, -0.0218, -0.0712, -0.0110, -0.0051, -0.0174, -0.4147, -0.0123,
        -0.0143, -0.0064, -0.0124,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1791, 0.0807, 0.0108, 0.0109, 0.0075, 0.0040, 0.0106, 0.0313, 0.0090,
        0.0143, 0.0060, 0.0065, 0.0337, 0.0114, 0.0025, 0.0071, 0.4031, 0.0204,
        0.0131, 0.0129, 0.0062, 0.0193, 0.0156, 0.0137, 0.0478, 0.0113, 0.0114,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.2241, 0.2347, 0.0180, 0.0206, 0.0178, 0.0085, 0.0328, 0.0747, 0.0265,
        0.0319, 0.0152, 0.0149, 0.0756, 0.0298, 0.0056, 0.0182, 0.0332, 0.0275,
        0.0227, 0.0513, 0.0168, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1362, -0.1086, -0.0088, -0.0110, -0.0121, -0.0029, -0.0178, -0.0408,
        -0.0133, -0.0136, -0.0053, -0.0103, -0.0385, -0.0180, -0.0030, -0.0090,
        -0.1099, -0.0181, -0.1179, -0.0363, -0.2284, -0.0198, -0.0083, -0.0121,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1194, -0.0592, -0.0082, -0.0069, -0.0051, -0.0028, -0.0119, -0.0316,
        -0.0092, -0.0108, -0.0060, -0.0050, -0.0358, -0.0138, -0.0018, -0.0055,
        -0.4244, -0.0114, -0.0565, -0.0125, -0.0044, -0.0076, -0.0108, -0.0220,
        -0.0893, -0.0078, -0.0063, -0.0138,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.1187, 0.0696, 0.0052, 0.0054, 0.0050, 0.0020, 0.0115, 0.0194, 0.0057,
        0.0076, 0.0037, 0.0047, 0.0213, 0.0072, 0.0017, 0.0059, 0.3918, 0.0090,
        0.0077, 0.0622, 0.0094, 0.0058, 0.0497, 0.0122, 0.0049, 0.0061, 0.1283,
        0.0072, 0.0045, 0.0065, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1220, 0.1117, 0.0129, 0.0144, 0.0128, 0.0071, 0.0331, 0.0518, 0.0174,
        0.0232, 0.0096, 0.0136, 0.0778, 0.0209, 0.0037, 0.0151, 0.1720, 0.0291,
        0.1204, 0.0746, 0.0315, 0.0049, 0.0205, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1243, -0.0746, -0.0099, -0.0120, -0.0050, -0.0036, -0.0161, -0.0391,
        -0.0138, -0.0117, -0.0071, -0.0093, -0.0347, -0.0121, -0.0014, -0.0086,
        -0.0877, -0.0080, -0.0238, -0.0148, -0.0058, -0.0131, -0.0866, -0.0495,
        -0.0143, -0.0228, -0.0982, -0.0271, -0.0140, -0.0038, -0.0080, -0.0103,
        -0.0107, -0.0827, -0.0111, -0.0099, -0.0147], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #2950: [tensor([-0.0948, -0.0428, -0.0098, -0.0320, -0.0042, -0.0028, -0.0108, -0.0169,
        -0.0069, -0.0100, -0.0363, -0.0034, -0.0044, -0.0051, -0.0016, -0.0076,
        -0.0096, -0.0041, -0.0228, -0.0672, -0.0018, -0.0134, -0.0010, -0.0017,
        -0.0028, -0.3322, -0.0108, -0.1258, -0.0198, -0.0809, -0.0075, -0.0025,
        -0.0065,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0974, -0.0723, -0.0084, -0.0463, -0.0066, -0.0025, -0.0155, -0.0199,
        -0.0078, -0.0120, -0.0523, -0.0044, -0.0059, -0.0102, -0.0043, -0.0094,
        -0.0120, -0.0037, -0.0299, -0.0837, -0.0020, -0.0208, -0.0035, -0.0029,
        -0.0057, -0.0650, -0.0143, -0.0913, -0.0147, -0.2414, -0.0135, -0.0072,
        -0.0056, -0.0077,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1207, -0.0534, -0.0080, -0.0378, -0.0090, -0.0032, -0.0123, -0.0251,
        -0.0115, -0.0161, -0.0575, -0.0048, -0.0064, -0.0070, -0.0051, -0.0111,
        -0.0130, -0.0073, -0.0259, -0.0839, -0.0028, -0.0155, -0.0034, -0.0027,
        -0.0054, -0.0129, -0.1063, -0.0147, -0.0071, -0.0179, -0.2270, -0.0093,
        -0.0162, -0.0190, -0.0080, -0.0039, -0.0089,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1701, -0.0648, -0.0074, -0.0434, -0.0051, -0.0035, -0.0094, -0.0181,
        -0.0080, -0.0107, -0.0357, -0.0034, -0.0070, -0.0050, -0.0020, -0.0075,
        -0.0108, -0.0059, -0.0266, -0.0912, -0.0016, -0.0128, -0.0016, -0.0011,
        -0.0036, -0.1889, -0.0109, -0.0888, -0.0043, -0.0070, -0.1259, -0.0062,
        -0.0042, -0.0073,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1268, -0.0599, -0.0105, -0.0635, -0.0047, -0.0037, -0.0192, -0.0262,
        -0.0097, -0.0140, -0.0543, -0.0034, -0.0058, -0.0067, -0.0035, -0.0095,
        -0.0150, -0.0067, -0.0393, -0.2108, -0.0028, -0.0227, -0.0050, -0.0015,
        -0.0058, -0.0188, -0.1618, -0.0243, -0.0124, -0.0107, -0.0141, -0.0178,
        -0.0090,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1132, -0.1263, -0.0112, -0.0526, -0.0076, -0.0045, -0.0162, -0.0334,
        -0.0104, -0.0136, -0.0831, -0.0049, -0.0065, -0.0084, -0.0048, -0.0125,
        -0.0100, -0.0052, -0.0338, -0.1678, -0.0035, -0.0188, -0.0035, -0.0036,
        -0.0066, -0.0678, -0.0140, -0.1236, -0.0143, -0.0111, -0.0072,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1177, 0.0744, 0.0080, 0.0499, 0.0080, 0.0026, 0.0133, 0.0218, 0.0145,
        0.0116, 0.0424, 0.0033, 0.0057, 0.0073, 0.0048, 0.0087, 0.0108, 0.0038,
        0.0256, 0.0759, 0.0012, 0.0181, 0.0031, 0.0027, 0.0057, 0.0531, 0.0132,
        0.1091, 0.0056, 0.0166, 0.1404, 0.0087, 0.0092, 0.0090, 0.0142, 0.0329,
        0.0111, 0.0228, 0.0064, 0.0066], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.0749, 0.0414, 0.0074, 0.0081, 0.0685, 0.0046, 0.0029, 0.0032, 0.0051,
        0.0040, 0.0040, 0.0066, 0.0059, 0.0030, 0.0036, 0.0228, 0.0331, 0.0118,
        0.0025, 0.0050, 0.0695, 0.0103, 0.1125, 0.0128, 0.4559, 0.0076, 0.0052,
        0.0080, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([0.0985, 0.0518, 0.0071, 0.0138, 0.0606, 0.0068, 0.0047, 0.0036, 0.0050,
        0.0081, 0.0051, 0.0072, 0.0067, 0.0055, 0.0049, 0.0503, 0.0414, 0.0147,
        0.0039, 0.0058, 0.1062, 0.0102, 0.1155, 0.0166, 0.3080, 0.0104, 0.0090,
        0.0045, 0.0141, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1082, -0.0874, -0.0159, -0.0172, -0.0992, -0.0133, -0.0050, -0.0034,
        -0.0081, -0.0093, -0.0083, -0.0101, -0.0086, -0.0084, -0.0052, -0.0608,
        -0.0617, -0.0204, -0.0032, -0.0101, -0.1847, -0.0147, -0.1994, -0.0102,
        -0.0081, -0.0193,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0775, -0.0493, -0.0054, -0.0544, -0.0119, -0.0307, -0.0089, -0.0064,
        -0.0282, -0.0137, -0.0046, -0.0125, -0.1918, -0.0081, -0.0052, -0.0024,
        -0.0061, -0.1540, -0.0063, -0.0909, -0.0183, -0.1710, -0.0081, -0.0134,
        -0.0083, -0.0046, -0.0081,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1211, -0.0418, -0.0056, -0.0339, -0.0089, -0.0381, -0.0068, -0.0044,
        -0.0262, -0.0094, -0.0047, -0.0103, -0.0554, -0.0062, -0.0045, -0.0037,
        -0.0083, -0.2204, -0.0073, -0.1171, -0.0167, -0.2191, -0.0114, -0.0075,
        -0.0045, -0.0066,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3000: [tensor([-0.0780, -0.0794, -0.0081, -0.0606, -0.0155, -0.0083, -0.0134, -0.0028,
        -0.0077, -0.5752, -0.0092, -0.0873, -0.0245, -0.0093, -0.0072, -0.0136,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0859, -0.0681, -0.0083, -0.0566, -0.0148, -0.0069, -0.0118, -0.0023,
        -0.0072, -0.4419, -0.0104, -0.0515, -0.0170, -0.0160, -0.1697, -0.0081,
        -0.0080, -0.0153,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1018, 0.0690, 0.0103, 0.0064, 0.0079, 0.0053, 0.0095, 0.0022, 0.0057,
        0.1176, 0.0075, 0.0151, 0.0174, 0.0100, 0.0132, 0.1128, 0.0113, 0.0077,
        0.0025, 0.0054, 0.1673, 0.0163, 0.2458, 0.0188, 0.0046, 0.0083, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1082, -0.0336, -0.0054, -0.0055, -0.0053, -0.0034, -0.0070, -0.0012,
        -0.0042, -0.0446, -0.0027, -0.0077, -0.0101, -0.0055, -0.0102, -0.0837,
        -0.0065, -0.0049, -0.0024, -0.0035, -0.1182, -0.0074, -0.0800, -0.0061,
        -0.3899, -0.0073, -0.0122, -0.0086, -0.0050, -0.0035, -0.0061],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1372, -0.1140, -0.0096, -0.0093, -0.0073, -0.0070, -0.0116, -0.0028,
        -0.0086, -0.1403, -0.0062, -0.0179, -0.0169, -0.0160, -0.0128, -0.2435,
        -0.0155, -0.0116, -0.0034, -0.0071, -0.0535, -0.0113, -0.0182, -0.0105,
        -0.0727, -0.0176, -0.0069, -0.0110,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1201, -0.1212, -0.0127, -0.0137, -0.0094, -0.0078, -0.0122, -0.0028,
        -0.0101, -0.0867, -0.0051, -0.0170, -0.0217, -0.0126, -0.0104, -0.1350,
        -0.0150, -0.0135, -0.0039, -0.0058, -0.0602, -0.0099, -0.0175, -0.0146,
        -0.0205, -0.2017, -0.0153, -0.0099, -0.0137,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0467, -0.0429, -0.0068, -0.0066, -0.0048, -0.0039, -0.0092, -0.0029,
        -0.0056, -0.1372, -0.0019, -0.0098, -0.0123, -0.0076, -0.0070, -0.1048,
        -0.0089, -0.0070, -0.0012, -0.0045, -0.1853, -0.0088, -0.0938, -0.0035,
        -0.2577, -0.0075, -0.0050, -0.0070,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([7.8731e-02, 4.7361e-02, 3.9443e-03, 5.0881e-03, 3.5074e-03, 3.4662e-03,
        5.4148e-03, 1.4002e-03, 2.7248e-03, 6.7325e-02, 3.0052e-03, 8.3955e-03,
        7.0235e-03, 6.6478e-03, 5.7998e-03, 5.4851e-02, 6.1423e-03, 4.9024e-03,
        2.5715e-04, 2.0734e-03, 1.3501e-01, 7.7757e-03, 5.0513e-03, 2.8404e-01,
        2.3204e-03, 4.8680e-02, 6.0728e-03, 1.8113e-01, 5.2130e-03, 2.3522e-03,
        4.2911e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.0850, 0.0460, 0.0045, 0.0036, 0.0033, 0.0037, 0.0058, 0.0017, 0.0047,
        0.0478, 0.0029, 0.0082, 0.0090, 0.0057, 0.0066, 0.0500, 0.0087, 0.0052,
        0.0014, 0.0033, 0.1661, 0.0061, 0.0771, 0.0102, 0.0058, 0.4122, 0.0041,
        0.0032, 0.0079, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0646, -0.0569, -0.0058, -0.0072, -0.0056, -0.0050, -0.0074, -0.0027,
        -0.0041, -0.0685, -0.0025, -0.0125, -0.0142, -0.0078, -0.0112, -0.1588,
        -0.0078, -0.0064, -0.0013, -0.0041, -0.1766, -0.0101, -0.1166, -0.0101,
        -0.1566, -0.0471, -0.0158, -0.0038, -0.0089,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1175, 0.1237, 0.0194, 0.0081, 0.0082, 0.0100, 0.0187, 0.0041, 0.0137,
        0.1948, 0.0082, 0.0278, 0.0191, 0.0151, 0.0180, 0.2643, 0.0220, 0.0166,
        0.0054, 0.0097, 0.0185, 0.0209, 0.0194, 0.0170, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000, 0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0569, -0.1060, -0.0189, -0.0105, -0.0147, -0.0113, -0.0132, -0.0046,
        -0.0102, -0.1905, -0.0069, -0.0235, -0.0257, -0.0144, -0.0172, -0.3328,
        -0.0171, -0.0147, -0.0061, -0.0103, -0.0176, -0.0172, -0.0440, -0.0158,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3050: [tensor([0.0838, 0.0877, 0.0117, 0.0037, 0.0068, 0.0304, 0.0045, 0.0673, 0.0091,
        0.0640, 0.0218, 0.0013, 0.0127, 0.1147, 0.0029, 0.0085, 0.0439, 0.0098,
        0.0051, 0.0003, 0.0035, 0.1975, 0.0056, 0.0196, 0.1358, 0.0042, 0.0093,
        0.0193, 0.0066, 0.0084], device='cuda:0', grad_fn=<DivBackward0>), tensor([-6.2574e-02, -2.5249e-02, -3.7553e-03, -9.6149e-04, -2.4795e-03,
        -1.2480e-02, -2.7907e-03, -1.7099e-02, -2.1843e-03, -1.3524e-02,
        -8.4034e-03, -5.0677e-04, -6.1295e-03, -4.8015e-02, -2.4461e-03,
        -4.0743e-03, -1.4434e-02, -4.4800e-03, -2.0751e-03,  4.1185e-04,
        -1.3761e-03, -2.2916e-03, -1.8542e-03, -2.2470e-02, -2.5333e-02,
        -7.0186e-01, -4.2144e-03, -2.3054e-03, -4.2205e-03,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 8.6992e-02,  7.1223e-02,  1.0060e-02,  1.7211e-03,  5.7139e-03,
         1.9766e-02,  4.8875e-03,  4.3463e-02,  6.7103e-03,  2.9861e-02,
         1.8237e-02, -4.8967e-04,  8.7538e-03,  1.1411e-01,  4.5014e-03,
         8.9682e-03,  2.8607e-02,  5.3506e-03,  3.4308e-03,  4.1119e-05,
         3.1372e-03,  2.8292e-03,  4.8409e-01,  2.1667e-02,  4.4857e-03,
         2.5878e-03,  8.3143e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.0865, 0.0094, 0.0118, 0.0117, 0.0058, 0.0087, 0.0128, 0.0056, 0.0183,
        0.0280, 0.0023, 0.0106, 0.0076, 0.0090, 0.0080, 0.0121, 0.0592, 0.2250,
        0.0085, 0.0024, 0.0057, 0.1917, 0.0103, 0.1270, 0.0609, 0.0096, 0.0360,
        0.0155, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-8.7034e-02, -2.6472e-03, -2.8969e-03, -3.8611e-03, -1.6479e-03,
        -4.5741e-03, -3.4812e-03, -2.6382e-03, -8.0967e-03, -1.0644e-02,
        -8.6363e-04, -4.0872e-03, -2.9041e-03, -3.6784e-03, -2.7103e-03,
        -6.7476e-03, -1.4029e-02, -6.9384e-02, -4.6232e-03,  4.5540e-04,
        -1.6224e-03, -8.5360e-03, -4.3353e-03, -2.9544e-02, -7.0162e-01,
        -2.3826e-03, -1.1115e-02, -3.8446e-03,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-7.9877e-02, -2.4631e-03, -2.0524e-03, -4.2115e-03, -2.0295e-03,
        -3.9032e-03, -2.6990e-03, -3.1217e-03, -8.1738e-03, -1.1386e-02,
        -1.3382e-03, -3.6993e-03, -3.1483e-03, -3.1362e-03, -2.5871e-03,
        -5.0810e-03, -1.6867e-02, -5.6242e-02, -3.8220e-03, -1.1702e-04,
        -1.3410e-03, -1.2511e-02, -2.9169e-03, -6.2004e-03, -7.5147e-01,
        -5.1047e-03, -4.4995e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1091, 0.1331, 0.0113, 0.0103, 0.0226, 0.0065, 0.0287, 0.0017, 0.0192,
        0.0061, 0.0078, 0.0060, 0.0498, 0.0137, 0.0497, 0.3270, 0.0053, 0.0121,
        0.0035, 0.0062, 0.0283, 0.0300, 0.0378, 0.0360, 0.0144, 0.0107, 0.0133,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([6.0461e-02, 1.1402e-01, 9.2968e-03, 6.0052e-03, 1.1242e-02, 3.6905e-03,
        2.2244e-02, 7.4420e-05, 1.2651e-02, 4.8960e-03, 7.1037e-03, 6.2318e-03,
        3.8127e-02, 1.1655e-02, 3.3906e-02, 1.8151e-01, 4.6863e-03, 7.2489e-03,
        1.6492e-03, 3.6122e-03, 6.5580e-03, 1.2063e-02, 1.6329e-01, 1.9866e-01,
        2.3095e-02, 1.2183e-02, 1.0960e-03, 2.5377e-02, 6.0885e-03, 1.1282e-02],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-8.6743e-02, -2.0118e-02, -3.5464e-03, -3.0676e-03, -4.8558e-03,
        -2.0703e-03, -7.7938e-03,  5.3471e-04, -6.8568e-03, -2.5347e-03,
        -2.8673e-03, -2.1260e-03, -1.1383e-02, -6.0286e-03, -1.1699e-02,
        -3.6842e-02, -1.5026e-03, -3.3099e-03, -3.6233e-04, -1.4539e-03,
        -4.1953e-03, -3.8784e-03, -5.3590e-02, -2.2335e-02, -6.8266e-01,
        -3.1536e-03, -8.1521e-03, -2.3370e-03, -4.0063e-03,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1248, 0.0103, 0.0153, 0.0099, 0.0067, 0.0358, 0.0116, 0.0073, 0.2928,
        0.0094, 0.0703, 0.0311, 0.0111, 0.0088, 0.0097, 0.0273, 0.0395, 0.0150,
        0.0134, 0.1959, 0.0217, 0.0105, 0.0218, 0.0000, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1643, 0.0091, 0.0098, 0.0086, 0.0058, 0.0173, 0.0088, 0.0078, 0.1572,
        0.0105, 0.0375, 0.0340, 0.0113, 0.0016, 0.0061, 0.0176, 0.0240, 0.0202,
        0.0128, 0.0590, 0.0161, 0.0666, 0.1736, 0.0261, 0.0667, 0.0101, 0.0043,
        0.0128, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1253, 0.0073, 0.0100, 0.0093, 0.0046, 0.0182, 0.0055, 0.0055, 0.1726,
        0.0105, 0.0393, 0.0298, 0.0083, 0.0029, 0.0053, 0.2011, 0.0107, 0.1453,
        0.0282, 0.0380, 0.0782, 0.0264, 0.0059, 0.0118, 0.0000, 0.0000, 0.0000,
        0.0000, 0.0000, 0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3100: [tensor([-9.1374e-02, -1.7245e-02, -1.2125e-03, -2.5265e-04, -1.8094e-04,
         4.4530e-05,  9.0440e-04,  8.9412e-04, -2.0376e-01, -1.6371e-03,
        -2.6092e-04,  8.7965e-05, -1.1135e-03, -2.4239e-03, -3.6022e-05,
        -1.2559e-04, -4.3712e-04, -6.9916e-04,  2.9612e-04,  7.5591e-04,
        -1.3155e-01,  5.2139e-04, -2.2438e-01,  8.5581e-04, -6.3305e-06,
        -1.0860e-04, -1.2587e-03, -1.1284e-01, -3.1230e-03, -5.3679e-04,
        -1.2282e-03, -1.1037e-02, -7.8240e-02, -7.9147e-05, -7.0959e-03,
        -3.4126e-03, -7.8856e-02, -1.2916e-02, -3.7620e-03, -2.2059e-03,
        -2.2472e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-8.0917e-02, -8.0042e-03, -1.0568e-03,  4.9202e-04, -2.7389e-04,
        -2.7549e-04,  8.1828e-04,  7.9686e-04, -2.3830e-01, -1.1680e-03,
        -3.4949e-05, -2.3628e-06, -1.0108e-03, -2.4944e-03,  2.7786e-04,
        -1.9522e-04, -4.8419e-04, -1.3264e-03,  8.2687e-04,  1.1768e-03,
        -2.2084e-01, -1.8937e-04, -1.8172e-01,  4.5433e-04,  2.5255e-04,
         2.3576e-04, -9.3951e-04, -5.8586e-02, -1.6169e-02, -5.9606e-02,
        -1.6730e-03, -9.5067e-02,  3.2144e-04, -9.4388e-03, -5.8997e-04,
        -8.2514e-03, -3.3679e-03, -2.3714e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.2268e-01, -4.6759e-02, -2.1140e-03,  4.2709e-04, -2.1776e-04,
         4.8734e-05,  3.0116e-04,  3.9031e-04, -1.5514e-02, -1.3777e-03,
        -1.1612e-04,  3.8048e-05, -8.8230e-04, -2.5516e-03,  8.4959e-05,
        -3.5203e-04, -1.2688e-03, -1.1859e-03,  7.6885e-04,  2.1312e-03,
        -2.3720e-01,  5.5653e-04, -1.3818e-01,  1.0170e-03,  3.0725e-04,
         1.5182e-04, -1.5261e-03, -7.9710e-02, -1.0401e-02, -7.4032e-02,
        -5.0832e-04, -1.2995e-01, -6.7225e-03, -8.4336e-02, -2.2632e-02,
        -6.9350e-03, -4.1108e-03, -2.5077e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.7618e-02, -3.2232e-03, -2.3054e-03, -1.9541e-04, -9.0234e-04,
        -5.2152e-04, -1.3709e-03,  3.6406e-04, -3.4335e-02, -1.8120e-03,
        -1.1866e-03, -2.0541e-04, -1.2156e-03, -2.4676e-03,  8.0442e-05,
        -1.1323e-03, -1.5107e-03, -8.0684e-04,  3.7243e-04,  6.4500e-04,
        -2.1861e-01,  3.9777e-04, -2.1855e-01, -2.0052e-04, -6.6641e-05,
        -8.6143e-04, -1.8022e-03, -9.2903e-02, -1.4703e-02, -1.9980e-03,
        -8.2897e-04, -6.0584e-02, -9.7992e-04, -1.2602e-01, -8.1760e-03,
        -8.7749e-02, -2.5576e-02, -2.8820e-03, -1.6074e-03, -3.2338e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-8.6050e-02, -4.8564e-03, -1.3111e-03, -1.5355e-04, -4.8806e-04,
        -9.6255e-05, -4.5409e-05,  8.8069e-04, -2.2457e-01, -1.2168e-03,
        -2.1666e-04, -3.0833e-04, -5.9735e-04, -2.2591e-03, -4.9036e-05,
        -3.2713e-04, -8.4514e-04, -9.3222e-04,  1.9290e-04,  7.3956e-04,
        -1.5537e-01,  3.0711e-04, -1.8979e-01,  4.9445e-04, -1.4596e-04,
        -2.4071e-04, -1.1497e-03, -6.3799e-02, -4.0837e-03, -3.7865e-02,
        -2.4651e-04, -2.2922e-03, -6.4200e-03, -9.5247e-02, -1.9081e-02,
        -6.6023e-03,  6.3609e-04, -1.0000e-03,  6.4297e-04, -1.5429e-03,
        -5.5712e-03, -7.6511e-02, -4.8679e-04, -1.9712e-03, -2.3703e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.0919e-02, -6.1880e-02, -9.6432e-04,  1.9281e-04, -1.2861e-04,
         2.7309e-04,  6.0902e-04,  8.1503e-04, -3.6907e-01, -1.4471e-03,
        -9.0733e-05,  2.5964e-04, -9.2084e-04, -1.9982e-03,  8.7030e-05,
        -2.3129e-04, -2.9825e-04, -3.9785e-04,  9.2520e-04,  9.7645e-04,
        -1.2926e-01,  1.6761e-04, -1.2287e-01,  8.0767e-04, -4.1935e-04,
         2.9528e-04, -9.4524e-04, -6.9482e-02, -6.1487e-03, -3.8121e-02,
        -2.0143e-03, -1.4142e-03, -4.6610e-04, -9.2599e-02, -1.3665e-02,
        -5.4029e-03, -1.9007e-03, -1.5415e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.0545e-02,  8.2794e-03, -1.5508e-03, -7.1971e-05, -5.3727e-04,
        -2.9219e-04,  4.2971e-04,  5.8629e-04, -2.5702e-01, -1.0119e-03,
        -2.6211e-04, -1.9898e-04, -6.6486e-04, -1.6960e-03,  3.9525e-04,
        -6.0910e-04, -1.3067e-03, -1.5074e-03, -5.9103e-04,  8.1801e-04,
        -1.7987e-01,  3.4749e-04, -1.8603e-01,  2.2494e-04,  4.3833e-04,
         1.6664e-04, -1.4585e-03, -7.5318e-02, -6.0508e-03, -4.9151e-02,
        -1.3995e-02, -8.9900e-02, -4.6033e-02, -2.8544e-03, -3.6883e-03,
        -6.0958e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.1857e-01, -4.6238e-02, -1.1278e-03,  3.9842e-04, -3.2851e-04,
        -2.9370e-04,  2.0136e-03,  4.9497e-04, -2.1177e-02, -1.6720e-03,
        -1.9904e-04, -5.7728e-05, -1.0367e-03, -3.4732e-03,  5.0364e-05,
        -4.8836e-04, -1.2359e-03, -1.1048e-03,  3.6798e-03,  1.7066e-03,
        -2.1295e-01,  2.3878e-04, -2.6912e-01,  2.1378e-04,  2.9525e-04,
         4.6276e-04, -1.0153e-03, -8.4691e-02, -2.0580e-02, -5.1859e-02,
        -2.9872e-03, -1.0236e-01, -6.8763e-03, -1.0566e-02, -1.6392e-02,
        -8.2376e-03, -2.9794e-03, -2.8296e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.8677e-02, -4.5483e-03, -1.0392e-03,  3.4493e-05, -1.5868e-04,
         1.9420e-05, -1.2452e-04,  5.5999e-04, -3.4980e-01, -1.2226e-03,
        -3.2621e-04,  1.6252e-04, -6.3753e-04, -1.2263e-03,  1.2684e-04,
        -2.3040e-04, -9.7894e-04, -1.0921e-03,  4.7354e-04,  9.3566e-04,
        -1.7382e-01,  2.6826e-04, -1.7751e-01,  1.2315e-03,  5.3356e-04,
         2.4988e-04, -1.0091e-03, -5.2428e-02, -1.1358e-02, -4.8393e-02,
        -1.0254e-01, -9.2266e-04, -9.4624e-03, -2.6093e-03, -8.6040e-04,
        -4.4309e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.3796e-02, -1.0826e-02, -2.4645e-03,  9.9737e-05, -4.3519e-03,
        -6.7305e-02, -1.4700e-03, -7.6873e-04, -3.8195e-04, -5.0452e-04,
        -4.0906e-03, -8.0609e-04, -7.4061e-04, -3.5743e-04,  4.4442e-03,
        -4.9831e-04, -8.6351e-05, -1.4346e-03, -1.2459e-03, -2.1432e-04,
        -9.3310e-06, -1.6784e-02, -3.0865e-04, -1.2157e-04, -3.4999e-01,
        -6.5861e-05, -2.8002e-04, -9.7502e-04, -1.5354e-03, -2.5834e-04,
         8.3093e-04, -4.0350e-04,  4.6651e-04, -7.2627e-03, -3.0082e-03,
        -4.6283e-03, -9.3694e-04, -9.4377e-04, -1.4735e-03, -2.8181e-04,
        -9.5010e-04, -5.8949e-04, -2.5131e-01, -2.8259e-03, -1.6172e-01,
        -1.0156e-02, -4.5706e-03, -1.3305e-02, -1.5301e-03, -1.4045e-03,
        -5.1837e-03,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.5250e-02, -3.6764e-02, -9.7013e-04, -9.2265e-06, -4.3218e-03,
        -7.3160e-02, -1.2882e-03, -5.5193e-04, -4.7588e-04, -4.8491e-04,
        -1.1801e-03, -1.8873e-04, -8.3135e-04, -1.2223e-03, -5.7942e-04,
        -3.0502e-04, -1.0657e-03, -8.3741e-04, -2.4569e-04,  3.0141e-04,
        -4.1038e-04, -1.0185e-02,  3.3854e-04, -1.7885e-04, -4.9844e-01,
        -1.3331e-04, -5.4338e-04, -1.4343e-04, -3.1978e-04,  9.7881e-05,
         3.7474e-04, -5.3783e-04,  6.4174e-04, -2.4495e-03,  4.4391e-05,
        -7.7609e-04, -1.0543e-03,  6.2634e-05, -3.9973e-04, -2.0517e-04,
         5.3911e-04, -7.6043e-04, -1.3432e-01, -1.3316e-03, -1.2402e-03,
        -1.2177e-01, -9.1886e-03, -4.0561e-02, -8.5622e-03, -1.4306e-03,
        -8.7358e-04, -2.0534e-03,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.1117e-01, -4.7362e-02, -4.2965e-03, -2.9124e-04, -1.5543e-03,
        -2.0936e-02, -1.6331e-03, -1.8023e-03, -6.7441e-04, -2.6056e-04,
        -3.0886e-03, -3.3709e-04, -6.9719e-04, -1.9345e-04,  2.0528e-03,
        -4.3650e-04, -4.0120e-04, -1.4587e-03, -1.5087e-03, -1.9611e-04,
         7.9716e-05, -1.4150e-02,  4.7607e-04,  3.1993e-04, -3.4338e-01,
        -2.8467e-05,  1.7065e-04, -9.4298e-04, -1.2374e-03,  2.6896e-04,
         5.4533e-04,  1.5445e-04,  7.3125e-04,  4.2562e-03, -3.8994e-03,
        -2.0477e-03, -1.0372e-03, -8.8985e-04, -3.9139e-04, -1.0378e-03,
        -8.3215e-04, -1.2483e-03, -1.5759e-01, -6.2308e-03, -1.2398e-01,
        -3.4804e-03, -8.6942e-02, -2.7217e-03, -7.2906e-03, -7.5272e-03,
        -1.4015e-02, -7.1290e-03, -4.6114e-03], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #3150: [tensor([-1.6854e-01, -7.4968e-02, -2.8952e-04,  2.1694e-02, -4.8349e-03,
         2.8432e-03,  1.6904e-02,  4.9315e-03, -3.8927e-03, -3.8347e-03,
        -3.5918e-03,  2.1930e-03, -2.3291e-03, -1.7966e-01,  2.5493e-03,
        -3.2552e-01, -1.0037e-01,  6.9038e-02, -1.2017e-02,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.4191e-01,  1.1709e-02,  7.1461e-03,  1.4513e-01,  6.9996e-04,
         4.0905e-03,  5.4561e-02, -7.0733e-04, -1.4659e-04,  4.5807e-03,
         1.5781e-03, -1.1891e-01, -3.0115e-02,  4.4122e-03, -1.9946e-03,
        -2.9173e-01, -3.2003e-03, -7.1125e-02, -8.9207e-02, -1.5134e-02,
         1.9096e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2529, -0.0041, -0.0013,  0.0144, -0.0037,  0.0010, -0.0145, -0.0043,
        -0.0044,  0.0004, -0.0026, -0.2799, -0.0512, -0.0483, -0.0075, -0.2025,
        -0.0706,  0.0243, -0.0122,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1981, -0.0116,  0.0012,  0.0387,  0.0002,  0.0017,  0.0155, -0.0017,
        -0.0011,  0.0022, -0.0008, -0.2156, -0.1191, -0.0780, -0.0045, -0.1991,
        -0.0929, -0.0104, -0.0079,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1301, -0.0200,  0.0066, -0.0145, -0.0082, -0.0072, -0.1052, -0.0028,
        -0.0010,  0.0138,  0.0039, -0.0346, -0.3311, -0.0610, -0.0168, -0.0325,
        -0.0300, -0.1284, -0.0237, -0.0005, -0.0282,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 1.0302e-01,  1.5602e-02, -8.3376e-03,  1.0923e-02,  6.7965e-03,
        -2.5010e-03,  1.8095e-01,  1.4614e-04, -2.3513e-03, -2.2113e-02,
        -1.6812e-03,  3.8110e-02,  4.1677e-02,  1.3470e-01,  3.6784e-03,
         1.5210e-02,  1.9692e-02, -3.3494e-01,  3.8328e-02,  9.4577e-03,
         9.7835e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1924, -0.0025,  0.0045, -0.0027, -0.0042,  0.0012,  0.1310, -0.0013,
        -0.0005,  0.0033, -0.0015, -0.0279, -0.0398,  0.0225,  0.0032, -0.3024,
        -0.1573, -0.0284, -0.0585, -0.0146,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.0407e-01, -2.8697e-03, -1.6892e-03,  7.7030e-02, -2.0085e-03,
        -3.6345e-03, -1.1508e-03, -3.4480e-05, -4.3569e-01,  2.7179e-03,
        -4.1788e-03, -1.7683e-01, -8.4910e-03, -1.3227e-01, -7.9032e-03,
        -5.4474e-03, -9.8000e-03,  2.4186e-02,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.2956e-01, -2.4422e-03, -1.6368e-03,  9.2951e-02, -2.4598e-03,
        -2.6362e-03,  5.8502e-05, -1.7367e-03, -3.0853e-01, -3.5526e-03,
        -1.6046e-01, -4.8230e-03, -2.4946e-01, -2.9119e-02, -3.3534e-03,
        -7.2117e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-7.9341e-02, -8.4301e-04, -9.1296e-04, -6.2121e-01, -6.4004e-04,
        -6.7216e-04, -9.5545e-04,  1.1949e-04, -3.9201e-03, -5.8710e-02,
        -4.5839e-03, -1.3137e-01, -7.8988e-02, -1.2908e-02, -4.8308e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0996, -0.0466,  0.0057, -0.0025,  0.0006,  0.0008,  0.0022, -0.0060,
        -0.0021, -0.0082,  0.0031, -0.0759, -0.0017,  0.0057,  0.0030, -0.0452,
        -0.0769,  0.0274, -0.0112, -0.0926, -0.0246, -0.3545,  0.0471, -0.0142,
         0.0337, -0.0088], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.3461e-01, -3.2230e-03,  6.8714e-03, -2.3104e-03, -1.2546e-03,
         1.5150e-03,  5.5029e-04, -4.5456e-03, -3.0527e-03, -9.7647e-03,
         2.6380e-03,  1.1325e-02, -3.7424e-03, -2.5288e-04,  7.6210e-04,
        -1.4233e-01, -1.9907e-02, -4.8794e-02,  3.8195e-03,  2.2814e-04,
        -3.0546e-01,  3.6846e-03,  4.6605e-02, -1.0916e-01,  2.1031e-02,
        -1.2562e-02], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3200: [tensor([-0.3133, -0.0330, -0.0077, -0.0214, -0.0042, -0.0404, -0.0035, -0.0011,
        -0.0062, -0.2423, -0.0410, -0.1850, -0.0346, -0.0443, -0.0222,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2197, -0.0197, -0.0042, -0.0159, -0.0027, -0.0247, -0.0038,  0.0029,
        -0.0016, -0.1158, -0.0158, -0.1120, -0.2885, -0.1475, -0.0070, -0.0181,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2006,  0.0618,  0.0024,  0.0037, -0.0060,  0.0071,  0.0031, -0.0004,
         0.0021,  0.0024,  0.0035,  0.0235,  0.0017,  0.0054,  0.0035, -0.2802,
        -0.0772,  0.0116, -0.0460, -0.0054, -0.0706, -0.0585, -0.0047, -0.1019,
        -0.0068, -0.0098,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-9.6754e-02, -5.6038e-01,  2.0769e-04,  1.0702e-03, -2.2489e-03,
         3.2135e-03,  1.2587e-04,  7.4233e-04, -3.1510e-04,  8.4807e-04,
         2.0989e-03,  3.9790e-03,  9.0810e-04,  2.0667e-03,  1.2390e-03,
        -5.3773e-02, -5.4325e-03,  6.3341e-02, -7.2666e-04, -4.6570e-02,
        -3.7457e-02, -5.0911e-03, -7.9031e-03, -4.6147e-03, -1.3138e-03,
        -4.0503e-02, -2.5320e-02, -2.2301e-02,  1.0039e-04, -2.3932e-03,
        -2.7980e-03, -4.1674e-03,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1986,  0.1374,  0.0022,  0.0016, -0.0043,  0.0026,  0.0004, -0.0005,
        -0.0006,  0.0012, -0.0020,  0.0260,  0.0009,  0.0028,  0.0013, -0.1422,
        -0.0512,  0.0789, -0.0017, -0.0082,  0.0030,  0.0045, -0.0329, -0.0237,
        -0.0204, -0.1107,  0.1007, -0.0118, -0.0033, -0.0012,  0.0050, -0.0080,
        -0.0103], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.0357e-01, -1.0976e-02,  1.1786e-02,  7.5978e-04,  2.5861e-03,
         3.4768e-03, -2.8442e-05,  4.4612e-05, -3.2676e-02,  3.9791e-03,
        -5.3633e-03, -1.8014e-03,  1.9805e-03,  5.3391e-03, -4.3017e-04,
        -1.6145e-01, -1.8830e-01,  4.5486e-02, -5.1376e-03, -1.8825e-01,
        -3.7474e-02, -7.9320e-04,  1.8830e-01,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1386, -0.0149, -0.0072, -0.0020, -0.0009,  0.0021,  0.0016,  0.0006,
        -0.0456, -0.0027, -0.0068, -0.0042,  0.0018,  0.0018,  0.0007, -0.0734,
        -0.3103,  0.0548, -0.0194, -0.0045, -0.0251, -0.0050,  0.2758,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1035, -0.0115,  0.0165,  0.0012,  0.0049,  0.0023,  0.0025,  0.0057,
        -0.0235,  0.0048, -0.0062,  0.0418,  0.0030,  0.0027,  0.0033, -0.0574,
        -0.3356,  0.0352, -0.0316, -0.0162, -0.0534,  0.0047,  0.2325,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.7226e-02, -6.2741e-01, -5.0673e-05, -1.0699e-03, -1.9765e-03,
        -2.1923e-05, -2.3301e-03,  2.8034e-04,  2.6146e-03,  5.5179e-03,
        -9.9064e-03, -1.2438e-03, -1.2450e-04,  9.6422e-04,  4.3055e-03,
         4.9891e-04, -1.7263e-03,  3.7843e-02, -1.9362e-01, -5.1004e-02,
         2.6252e-04,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.4477e-02,  2.1713e-02,  1.4765e-05, -1.7931e-03, -2.1661e-03,
        -1.1710e-03, -1.4260e-03,  2.3981e-03,  2.8645e-03, -1.8135e-01,
        -3.8879e-02, -7.0835e-04,  1.6362e-03,  1.0834e-03,  7.1710e-03,
        -9.9632e-04, -4.6252e-03,  1.8532e-01, -3.8031e-01, -7.9774e-02,
        -1.8938e-02, -1.1890e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.6104e-01, -2.3217e-01,  1.8632e-04,  4.7611e-03, -2.1261e-04,
         1.5635e-03, -1.7916e-03, -1.1890e-04,  1.5732e-03, -4.3710e-01,
         1.1455e-02,  5.8002e-04,  9.4184e-04,  2.2275e-03,  2.6812e-03,
        -2.5205e-04, -1.2076e-02, -8.0988e-02, -1.8110e-02, -2.2498e-02,
        -7.6606e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.0798e-01, -3.7082e-01, -3.4010e-04,  1.6850e-02,  2.1953e-02,
         1.3093e-03,  3.6562e-03,  2.5350e-03, -9.9333e-04,  8.5872e-02,
         5.4886e-03,  5.4562e-05,  7.9586e-04,  2.0122e-03,  1.1122e-02,
         1.1048e-03, -1.7623e-03,  8.8528e-04,  2.9357e-04, -8.4403e-02,
        -2.4548e-04, -4.7465e-02,  1.4284e-02, -4.4231e-02,  4.4079e-02,
        -1.9107e-02,  2.2788e-02,  1.9972e-02,  1.0868e-03, -1.3761e-02,
        -4.8421e-02, -4.3353e-03,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #3250: [tensor([-0.2535, -0.0349, -0.0023, -0.0125, -0.0068,  0.0007, -0.0059, -0.4399,
        -0.0155, -0.1962, -0.0140,  0.0054, -0.0125,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.4654e-01, -2.5175e-01,  2.0304e-03, -3.2407e-04,  6.2972e-03,
         1.1509e-02, -9.0206e-04, -3.9294e-01, -1.0101e-02, -2.0661e-02,
        -6.9485e-02, -5.0189e-02, -3.5248e-02, -2.0178e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.3135e-01,  1.3064e-01, -4.8746e-04,  7.2521e-03,  3.0318e-03,
         4.9159e-03,  5.0999e-04,  2.6163e-04,  7.9969e-04, -3.8091e-03,
         2.3789e-05, -3.7711e-01,  3.8484e-03, -4.8245e-03,  3.0487e-03,
        -5.3167e-04, -9.0097e-02,  2.0589e-02, -4.5755e-02, -7.6019e-02,
         1.1288e-02, -5.5350e-02,  1.3726e-02, -3.6495e-03, -1.1083e-02,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.3596e-02,  3.5302e-02,  3.2086e-04,  3.4025e-03,  4.6004e-03,
         1.8908e-03, -1.1748e-04,  2.1491e-04,  3.1953e-04, -7.6587e-05,
        -8.2436e-04, -6.9742e-01,  1.0558e-03, -1.6130e-03,  1.4263e-03,
        -3.5570e-04, -4.1421e-02,  1.3617e-02, -2.2920e-03, -3.6116e-02,
        -2.3316e-03, -2.3584e-02, -1.8707e-02, -1.5749e-03, -4.7491e-03,
        -2.5504e-02,  1.7563e-02,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.5327e-02, -3.0756e-01,  6.5122e-04,  7.0280e-03,  1.3916e-02,
         3.1416e-03,  5.3574e-04,  1.3402e-03,  7.0794e-04,  4.2403e-04,
        -2.1052e-04, -4.2312e-01,  2.3502e-03, -1.6059e-03,  3.5896e-03,
         1.2666e-03, -5.7887e-02,  8.1152e-03, -3.4243e-04,  8.2938e-03,
        -3.9340e-02, -1.1881e-02,  5.1744e-03, -3.0216e-02, -1.1863e-03,
        -1.3641e-02,  1.0981e-02, -1.7443e-04], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.2529, -0.0066, -0.0032, -0.0124, -0.0289, -0.0038, -0.0137, -0.0060,
        -0.0051, -0.0059, -0.0046, -0.1349, -0.0141, -0.1178,  0.0365,  0.0126,
        -0.3131,  0.0098, -0.0181,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1720, -0.0035, -0.0006, -0.0038, -0.0091, -0.0008, -0.0091, -0.0316,
        -0.0029,  0.0011, -0.0027, -0.1201, -0.0096, -0.0941, -0.2211, -0.0086,
        -0.1618, -0.1289, -0.0115, -0.0072,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.2329, -0.0037, -0.0032, -0.0075, -0.0181, -0.0028, -0.0149, -0.0494,
        -0.0059, -0.0053, -0.0045, -0.0922, -0.0109, -0.0999, -0.0058, -0.1337,
        -0.0105,  0.0158, -0.2665, -0.0041, -0.0123,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1777,  0.0013,  0.0090, -0.0005,  0.0095, -0.0027,  0.0089,  0.0011,
        -0.0175, -0.0078, -0.0065, -0.3268, -0.3460, -0.0847,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0588,  0.0111,  0.0240,  0.0076,  0.0020,  0.0032,  0.0231,  0.0042,
        -0.0055,  0.2131, -0.0335,  0.3131, -0.1333,  0.1676,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0428, -0.0087, -0.0099,  0.0032,  0.0127, -0.0021, -0.0241,  0.0007,
         0.0392, -0.5769,  0.1234, -0.1563,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0770, -0.0032, -0.0008,  0.0014,  0.0015,  0.0035, -0.0015, -0.0085,
        -0.0013, -0.1022, -0.0008, -0.0067, -0.2530, -0.0053,  0.0025, -0.0010,
        -0.0087,  0.0582, -0.4334, -0.0148, -0.0132, -0.0014,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #3300: [tensor([-1.4458e-01, -2.7027e-01, -5.5996e-03, -2.8080e-03, -1.4147e-03,
        -1.7589e-03, -9.4594e-04, -6.8765e-03, -5.6520e-03,  1.2360e-03,
        -7.7631e-03, -1.1328e-03, -4.7566e-03, -1.1529e-02, -1.1331e-03,
        -7.3449e-03, -5.4669e-03, -2.0567e-03, -1.6215e-04,  1.0091e-03,
        -6.9048e-05, -2.2853e-01,  3.6271e-02, -2.7169e-02, -5.0398e-02,
        -2.2897e-02,  1.5117e-01,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1982, -0.0138, -0.0047, -0.0036, -0.0016, -0.0102, -0.0149, -0.0028,
        -0.0002, -0.0087, -0.0011,  0.0015, -0.0019, -0.1762, -0.0091, -0.0087,
        -0.0024, -0.0936, -0.1648, -0.0203, -0.0024, -0.0473,  0.0636, -0.0031,
        -0.0050, -0.0260,  0.1091, -0.0054,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1308, -0.0302, -0.0032, -0.0052, -0.0031, -0.0099, -0.0339, -0.0040,
        -0.0012, -0.0105, -0.0019, -0.0022, -0.0030, -0.1390, -0.0081, -0.0104,
        -0.2309,  0.0246, -0.3415, -0.0031, -0.0034,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1669, -0.0355, -0.0052, -0.0059, -0.0013, -0.0252, -0.0224, -0.0037,
        -0.0025, -0.0091, -0.0032,  0.0005, -0.0039, -0.3124, -0.0137, -0.0193,
        -0.0107, -0.0058, -0.3452, -0.0035, -0.0042,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.8782e-01, -1.4555e-02, -1.0424e-03, -3.0125e-03, -7.9578e-03,
        -8.6669e-03, -1.6931e-03, -1.9548e-03, -6.5660e-04, -1.9759e-03,
        -1.5847e-03, -1.1906e-03, -4.6959e-04, -2.2359e-03,  7.1611e-05,
        -5.9997e-03, -6.7182e-03, -1.8812e-03, -5.9053e-04, -4.2134e-04,
        -3.7747e-03,  1.4149e-03,  1.3455e-03, -9.1491e-04, -5.7792e-04,
        -2.2188e-03,  1.3688e-04,  3.5123e-04, -4.5654e-04, -1.5627e-01,
        -2.6589e-02, -2.4959e-02, -4.2113e-03, -1.9854e-02, -9.0607e-03,
        -7.0977e-03, -4.7102e-02, -1.4418e-01, -3.1442e-02, -3.1854e-03,
        -1.0712e-01, -1.3804e-01, -1.1291e-02, -4.7624e-03, -3.1446e-03,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.3956e-01, -1.3345e-02, -2.2109e-03, -1.9832e-03, -3.5914e-03,
        -1.5710e-02, -8.2332e-04, -3.5254e-03, -3.7421e-04, -2.0103e-03,
        -7.0828e-04, -7.2148e-04,  5.4403e-04, -1.9653e-03, -1.9397e-04,
        -5.6608e-03, -7.6669e-03, -6.0672e-04, -3.8504e-04, -4.0899e-04,
        -3.4749e-03,  7.8311e-04,  1.5984e-03, -7.8547e-04, -8.5832e-04,
        -1.7223e-03,  1.2747e-03,  7.8204e-04, -3.7494e-04, -2.2940e-01,
        -1.0609e-02, -4.2353e-02, -3.5817e-03, -1.1365e-02, -6.7502e-03,
        -9.0592e-02, -3.4128e-03, -2.6980e-03, -8.4719e-02, -1.4632e-02,
        -2.4180e-02, -8.6559e-04, -9.6612e-02, -1.4482e-01, -1.9229e-03,
        -1.4053e-02, -3.7897e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.2156e-01, -1.1463e-02, -3.1456e-03, -2.8288e-03, -6.2310e-03,
        -1.4167e-02, -9.8347e-04, -2.4589e-03, -7.6485e-04, -2.6295e-03,
        -1.4111e-03, -3.8399e-04,  1.9917e-04, -2.0465e-03, -7.2673e-04,
        -5.4230e-03, -9.2388e-03, -1.6167e-03, -1.2083e-03, -9.5698e-04,
        -3.9062e-03,  3.8707e-04,  1.1850e-03, -7.8320e-04, -5.0551e-04,
        -8.4211e-04,  5.7265e-04,  6.1714e-04, -1.7667e-04, -1.2772e-01,
        -4.6922e-03, -9.4212e-02, -2.5399e-03, -1.2449e-01, -3.2219e-03,
        -2.2148e-02, -7.7799e-02, -5.5605e-04, -1.6399e-02, -1.8761e-01,
        -6.0218e-02, -2.0842e-02, -5.5222e-02, -3.0255e-03, -8.9205e-04,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.6509e-01, -2.9581e-02, -4.5832e-03, -4.0830e-03, -3.1203e-03,
        -8.0501e-03, -1.8765e-02, -1.1993e-03, -2.2434e-03, -5.9663e-04,
        -4.0664e-03, -2.3566e-03,  7.5507e-04, -2.5683e-03,  7.3937e-04,
        -1.4243e-03, -2.6889e-03, -1.0014e-03, -3.3196e-03,  6.5952e-05,
         7.8317e-04, -5.9376e-03, -1.8927e-04,  4.5410e-04, -1.8327e-04,
        -2.2894e-01,  1.4282e-02, -3.3899e-02, -1.1705e-01, -2.1201e-03,
        -5.2931e-03, -2.1743e-01, -4.8065e-03, -2.6513e-03, -6.2252e-03,
         3.4667e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.9148e-01, -4.7446e-02, -3.4413e-03, -4.2144e-03, -3.3666e-03,
        -9.1931e-03, -2.0922e-02, -1.5429e-03, -5.8882e-04, -1.0813e-03,
        -3.6894e-03, -1.6847e-03,  1.1049e-03, -2.3790e-03,  7.3993e-04,
        -8.8095e-04, -2.0796e-03, -1.1332e-03, -3.2255e-03,  1.5963e-04,
         1.2426e-03,  3.2853e-03,  4.5370e-04, -1.6927e-04,  8.6650e-04,
        -4.6439e-01,  5.1211e-03, -4.9589e-03, -1.3458e-01, -1.5412e-02,
        -6.8975e-03, -4.0134e-02, -3.6516e-03, -1.4699e-02, -3.7958e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2184, -0.0499, -0.0063, -0.0036, -0.0042, -0.0142, -0.0267, -0.0004,
        -0.0027, -0.0011, -0.0032, -0.0029,  0.0005, -0.0028,  0.0012, -0.0013,
        -0.0035, -0.0007, -0.0024, -0.0007,  0.0026, -0.0109,  0.0005, -0.0003,
        -0.0008, -0.1971,  0.0264, -0.0340, -0.1124,  0.0003, -0.0049, -0.2239,
        -0.0118, -0.0222, -0.0053,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.1556e-01, -3.1647e-02, -9.1892e-04, -1.3166e-02, -1.6512e-03,
        -2.9202e-03,  5.6583e-05, -2.5392e-02, -3.8772e-04, -4.8725e-03,
        -3.5890e-03, -2.8534e-03, -2.9743e-03, -3.3927e-03, -2.9603e-03,
        -3.6821e-03, -2.8855e-02, -1.1756e-03, -1.4522e-03, -3.7119e-03,
         2.2947e-04,  2.1315e-03, -2.2806e-04, -3.4935e-01, -3.3531e-03,
        -3.1722e-01,  5.2473e-02, -3.4888e-03,  1.2356e-02, -7.9608e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.4392e-01, -3.2151e-02, -1.8462e-03, -1.7769e-02, -2.6065e-03,
        -5.4779e-03, -8.4572e-04, -3.2942e-02, -1.3120e-04, -5.5449e-03,
        -4.6971e-03, -4.6735e-03, -4.3414e-03, -2.8753e-03, -4.8253e-03,
        -6.2855e-03, -3.8173e-02, -3.5090e-03, -3.7141e-03, -1.8361e-03,
        -2.8574e-03, -1.2245e-03,  6.9851e-04, -2.1548e-01,  1.0226e-02,
        -1.9012e-01, -3.7812e-03, -2.4574e-03, -1.5860e-01, -7.2257e-02,
        -1.8213e-02, -5.9176e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3350: [tensor([ 1.7287e-01,  5.1066e-03,  2.1773e-03, -3.1423e-04,  1.8413e-03,
         5.0968e-03,  1.8891e-03,  2.4498e-02,  1.8042e-03, -9.8032e-04,
         1.1992e-03,  7.0351e-01,  6.0667e-03,  5.7577e-03,  1.9922e-03,
         7.9671e-03,  6.4477e-03,  4.8145e-03,  7.5256e-03,  2.7107e-02,
         5.9071e-03,  2.0685e-03,  3.0605e-03,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 1.3536e-01,  4.4599e-03,  5.2798e-04,  2.5793e-05,  2.4254e-03,
         4.7759e-03,  3.8115e-03,  2.8513e-02,  3.1695e-03, -1.3038e-04,
         1.5384e-03,  7.5475e-01,  7.6415e-03,  6.6678e-03,  1.5020e-02,
         4.7768e-03,  8.2339e-03,  7.6685e-03,  4.5902e-03,  2.1522e-03,
         3.7643e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.2226e-02, -3.6797e-02, -1.2389e-03, -2.1804e-02, -2.1851e-02,
         1.4125e-03, -4.9231e-03, -3.5362e-03, -1.9874e-03, -7.6248e-04,
        -1.1721e-03, -8.5431e-01, -6.5707e-03, -7.7220e-03, -3.6903e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.1260,  0.0387,  0.0029,  0.0140,  0.0196, -0.0018,  0.0059,  0.0037,
         0.0017, -0.0013,  0.0014,  0.7616,  0.0011,  0.0088,  0.0066,  0.0051,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0450, -0.1553, -0.0060, -0.0759, -0.0430,  0.0020, -0.0072, -0.0082,
        -0.0019, -0.0009, -0.0032, -0.0334, -0.5873, -0.0213, -0.0094,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2331, -0.0136, -0.0195, -0.0255, -0.0092, -0.0123, -0.0073, -0.0080,
        -0.0032, -0.0310, -0.0316, -0.0882, -0.4702, -0.0221, -0.0151, -0.0101,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0937, -0.0119, -0.0114, -0.0132, -0.0089, -0.0130, -0.0057, -0.0014,
        -0.0063, -0.0655, -0.0265, -0.6757, -0.0211, -0.0264, -0.0087, -0.0107,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0319, -0.0146, -0.0183, -0.0190, -0.0145, -0.0099, -0.0116, -0.0043,
        -0.0059, -0.0160, -0.0139, -0.7017, -0.0234, -0.0804, -0.0139, -0.0206,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([2.7496e-02, 1.5562e-02, 2.7120e-03, 1.3626e-02, 1.1165e-03, 1.4706e-02,
        1.8853e-03, 1.7527e-03, 1.3892e-02, 1.5232e-03, 1.8730e-04, 1.4587e-03,
        4.1042e-01, 7.7183e-03, 4.1555e-03, 4.3297e-03, 3.0707e-03, 6.5261e-03,
        4.9254e-03, 4.5759e-01, 2.7062e-03, 1.2999e-03, 1.3430e-03, 0.0000e+00,
        0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 8.7064e-03, -2.3787e-02, -2.4238e-03, -1.2926e-02, -1.9359e-03,
        -2.3428e-02, -2.6606e-03, -1.2742e-03, -1.1173e-02, -6.5808e-04,
        -1.5259e-04, -9.2064e-04, -8.0955e-01, -5.2694e-03, -1.9500e-02,
        -1.8823e-03, -5.8107e-02, -5.4331e-03, -5.0210e-03, -1.9406e-03,
        -9.9513e-04, -2.2502e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 5.9327e-02,  2.0018e-02,  2.0786e-03,  1.6226e-02,  1.8264e-03,
         1.1652e-02,  2.3385e-03,  4.4619e-04,  1.3472e-02,  1.2978e-03,
        -4.9086e-04,  1.7477e-03,  2.9358e-01,  5.9007e-03,  2.4217e-03,
         1.8804e-02,  1.0671e-02,  6.3998e-03,  3.9865e-03,  2.4914e-03,
         5.2103e-01,  1.2910e-03,  9.4517e-05,  6.3529e-04,  1.7704e-03],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([0.1282, 0.0323, 0.0028, 0.0086, 0.0026, 0.0039, 0.0141, 0.0038, 0.0023,
        0.0118, 0.0031, 0.0041, 0.0017, 0.0024, 0.0137, 0.0073, 0.0203, 0.7209,
        0.0057, 0.0067, 0.0035, 0.0000, 0.0000, 0.0000, 0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3400: [tensor([ 0.0217, -0.0871, -0.0069, -0.0489, -0.0074, -0.0012, -0.0047, -0.0704,
        -0.0059, -0.0041, -0.0036, -0.0056, -0.0057, -0.0021, -0.0020, -0.2234,
        -0.0082, -0.4651, -0.0078, -0.0139, -0.0043,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.8594e-02, -5.4065e-02, -5.5467e-03, -2.5877e-02, -6.7037e-03,
        -1.4685e-03, -2.1709e-03, -6.6334e-02, -3.6099e-03, -4.0123e-03,
        -2.3554e-03, -5.0229e-03, -6.2384e-03, -2.0853e-03, -4.9309e-04,
        -5.3664e-01, -7.0108e-03, -1.5058e-02, -7.2075e-03, -2.0737e-01,
        -8.5108e-03, -3.6324e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1674, -0.0030, -0.0343, -0.0045, -0.0095, -0.0033, -0.0039, -0.0041,
        -0.0040, -0.0050, -0.0012, -0.0014, -0.0048, -0.0725, -0.0020, -0.0037,
        -0.0003, -0.0040, -0.0395, -0.0059, -0.0703, -0.1018, -0.0018, -0.0070,
        -0.2863, -0.1033, -0.0056, -0.0213, -0.0065, -0.0062, -0.0084, -0.0026,
        -0.0045,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0709, -0.0028, -0.0325, -0.0025, -0.0099, -0.0014, -0.0034, -0.0025,
        -0.0017, -0.0059, -0.0015, -0.0021, -0.0051, -0.2451, -0.0011, -0.0034,
        -0.0012, -0.0021, -0.0529, -0.0051, -0.0552, -0.0758, -0.0047, -0.0071,
        -0.0030, -0.0432, -0.0019, -0.0132, -0.2657, -0.0036, -0.0063, -0.0046,
        -0.0306, -0.0054, -0.0050, -0.0006, -0.0126, -0.0043, -0.0020, -0.0022],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0459, -0.0044, -0.0250, -0.0048, -0.0095, -0.0028, -0.0027, -0.0046,
        -0.0035, -0.0045, -0.0037, -0.0021, -0.0043, -0.0753, -0.0021, -0.0041,
        -0.0011, -0.0029, -0.0364, -0.0059, -0.0069, -0.0508, -0.0080, -0.0135,
        -0.2044, -0.0083, -0.4311, -0.0089, -0.0142, -0.0030, -0.0055,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1638, -0.0188, -0.0143, -0.1105, -0.0095, -0.2496, -0.0061, -0.0114,
        -0.0770, -0.0525, -0.0033, -0.0226, -0.0177, -0.0362, -0.0842, -0.0234,
        -0.0617, -0.0199, -0.0177,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1169, -0.0078, -0.0096, -0.0495, -0.0093, -0.1099, -0.0048, -0.0088,
        -0.0440, -0.0322, -0.0009, -0.0031, -0.0164, -0.0176, -0.0269, -0.0286,
        -0.4421, -0.0041, -0.0079, -0.0260, -0.0215, -0.0042, -0.0081,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.4253e-02, -4.7561e-03, -4.3010e-03, -1.9567e-02, -3.2181e-03,
        -6.9990e-02, -3.2286e-03, -4.2860e-03, -1.9982e-02, -1.3927e-02,
        -4.3709e-04, -5.5751e-03, -8.2408e-03, -1.1574e-02, -1.6576e-02,
        -8.5824e-03, -1.1654e-02, -2.0569e-01, -1.2629e-02, -1.6506e-02,
        -5.0365e-01, -1.1908e-02, -4.4010e-03, -5.0588e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.1120, -0.2471, -0.0086, -0.0065, -0.1073, -0.0040, -0.0061, -0.0091,
        -0.0049, -0.0540, -0.0141, -0.0081, -0.0039, -0.0074, -0.2311, -0.0180,
        -0.0631, -0.0520, -0.0070, -0.0152, -0.0081, -0.0124,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0386, -0.0971, -0.0054, -0.0036, -0.0361, -0.0009, -0.0045, -0.0055,
        -0.0026, -0.0315, -0.0066, -0.0038, -0.0016, -0.0037, -0.1299, -0.0098,
        -0.0060, -0.0124, -0.0101, -0.4761, -0.0064, -0.0570, -0.0422, -0.0043,
        -0.0008, -0.0033,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.1337, -0.1565, -0.0096, -0.0080, -0.0682, -0.0054, -0.0062, -0.0075,
        -0.0035, -0.0821, -0.0118, -0.0062, -0.0021, -0.0048, -0.1249, -0.0187,
        -0.0086, -0.0405, -0.0162, -0.0192, -0.1498, -0.1077,  0.0006, -0.0032,
        -0.0050,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2778, -0.0085, -0.0167, -0.0619, -0.0048, -0.0919, -0.0119, -0.0080,
        -0.1146, -0.0049, -0.0008, -0.0084, -0.0865, -0.0201, -0.0198, -0.0128,
        -0.0121, -0.0167, -0.0136, -0.0294, -0.0341, -0.0252, -0.0574, -0.0208,
        -0.0245, -0.0088, -0.0075,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3450: [tensor([ 0.0669, -0.2369,  0.0009, -0.0387, -0.0085, -0.0059, -0.0150, -0.1768,
        -0.0067, -0.0062, -0.0017, -0.0098, -0.2012, -0.0217, -0.0210, -0.0098,
        -0.1277, -0.0226, -0.0100, -0.0117,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2483, -0.1766, -0.0005, -0.0332, -0.0077, -0.0064, -0.0160, -0.2276,
        -0.0082, -0.0189, -0.0019, -0.0073, -0.0967, -0.0059, -0.0159, -0.0175,
        -0.0114, -0.0289, -0.0260, -0.0182, -0.0181, -0.0074, -0.0015,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.3243e-02, -4.0081e-03, -5.9623e-03, -4.6621e-03, -5.4513e-02,
        -3.1187e-03, -3.7661e-03, -6.8738e-04, -1.4875e-03, -8.9136e-03,
        -1.0083e-02, -1.3578e-02, -8.4685e-03, -7.5075e-01, -4.9074e-03,
        -9.1335e-03, -5.0619e-02, -8.1967e-03, -7.4616e-03, -2.9068e-03,
        -3.5322e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2661, -0.0371, -0.0449, -0.0364, -0.2545, -0.0165, -0.0284, -0.0020,
        -0.0101, -0.0926, -0.0911, -0.0698, -0.0148, -0.0188, -0.0168,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1354, -0.0186, -0.0230, -0.0285, -0.1247, -0.0097, -0.0099, -0.0021,
        -0.0060, -0.0418, -0.0160, -0.3496, -0.0517, -0.0555, -0.0697, -0.0156,
        -0.0136, -0.0147, -0.0138,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-8.8419e-02, -3.7918e-02, -2.3028e-03, -3.9575e-03, -3.0340e-02,
        -2.6189e-03, -3.0143e-03, -8.4069e-03, -1.7127e-02, -2.6739e-04,
        -2.4172e-03, -5.6466e-02, -8.4394e-02, -3.4734e-03, -3.2479e-03,
        -1.5360e-03, -3.9108e-03, -9.7247e-03, -2.6548e-03, -1.3586e-01,
        -8.1705e-04, -2.5340e-02, -2.5595e-04, -3.8590e-03, -2.8923e-03,
         1.1865e-04,  1.6176e-04, -2.1032e-03, -9.4547e-02, -3.9305e-03,
        -1.7217e-03, -9.3907e-02, -2.6643e-01, -1.8613e-03, -4.0062e-03],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0048, -0.1348, -0.0045, -0.0087, -0.0529, -0.0046, -0.0059, -0.0079,
        -0.0229, -0.0014, -0.0045, -0.0646, -0.1886, -0.0059, -0.0058, -0.0016,
        -0.0059, -0.0139, -0.0052, -0.1747, -0.0024, -0.0294, -0.0008, -0.0029,
        -0.0056, -0.0016, -0.0038, -0.0047, -0.1995, -0.0069, -0.0129, -0.0049,
        -0.0055,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-7.7585e-02, -1.4305e-01, -3.4809e-03, -5.7666e-03, -4.8860e-02,
        -3.1814e-03, -6.0093e-03, -8.0760e-03, -2.2049e-02, -1.3628e-03,
        -5.1231e-03, -9.8012e-02, -1.1817e-01, -7.3605e-03, -6.5384e-03,
        -3.4660e-03, -4.7252e-03, -1.9212e-02, -6.1637e-03, -1.0681e-01,
        -3.7289e-03, -4.9309e-02, -1.5181e-04, -3.8705e-03, -5.7470e-03,
        -1.2692e-03, -2.4739e-03, -5.5516e-03, -2.2170e-01, -6.6961e-03,
        -4.5071e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.1741e-01, -3.5690e-03, -1.6450e-02, -5.4258e-02, -1.3875e-03,
        -4.5884e-03, -3.6684e-03, -2.7348e-02, -2.9805e-03, -1.6242e-02,
        -1.1173e-02, -7.0185e-03, -2.5464e-03, -2.8611e-03, -1.4961e-04,
        -2.3759e-03, -7.6329e-04, -7.8409e-03, -2.3560e-03, -1.0088e-03,
        -1.1210e-02, -3.6584e-02, -6.5969e-01, -3.0375e-03, -3.4859e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0108, -0.0064, -0.0505, -0.1733, -0.0036, -0.0055, -0.0058, -0.0667,
        -0.0040, -0.1030, -0.0266, -0.0141, -0.0021, -0.0088, -0.0017, -0.0032,
        -0.0020, -0.0134, -0.0026, -0.0176, -0.1233, -0.3500, -0.0007, -0.0044,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.7201e-02, -3.6278e-03, -1.6332e-02, -2.9590e-02, -1.1892e-03,
        -4.9119e-03, -2.8015e-03, -2.4082e-02, -4.6334e-03, -1.6403e-02,
        -1.4313e-02, -6.4690e-03, -2.7455e-03, -4.9705e-03, -1.1814e-03,
        -4.6433e-04, -1.0924e-03, -8.8061e-03, -1.2264e-03, -1.7616e-03,
        -1.2164e-02, -2.2708e-02, -7.6494e-01, -3.5240e-03, -2.8619e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.1241e-01, -4.7758e-03, -1.3304e-02, -3.7072e-02, -1.2333e-03,
        -4.0700e-03, -3.2414e-03, -2.7652e-02, -2.7880e-03, -1.6708e-02,
        -1.3525e-02, -5.5357e-03, -2.7918e-03, -2.8757e-03, -8.9147e-04,
        -1.7457e-03, -4.9149e-04, -7.9155e-03, -2.3455e-03, -8.4654e-03,
        -2.8304e-02, -1.6499e-02, -6.7821e-01, -3.9275e-03, -3.2166e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3500: [tensor([-0.1647, -0.0156, -0.0272, -0.0452, -0.0130, -0.0103, -0.0142,  0.0010,
        -0.0136, -0.0177, -0.0131, -0.0210, -0.2108, -0.0240, -0.0083, -0.0103,
        -0.0484, -0.0617, -0.0276, -0.1689, -0.0281, -0.0244, -0.0184, -0.0124,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.8110e-02, -4.5209e-03, -3.9730e-03, -9.9314e-03, -3.2092e-03,
        -3.5386e-03, -3.4581e-03, -6.3414e-04, -2.9067e-03, -3.1084e-03,
        -3.8205e-03, -3.5793e-03, -6.6442e-02, -4.3041e-03, -1.7030e-03,
        -2.7512e-03, -9.7331e-03, -8.4120e-03, -6.6282e-03, -1.5797e-02,
        -3.2112e-03, -6.2855e-03, -7.8409e-01, -3.7073e-03, -1.8034e-03,
        -4.3443e-03,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1564, -0.0102, -0.0161, -0.0250, -0.0087, -0.0068, -0.0097, -0.0026,
        -0.0070, -0.0098, -0.0095, -0.0102, -0.2151, -0.0131, -0.0041, -0.0057,
        -0.0232, -0.3659, -0.0355, -0.0228, -0.0133, -0.0089, -0.0123, -0.0080,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0075, -0.0043, -0.0037,  0.0010, -0.0055,  0.0009, -0.0060, -0.0072,
        -0.0381, -0.0111, -0.0046, -0.8355, -0.0068, -0.0025, -0.0029, -0.0092,
        -0.0111, -0.0088, -0.0153, -0.0097, -0.0031, -0.0053,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1988, -0.0027, -0.0021, -0.0035, -0.0031, -0.0014, -0.0058, -0.0069,
        -0.0251, -0.0084, -0.0038, -0.6654, -0.0046, -0.0033, -0.0032, -0.0095,
        -0.0054, -0.0157, -0.0110, -0.0092, -0.0077, -0.0034,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0880, -0.0056, -0.0012, -0.0018, -0.0044, -0.0013, -0.0036, -0.0045,
        -0.0162, -0.0070, -0.0036, -0.6214, -0.0077, -0.0017, -0.0013, -0.0085,
        -0.0042, -0.0111, -0.0516, -0.0090, -0.0147, -0.0127, -0.0201, -0.0101,
        -0.0623, -0.0163, -0.0044, -0.0057], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0499, -0.1459, -0.0066, -0.0203, -0.0104, -0.0227, -0.0008, -0.1067,
        -0.0048, -0.0084, -0.0047, -0.0134, -0.0030, -0.0048, -0.0064, -0.0432,
        -0.0105, -0.4607, -0.0548, -0.0125, -0.0045, -0.0051,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 1.1378e-02, -2.7155e-01, -4.4222e-03, -1.5316e-02, -8.9391e-03,
        -2.2177e-02, -7.5661e-04, -1.1706e-01, -6.8678e-03, -1.0495e-02,
        -8.0551e-03, -9.8488e-03, -4.2577e-03, -5.7157e-03, -2.2677e-01,
        -1.1777e-02, -1.9607e-02, -1.6396e-02, -8.5319e-02, -2.0604e-05,
        -1.1470e-01, -8.9530e-03, -1.9322e-04, -4.4189e-03, -7.9227e-03,
        -7.0860e-03,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0488, -0.1468, -0.0060, -0.0145, -0.0122, -0.0146,  0.0004, -0.0846,
        -0.0057, -0.0075, -0.0040, -0.0109, -0.0012, -0.0055, -0.0107, -0.0712,
        -0.0092, -0.2538, -0.2529, -0.0101, -0.0070, -0.0038, -0.0090, -0.0052,
        -0.0043,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0265, -0.1784, -0.0050, -0.0100, -0.0129, -0.1275, -0.0085, -0.0102,
        -0.0027, -0.0019, -0.1855, -0.0177, -0.2571, -0.0225, -0.0779, -0.0341,
        -0.0064, -0.0152,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1351, -0.1996, -0.0053, -0.0088, -0.0095, -0.0794, -0.0068, -0.0093,
        -0.0022, -0.0060, -0.1599, -0.0110, -0.1302, -0.0190, -0.1926, -0.0093,
        -0.0051, -0.0108,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0544, -0.0534, -0.0032, -0.0046, -0.0045, -0.0381, -0.0045, -0.0058,
        -0.0009, -0.0010, -0.0311, -0.0062, -0.0594, -0.0102, -0.0333, -0.0046,
        -0.0081, -0.6622, -0.0073, -0.0022, -0.0050,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #3550: [tensor([-0.0026, -0.0232, -0.0040, -0.0302, -0.0158, -0.0067, -0.0037, -0.0067,
        -0.0079, -0.0021, -0.0018, -0.0683, -0.0014, -0.0014, -0.0020, -0.0768,
        -0.0078, -0.3631, -0.0043, -0.0090, -0.3421, -0.0046, -0.0061, -0.0036,
        -0.0046,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0301, -0.0464, -0.0028, -0.0505, -0.0301, -0.0067, -0.0044, -0.0079,
        -0.0092, -0.0056, -0.0029, -0.0861, -0.0039, -0.0013, -0.0026, -0.1207,
        -0.0079, -0.4557, -0.0084, -0.0187, -0.0115, -0.0085, -0.0455, -0.0124,
        -0.0025, -0.0086, -0.0055, -0.0036,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1745, -0.0068, -0.0019, -0.0189, -0.0281, -0.2200, -0.0075, -0.0046,
        -0.0025, -0.0046, -0.0057, -0.0105, -0.0018, -0.1821, -0.0139, -0.1115,
        -0.0154, -0.0332, -0.0110, -0.1347, -0.0059, -0.0047,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2067, -0.0130,  0.0007, -0.0168, -0.0550, -0.1454, -0.0079, -0.0030,
        -0.0011, -0.0070, -0.0095, -0.0252, -0.0047, -0.2675, -0.0143, -0.1490,
        -0.0197, -0.0079, -0.0231, -0.0036, -0.0145, -0.0042,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1456, -0.0037, -0.0010, -0.0103, -0.0431, -0.0822, -0.0064, -0.0051,
        -0.0035, -0.0034, -0.0044, -0.0091, -0.0044, -0.4420, -0.0135, -0.1543,
        -0.0197, -0.0090, -0.0120, -0.0096, -0.0077, -0.0102,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-8.2853e-02, -7.6124e-02, -5.0662e-03, -3.5744e-02, -4.3760e-03,
        -2.0823e-03, -5.0059e-03, -4.8570e-02, -8.0462e-03, -3.1312e-03,
        -2.9801e-03, -3.7647e-03, -1.8829e-03, -2.8257e-02, -1.4001e-03,
         9.7908e-05, -2.7059e-03, -5.1199e-01, -7.6874e-03, -7.1011e-03,
        -5.9669e-03, -7.3692e-03, -3.7583e-03, -5.3801e-02, -4.2089e-03,
        -4.1247e-03, -1.0765e-02, -8.8663e-03, -4.0057e-02, -7.2609e-03,
        -3.7537e-03, -4.8824e-03, -2.9356e-03, -3.3867e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0113, -0.2021, -0.0095, -0.0772, -0.0047, -0.0038, -0.0071, -0.1241,
        -0.0114, -0.0056, -0.0034, -0.0075, -0.0028, -0.0507, -0.0015, -0.0009,
        -0.0027, -0.3428, -0.0106, -0.0097, -0.0096, -0.0870, -0.0040, -0.0037,
        -0.0063,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.5852e-02, -3.6875e-02, -5.7629e-03, -3.0308e-02, -3.9619e-03,
        -3.9045e-03, -5.1144e-03, -3.7052e-02, -8.6678e-03, -3.6409e-03,
        -6.0010e-03, -2.9935e-03, -3.2456e-03, -2.8501e-02, -2.5777e-04,
         1.5066e-04, -4.2001e-03, -2.4972e-01, -1.2011e-02, -1.4732e-02,
        -7.2134e-03, -7.0340e-03, -4.7791e-01, -6.3086e-03, -3.5886e-03,
        -4.9964e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0172, -0.0187, -0.0027, -0.0188, -0.0033, -0.0023, -0.0146, -0.0036,
        -0.0027,  0.0009, -0.0019, -0.8675, -0.0087, -0.0091, -0.0075, -0.0035,
        -0.0082, -0.0038, -0.0051,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0585, -0.0128, -0.0033, -0.0126, -0.0019, -0.0008, -0.0109, -0.0027,
        -0.0016,  0.0005, -0.0011, -0.0436, -0.0067, -0.0188, -0.0036, -0.0086,
        -0.0062, -0.3154, -0.0059, -0.0100, -0.0037, -0.0020, -0.4593, -0.0032,
        -0.0006, -0.0023, -0.0005, -0.0029,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.9173e-02, -1.8054e-02, -3.2036e-03, -1.7881e-02, -1.9621e-03,
        -1.3530e-03, -1.1896e-02, -4.6451e-03, -1.3816e-03,  2.9272e-04,
        -5.7329e-04, -8.1123e-01, -5.6643e-03, -6.0869e-02, -6.2449e-03,
        -4.8023e-03, -5.3214e-03, -5.0467e-03, -4.8410e-03, -2.0797e-03,
        -3.4828e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0513, -0.0906, -0.0121, -0.0006, -0.0028, -0.0386, -0.0043, -0.0023,
        -0.0045, -0.0019, -0.0065, -0.5744, -0.0074, -0.1750, -0.0118, -0.0070,
        -0.0091,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3600: [tensor([-0.0510, -0.0262, -0.0046, -0.0024, -0.0134, -0.0029, -0.0124, -0.0043,
        -0.0034, -0.0033, -0.0042, -0.0054, -0.0261, -0.0017,  0.0013, -0.0024,
        -0.0076, -0.0051, -0.0072, -0.0071, -0.0043, -0.0060, -0.7739, -0.0050,
        -0.0046, -0.0062, -0.0040, -0.0040,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.0751e-01, -5.4779e-01, -8.9312e-03, -4.2977e-03, -2.5113e-02,
        -7.2894e-03, -2.4238e-02, -7.7522e-03, -2.5515e-03, -5.3201e-03,
        -6.7692e-03, -1.1916e-02, -1.6483e-01, -3.7493e-03, -5.1138e-04,
        -4.3017e-03, -9.7957e-03, -1.4196e-02, -1.0368e-02, -2.6657e-02,
        -6.1187e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0382, -0.0345, -0.0017, -0.0151, -0.0145, -0.0014, -0.0036, -0.0024,
        -0.0033, -0.0013, -0.0015, -0.0015, -0.0024, -0.2172, -0.0050, -0.0363,
        -0.0059, -0.5859, -0.0063, -0.0060, -0.0058, -0.0051, -0.0020, -0.0030,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0054, -0.0651, -0.0014, -0.0248, -0.0222, -0.0017, -0.0032, -0.0030,
        -0.0036, -0.0012, -0.0018, -0.0019, -0.0025, -0.4422, -0.0043, -0.0586,
        -0.0086, -0.0039, -0.0086, -0.3185, -0.0036, -0.0073, -0.0034, -0.0031,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.2145e-02, -2.6361e-02, -6.7426e-04, -1.4690e-02, -1.5817e-02,
        -1.2518e-03, -2.3262e-03, -3.3724e-03, -2.2393e-03, -2.4244e-03,
        -1.3995e-03,  7.1751e-06, -1.7168e-03, -2.5209e-01, -4.3501e-03,
        -3.8576e-02, -4.4950e-03, -5.6108e-01, -4.8090e-03, -6.9988e-03,
        -3.7008e-03, -5.7844e-03, -7.2749e-04, -2.9618e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.2228, -0.2254, -0.0067, -0.0142, -0.0528, -0.2643, -0.0077, -0.0093,
        -0.0155, -0.0063, -0.0084, -0.0180, -0.0101, -0.0080, -0.0112, -0.0157,
        -0.0173, -0.0196, -0.0092, -0.0134, -0.0246, -0.0100, -0.0098,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.9328e-02, -3.2357e-02, -2.7487e-03, -2.7452e-03, -9.2890e-03,
        -3.4352e-02, -1.2790e-03, -4.0841e-03, -4.7944e-03, -1.2270e-03,
        -1.7174e-03, -2.0922e-03, -1.5992e-04, -2.1245e-03, -2.9758e-02,
        -4.4838e-03, -6.8526e-03, -6.6857e-03, -5.7423e-03, -3.0610e-03,
        -4.2044e-03, -2.9320e-03, -1.5114e-02, -6.0369e-03, -7.4006e-01,
        -1.0659e-02, -2.9450e-03, -3.1692e-03,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0355, -0.1254, -0.0035, -0.0036, -0.0207, -0.0669, -0.0041, -0.0059,
        -0.0073, -0.0037, -0.0029, -0.0049, -0.0008, -0.0015, -0.1559, -0.0065,
        -0.0105, -0.0116, -0.5117, -0.0091, -0.0034, -0.0047,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.9700e-02, -4.6304e-02, -1.1743e-03, -3.4556e-03, -4.8306e-04,
        -1.4255e-03, -1.1912e-02, -4.6849e-02, -3.2458e-03, -2.1344e-03,
        -1.2067e-02, -9.6457e-03, -2.6153e-03, -1.4994e-03, -2.8452e-03,
        -6.3110e-03, -4.1778e-03, -1.4133e-03, -1.4726e-03, -3.5407e-01,
        -4.1835e-03, -4.2991e-02, -6.6190e-03, -6.5621e-03, -6.3397e-03,
        -3.6196e-01, -3.4444e-02,  2.8380e-05, -4.0688e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 3.9089e-03, -5.4996e-02, -4.0073e-04, -2.8610e-03, -1.6613e-03,
        -2.0791e-03, -2.1268e-02, -5.6651e-02, -5.9712e-03, -3.8293e-03,
        -1.5148e-02, -1.4347e-02, -2.5065e-03, -1.0142e-03, -4.1503e-03,
        -9.8334e-03, -5.6746e-03, -4.4574e-04, -3.3530e-03, -4.4990e-01,
        -5.2531e-03, -7.5759e-02, -3.4365e-03, -7.6695e-03, -2.3498e-01,
        -4.6703e-03, -3.4542e-03, -4.7776e-03,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.1131e-02, -7.2692e-02,  2.5460e-04, -2.2728e-03, -4.0487e-05,
        -2.6213e-03, -1.2587e-02, -4.2460e-02, -4.7240e-03, -2.0974e-03,
        -1.4117e-02, -1.3531e-02, -1.2847e-03, -2.0010e-03, -3.2499e-03,
        -1.0234e-02, -5.2743e-03, -1.7012e-03, -1.9430e-03, -6.6621e-01,
        -6.1353e-03, -5.8702e-02, -4.6356e-03, -4.4505e-03, -1.9259e-03,
        -3.7234e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0851, -0.0041, -0.0287, -0.0053, -0.0019, -0.0012, -0.0031, -0.0057,
        -0.0029, -0.0068, -0.0038, -0.0051, -0.0077, -0.0009, -0.0013, -0.5704,
        -0.0064, -0.0171, -0.2043, -0.0086, -0.0107, -0.0113, -0.0030, -0.0045,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #3650: [tensor([-1.3591e-01, -2.2226e-01, -4.3875e-03, -5.0733e-03, -2.4359e-03,
        -6.6250e-03, -7.7859e-03, -9.3677e-04, -3.1365e-03, -9.4966e-03,
        -6.3841e-03, -1.9600e-02, -3.7202e-03,  6.2472e-05, -2.3651e-03,
        -3.1319e-01, -9.5030e-03, -1.9738e-01, -9.9450e-03, -1.7656e-02,
        -3.0759e-03, -5.5206e-03, -7.6700e-03, -5.8862e-03,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0306, -0.1108, -0.0057, -0.0646, -0.0016, -0.0726, -0.0038, -0.0134,
        -0.0048, -0.0045, -0.0069, -0.0049, -0.0042, -0.0026, -0.0006, -0.6034,
        -0.0078, -0.0364, -0.0097, -0.0066, -0.0045,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0128, -0.1029, -0.0055, -0.0430, -0.0034, -0.0648, -0.0039, -0.0107,
        -0.0038, -0.0059, -0.0057, -0.0043, -0.0069, -0.0008, -0.0013, -0.3847,
        -0.0086, -0.0219, -0.2876, -0.0125, -0.0046, -0.0044,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0188, -0.1506, -0.0047, -0.0293, -0.0035, -0.0785, -0.0049, -0.0108,
        -0.0043, -0.0022, -0.0050, -0.0076, -0.0025, -0.0012, -0.0025, -0.2283,
        -0.0065, -0.2228, -0.0128, -0.1911, -0.0044, -0.0044, -0.0033,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2806, -0.0032, -0.0025, -0.3722, -0.0108, -0.0125, -0.0178, -0.0210,
        -0.0080, -0.0099, -0.1003, -0.0591, -0.0140, -0.0158, -0.0162, -0.0119,
        -0.0126, -0.0158, -0.0157,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1721, -0.0026,  0.0009, -0.3592, -0.0093, -0.0155, -0.0117, -0.0141,
        -0.0037, -0.0068, -0.0716, -0.0658, -0.0134, -0.1485, -0.0049, -0.0074,
        -0.0180, -0.0346, -0.0152, -0.0116, -0.0130,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.8269e-01,  3.1863e-05, -1.4458e-03, -3.6486e-01, -3.9669e-03,
        -6.5787e-03, -6.4524e-03, -9.2373e-03, -2.2327e-03, -1.9982e-03,
        -4.9158e-02, -3.7561e-02, -5.7203e-03, -1.0619e-02, -2.4202e-01,
        -2.1165e-02, -1.1057e-02, -2.2396e-02, -9.6779e-03, -5.4942e-03,
        -5.6366e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2347, -0.0280, -0.0138, -0.1781, -0.0305, -0.0108, -0.0152, -0.0053,
        -0.1996, -0.0363, -0.0049, -0.0110, -0.0085, -0.0568, -0.0279, -0.0343,
        -0.0259, -0.0650, -0.0132,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0760, -0.0112, -0.0063, -0.0378, -0.0042, -0.0033, -0.0041, -0.0030,
        -0.0520, -0.0088, -0.0032, -0.0018, -0.0036, -0.0250, -0.0079, -0.0642,
        -0.0105, -0.0071, -0.0141, -0.0085, -0.5890, -0.0130, -0.0317, -0.0091,
        -0.0046], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.2063e-02, -7.2369e-03, -4.2252e-03, -1.8342e-02, -4.5989e-03,
        -2.6956e-03, -2.3233e-03, -1.8977e-03, -2.4527e-02, -7.9474e-03,
        -2.3454e-03, -3.9611e-04, -1.8411e-03, -1.1099e-02, -7.1941e-03,
        -1.7042e-02, -5.6748e-03, -8.1418e-01, -6.4504e-03, -9.8415e-03,
        -3.1990e-03, -4.8833e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0389, -0.0107, -0.0017, -0.0403, -0.0077, -0.0045, -0.0061, -0.0682,
        -0.0053, -0.0038, -0.0092, -0.0082, -0.0358, -0.0079, -0.0076, -0.7119,
        -0.0072, -0.0147, -0.0044, -0.0060,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0566, -0.0062, -0.0021, -0.0167, -0.0049, -0.0024, -0.0049, -0.0286,
        -0.0056, -0.0031, -0.0070, -0.0031, -0.0052, -0.0571, -0.0075, -0.0051,
        -0.0075, -0.7513, -0.0072, -0.0075, -0.0049, -0.0017, -0.0038,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3700: [tensor([-0.1802, -0.2094, -0.0171, -0.0340, -0.0029, -0.0181, -0.3074, -0.0384,
        -0.0511, -0.0183, -0.0570, -0.0218, -0.0443,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2010, -0.1397, -0.0234, -0.0243, -0.0181, -0.0062, -0.1486, -0.0228,
        -0.0545, -0.0732, -0.0364, -0.0336, -0.0540, -0.0378, -0.0337, -0.0699,
        -0.0229,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1101, -0.2120, -0.0170, -0.0378, -0.0187, -0.0202, -0.0590, -0.3255,
        -0.0302, -0.1436, -0.0259,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0157, -0.1052, -0.0139, -0.0191, -0.0150, -0.0075, -0.1234, -0.0253,
        -0.0205, -0.0416, -0.0123, -0.0347, -0.0380, -0.4971, -0.0162, -0.0144,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1894, -0.1350, -0.0101, -0.0335, -0.0125, -0.0141, -0.1775, -0.0306,
        -0.0308, -0.0278, -0.0174, -0.1835, -0.0978, -0.0400,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0592, -0.2755, -0.0213, -0.0383, -0.0227, -0.0243, -0.2576, -0.0365,
        -0.1441, -0.0412, -0.0451, -0.0341,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1881, -0.2298, -0.0217, -0.0236, -0.0120, -0.0212, -0.1687, -0.0243,
        -0.2609, -0.0222, -0.0274,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1264, -0.2461, -0.0159, -0.0389, -0.0322, -0.0168, -0.2915, -0.0554,
        -0.0854, -0.0295, -0.0281, -0.0336,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1602, -0.1318, -0.0175, -0.0209, -0.0128, -0.0087, -0.2073, -0.0356,
        -0.0191, -0.0601, -0.0177, -0.0451, -0.0704, -0.1592, -0.0168, -0.0167,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.1136e-01, -9.0502e-02, -1.3786e-03, -1.9028e-03, -5.1572e-03,
        -2.1822e-03, -1.1015e-02, -1.4689e-02, -2.5146e-03, -7.2575e-03,
        -2.0851e-02, -2.5348e-03, -3.7454e-03, -2.0453e-03, -2.1313e-03,
        -2.4706e-03,  3.4841e-04, -2.0085e-03, -4.6669e-02, -8.7700e-04,
        -1.8726e-03, -1.3354e-03,  2.1965e-04, -1.9105e-03, -1.3646e-03,
        -1.8236e-03, -2.2311e-03, -2.0444e-03,  4.7000e-06, -3.5861e-03,
        -3.3241e-03, -4.2016e-03, -9.2359e-04, -8.4073e-04, -5.0126e-01,
        -4.8996e-03, -9.0979e-02, -1.1754e-02, -9.9051e-03, -2.6554e-03,
        -6.6237e-03, -6.5192e-03, -4.3931e-03, -3.6850e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0734, -0.2006, -0.0022, -0.0031, -0.0058, -0.0023, -0.0211, -0.0253,
        -0.0032, -0.0120, -0.0307, -0.0018, -0.0047, -0.0021, -0.0025, -0.0081,
         0.0006, -0.0028, -0.0740,  0.0004, -0.0027, -0.0005, -0.0013, -0.0026,
        -0.0017, -0.0025, -0.0007, -0.0046,  0.0009, -0.0052, -0.0074, -0.0064,
        -0.0018, -0.0013, -0.0318, -0.0117, -0.1831, -0.0078, -0.0107, -0.0146,
        -0.1928, -0.0121, -0.0075, -0.0074, -0.0041,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.3507e-02, -4.5885e-02, -2.7417e-04, -1.6958e-03, -3.0215e-03,
        -2.4231e-03, -1.2190e-02, -1.3521e-02, -2.6133e-03, -1.1333e-02,
        -1.7404e-02, -1.7370e-03, -6.0139e-03, -2.9414e-03, -2.1266e-03,
        -4.5463e-03,  1.3186e-04, -1.9894e-03, -3.9532e-02, -3.7421e-04,
        -1.2710e-03, -8.3248e-04,  4.3044e-04, -1.4331e-03, -9.5244e-04,
        -1.4238e-03,  2.9461e-04, -2.9110e-03,  1.3273e-04, -2.5374e-03,
        -1.6900e-03, -3.1364e-03, -7.3466e-04, -1.0970e-03, -8.4234e-02,
        -9.6086e-03, -4.8778e-03, -1.2891e-02, -6.0036e-01, -5.9801e-03,
        -1.2823e-02, -3.9546e-03, -5.2946e-03, -5.5850e-03, -6.0228e-03,
        -2.6398e-03, -3.5863e-03], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3750: [tensor([-7.8884e-02, -4.2688e-03, -5.4903e-03, -7.8467e-03, -2.8379e-03,
        -9.1512e-03, -3.4791e-02, -6.7510e-03, -2.6958e-04, -2.3792e-03,
        -1.1535e-02, -2.4955e-01, -5.3524e-01, -8.6693e-03, -1.2655e-02,
        -7.7876e-03, -8.1470e-03, -5.9806e-03, -7.7631e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.5040e-04, -6.9700e-02, -3.2005e-03, -1.3786e-02, -2.9042e-02,
        -1.9443e-03, -1.8844e-03,  6.6675e-04, -2.5992e-03, -3.3943e-03,
        -6.5035e-03, -4.7599e-01, -1.3485e-03, -8.6516e-03, -2.7719e-03,
        -2.0343e-03, -1.1087e-03, -2.2707e-03, -6.4191e-02, -5.6164e-03,
        -7.1698e-02, -1.3469e-02, -4.7930e-03, -4.5321e-03, -1.9820e-01,
        -2.7684e-03, -3.5590e-03, -3.9318e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.3882e-02, -1.1225e-01, -2.0251e-03, -3.2708e-02, -6.2564e-02,
        -2.8435e-03, -2.6508e-03,  3.9783e-04, -4.7942e-03, -3.4174e-03,
        -8.6330e-03, -4.1828e-01, -2.4622e-03, -1.0796e-02, -4.8078e-03,
        -5.3177e-03, -9.9001e-04, -4.8443e-03, -1.4137e-01, -8.1306e-03,
        -1.1322e-01, -9.8070e-03, -2.8799e-03, -4.1233e-03, -6.7969e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.5777e-02, -7.3513e-02, -1.0290e-03, -2.1605e-02, -3.2420e-02,
        -2.2441e-03, -2.2710e-03, -1.4189e-04, -2.6474e-03, -1.9010e-03,
        -5.3089e-03, -4.8741e-01, -2.1465e-03, -1.0839e-02, -4.1021e-03,
        -1.8947e-03, -4.7439e-04, -2.3042e-03, -1.6786e-01, -5.1303e-03,
        -7.3529e-02, -6.0702e-03, -2.1061e-02, -3.6036e-03, -7.2898e-04,
        -3.9815e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-8.1931e-02, -2.9531e-02, -2.2527e-03, -1.7564e-02, -1.9559e-02,
        -3.3046e-03, -2.6042e-03, -2.7091e-03, -1.5529e-02, -1.4471e-03,
         5.5497e-04, -3.2072e-03, -3.8817e-03, -5.0380e-04, -6.3292e-03,
        -1.1864e-02, -2.8814e-03, -6.3170e-04, -7.9827e-04, -1.4728e-01,
        -4.3470e-03, -8.6538e-03, -4.4081e-03, -6.7364e-03, -1.5363e-03,
        -2.3082e-02, -5.8293e-01, -5.7000e-03, -3.7420e-03, -1.3718e-03,
        -3.1323e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.4985e-02, -1.2049e-01, -2.8666e-03, -3.1374e-02, -5.1020e-02,
        -8.2190e-03, -3.5893e-03, -4.1006e-03, -6.2422e-02, -2.6691e-03,
         1.9595e-04, -5.5299e-03, -6.2349e-03, -1.4123e-03, -1.6118e-02,
        -2.6272e-02, -3.3509e-03, -2.1762e-03, -3.3649e-03, -7.8039e-02,
        -4.6755e-03, -7.9036e-02, -1.2945e-02, -4.4687e-01, -1.5132e-03,
        -5.6004e-03, -4.9263e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 3.4868e-04, -3.4120e-02, -2.4916e-03, -2.5168e-02, -3.3956e-02,
        -5.2206e-03, -2.5266e-03, -5.4326e-03, -2.4623e-02, -2.3638e-03,
         8.1146e-04, -3.1023e-03, -4.4418e-03, -1.1689e-03, -1.3635e-02,
        -2.7065e-02, -2.8096e-03, -1.7097e-03, -2.5984e-03, -2.8823e-01,
        -3.6424e-03, -5.4382e-03, -1.1907e-02, -4.7262e-01, -1.2565e-02,
        -4.3195e-03, -4.8694e-03, -2.8137e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.0736e-02, -3.9935e-02, -4.8047e-04, -3.7060e-03, -3.3306e-03,
        -3.3585e-02, -3.1436e-03, -1.7489e-03, -2.1085e-03, -4.3495e-03,
        -3.4260e-03, -1.4125e-03, -2.0093e-03, -3.6626e-03, -1.1490e-03,
        -5.6417e-04, -1.4366e-02, -3.4990e-02, -1.8405e-03,  1.5311e-04,
        -6.1507e-04, -2.1856e-01, -1.9021e-03, -2.0119e-03, -9.9863e-03,
        -2.8207e-01, -1.1599e-03, -4.0205e-03, -5.6211e-03, -5.4920e-03,
        -5.2954e-03, -3.6129e-03, -4.4171e-03, -7.9361e-03, -1.5173e-01,
        -9.1124e-02, -1.9936e-03, -1.9286e-03, -3.8302e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 4.9812e-02, -4.9334e-02, -8.5108e-04, -1.9829e-03, -2.6479e-03,
        -3.8372e-02, -2.0133e-03, -1.4132e-03, -3.4977e-03, -3.8266e-03,
        -3.0639e-03, -1.5909e-03, -2.2327e-03, -4.0698e-03, -1.0668e-03,
        -1.5376e-03, -1.4749e-02, -3.0914e-02, -2.7931e-03, -1.2120e-04,
        -1.9776e-03, -3.5483e-01, -2.2927e-03, -2.5942e-03, -3.3817e-03,
        -1.4316e-01, -8.8995e-03, -4.2191e-03, -5.9775e-03, -5.1123e-03,
        -6.1634e-03, -2.8739e-03, -4.1605e-03, -9.4872e-03, -3.0787e-03,
        -3.7086e-03, -9.0026e-02, -2.9925e-02, -4.2096e-03, -3.8216e-03,
        -8.5386e-02, -6.4245e-04, -4.0312e-03, -4.1571e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-9.4135e-02, -9.7677e-02, -1.2844e-03, -2.8161e-03, -3.4163e-03,
        -9.4200e-02, -4.0647e-03, -1.9336e-03, -4.2440e-03, -6.2404e-03,
        -5.0479e-03, -2.9495e-03, -2.1093e-03, -4.2449e-03, -9.0471e-04,
        -2.1974e-03, -2.6668e-02, -3.8888e-02, -2.3961e-03, -3.0914e-04,
        -1.8357e-03, -3.9801e-01, -6.3805e-03, -7.4680e-02, -3.1715e-02,
        -8.7685e-03, -2.1312e-03, -8.4861e-03, -7.4730e-03, -1.0708e-02,
        -9.1459e-03, -4.2251e-03, -1.6196e-02, -1.5990e-02, -4.0774e-03,
        -4.4499e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.8341e-02, -2.1189e-02, -2.2248e-03, -1.3632e-02, -1.6261e-03,
        -4.3565e-04, -4.5567e-03, -1.9887e-04, -2.8751e-03, -1.9405e-03,
        -3.2612e-03, -1.1041e-02, -2.1846e-02, -6.4337e-03, -2.2482e-03,
         7.1543e-04, -3.1598e-03, -4.1619e-01, -6.0645e-03, -2.3797e-02,
        -4.2417e-03, -1.7918e-02, -3.6236e-01, -6.2491e-03, -3.3200e-03,
        -1.8733e-03, -2.2627e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.1058e-02, -3.6687e-02, -3.2879e-03, -1.6594e-02, -2.8443e-03,
        -1.1647e-03, -4.6775e-03, -6.8154e-04, -2.8674e-03, -2.3172e-03,
        -2.6890e-03, -1.7475e-02, -3.6436e-02, -5.8750e-03, -2.0372e-03,
        -1.2870e-06, -6.4997e-04, -6.2437e-01, -6.2436e-03, -2.2413e-02,
        -5.1368e-03, -1.0721e-01, -2.2724e-02, -4.4854e-03, -3.6377e-03,
        -2.9952e-03, -8.4241e-04, -2.5996e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #3800: [tensor([-4.1749e-02, -1.4959e-01, -1.3323e-03, -3.7905e-03, -2.2279e-03,
        -1.7838e-02, -3.6725e-03, -4.5483e-03, -3.9040e-03, -1.7047e-01,
        -4.2380e-03, -2.0677e-03, -5.0609e-03, -1.1853e-01, -6.1023e-03,
        -3.6583e-03, -1.3084e-03, -8.7110e-03, -4.3960e-03, -2.7023e-03,
        -2.1078e-03,  2.1235e-04, -2.0601e-03, -2.7956e-01, -1.0924e-02,
        -1.2167e-01, -9.0515e-03, -4.3286e-03, -3.7848e-03, -4.5919e-03,
        -5.8057e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-2.2845e-02, -1.5946e-02, -8.2328e-04, -3.3215e-03, -1.5189e-03,
        -9.4202e-03, -1.7593e-03, -1.7196e-03, -2.9395e-03, -3.4777e-02,
        -2.0714e-03, -4.7183e-04, -2.4988e-03, -2.9796e-02, -5.0356e-03,
        -2.5555e-03, -1.5656e-03, -6.4235e-03, -1.4388e-03, -1.5161e-03,
        -1.2653e-03, -4.7491e-05, -1.0708e-03, -1.9158e-01, -2.7542e-03,
        -4.4184e-02, -1.7586e-03, -4.7884e-03, -5.9491e-01, -4.1754e-03,
        -2.3771e-03, -2.6526e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0429, -0.0728, -0.0010, -0.0034, -0.0015, -0.0233, -0.0027, -0.0027,
        -0.0056, -0.4044, -0.0047, -0.0019, -0.0044, -0.1538, -0.0056, -0.0057,
        -0.0021, -0.0080, -0.0054, -0.0031, -0.0068, -0.0007, -0.0010, -0.0500,
        -0.0069, -0.1605, -0.0102, -0.0029, -0.0060,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0143, -0.1326, -0.0024, -0.0071, -0.0019, -0.0371, -0.0021, -0.0043,
        -0.0058, -0.2746, -0.0063, -0.0045, -0.0051, -0.1744, -0.0070, -0.0050,
        -0.0031, -0.0138, -0.0025, -0.0050, -0.0101, -0.0015, -0.0024, -0.2463,
        -0.0101, -0.0077, -0.0034, -0.0031, -0.0066,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.9101e-02, -3.9118e-02, -1.7002e-03, -3.2055e-03, -1.7974e-03,
        -1.9048e-02, -3.2093e-03, -3.2498e-03, -4.5551e-03, -2.3531e-01,
        -3.0919e-03, -1.8953e-03, -2.9793e-03, -1.2900e-01, -5.0271e-03,
        -3.5305e-03, -1.3495e-03, -8.2081e-03, -2.4457e-03, -2.2155e-03,
        -2.7688e-03,  2.4868e-04,  5.1748e-04, -2.5374e-01, -5.7721e-03,
        -3.4528e-03, -1.5402e-02, -6.0721e-03, -4.1637e-03, -1.6460e-01,
        -5.6476e-03, -7.0243e-03, -7.2034e-03, -3.3459e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.7094e-02, -2.4262e-02, -7.0505e-04, -1.8725e-03, -1.7472e-03,
        -1.4275e-02, -2.0946e-03, -1.9038e-03, -2.5034e-03, -1.1367e-01,
        -3.1796e-03, -1.3587e-03, -4.4539e-03, -5.6369e-02, -3.5545e-03,
        -2.8197e-03, -1.7986e-03, -7.0005e-03, -1.8555e-03, -2.2062e-03,
        -2.9565e-03, -1.1263e-04, -1.4515e-03, -4.7655e-01, -2.8955e-03,
        -5.1606e-03, -5.0645e-03, -2.2542e-01, -3.8554e-03, -7.2145e-03,
        -2.8116e-03, -1.7759e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 2.5330e-02, -4.9179e-02, -1.3503e-03, -3.0196e-03, -2.0023e-03,
        -1.8353e-02, -1.3626e-03, -3.3612e-03, -4.2831e-03, -5.6187e-01,
        -3.4751e-03, -2.4974e-03, -4.0121e-03, -8.2593e-02, -3.4669e-03,
        -2.1453e-03, -2.0908e-03, -6.1911e-03, -2.9963e-03, -1.7505e-03,
        -5.5137e-03,  2.7261e-04, -6.4108e-04, -1.1535e-01, -7.8188e-03,
        -6.1691e-03, -4.0430e-03, -5.4856e-02, -7.1119e-03, -1.3232e-02,
        -3.6703e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0013, -0.0434, -0.0009, -0.0030, -0.0012, -0.0095, -0.0019, -0.0026,
        -0.0028, -0.0787, -0.0035, -0.0017, -0.0021, -0.0612, -0.0037, -0.0024,
        -0.0018, -0.0056, -0.0025, -0.0021, -0.0018, -0.0013,  0.0010, -0.1341,
        -0.0036, -0.0041, -0.3339, -0.0043, -0.0598, -0.0037, -0.0062, -0.1559,
        -0.0056, -0.0039, -0.0055, -0.0071, -0.0294, -0.0041, -0.0028],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 3.6106e-02, -5.4728e-02, -2.3091e-03, -3.2769e-03, -1.8735e-03,
        -1.6780e-02, -2.1024e-03, -2.5753e-03, -4.1984e-03, -2.6934e-01,
        -4.3506e-03,  1.5461e-04, -3.7056e-03, -9.5892e-02, -4.2317e-03,
        -3.8681e-03, -1.4169e-03, -8.9184e-03, -2.7958e-03, -2.9564e-03,
        -3.9376e-03,  5.4929e-04, -1.2544e-04, -2.4610e-01, -4.7924e-03,
        -7.5955e-02, -8.3996e-03, -1.1910e-01, -9.7599e-03, -5.2471e-03,
        -2.3129e-03, -2.1495e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.1104e-02, -2.7359e-02, -5.4309e-04, -1.9589e-03, -1.0019e-03,
        -9.8977e-03, -1.5225e-03, -1.9382e-03, -2.7623e-03, -5.7011e-01,
        -2.6779e-03, -1.3294e-03, -2.0424e-03, -5.7239e-02, -2.8951e-03,
        -2.1666e-03, -1.0363e-03, -3.1401e-03, -1.3532e-03, -1.3881e-03,
        -2.1627e-03, -1.7984e-04, -3.1858e-04, -1.5632e-01, -3.3316e-03,
        -3.2121e-03, -1.2275e-02, -3.2370e-03, -5.8888e-03, -3.2816e-03,
        -3.2211e-03, -2.9811e-03, -2.5396e-02, -6.3753e-03, -2.9055e-03,
        -5.8523e-03, -6.9283e-03, -2.6629e-03,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0146, -0.1494, -0.0010, -0.0051, -0.0023, -0.0321, -0.0050, -0.0065,
        -0.0056, -0.1940, -0.0062, -0.0036, -0.0061, -0.1200, -0.0067, -0.0045,
        -0.0023, -0.0121, -0.0065, -0.0032, -0.0055, -0.0012, -0.0030, -0.0923,
        -0.0142, -0.2847, -0.0030, -0.0035, -0.0059,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.5220e-02, -2.4252e-02, -7.4415e-04, -1.5631e-03, -1.5265e-03,
        -8.9644e-03, -1.1672e-03, -1.8798e-03, -1.8121e-03, -2.2156e-01,
        -2.4913e-03, -9.0582e-04, -1.4000e-03, -2.5584e-02, -4.2552e-03,
        -1.9357e-03, -1.3431e-03, -5.2271e-03, -1.3804e-03, -9.5609e-04,
        -8.0711e-04,  6.3918e-04, -6.7149e-05, -6.3013e-02, -1.7375e-03,
        -5.8914e-02, -2.1641e-03, -3.4662e-01, -4.0160e-03, -4.0094e-03,
        -4.9673e-03, -1.5337e-01, -4.0291e-03, -1.4872e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #3850: [tensor([-2.4464e-01, -2.5169e-02, -1.3309e-02, -1.6827e-02, -1.3627e-02,
        -3.3676e-02, -8.5328e-03,  1.5342e-04, -1.3922e-02, -9.6816e-03,
        -5.7118e-03, -2.1977e-02, -1.7915e-02, -4.7762e-01, -2.2052e-02,
        -4.4995e-02, -1.1462e-02, -1.8727e-02,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2625, -0.0514, -0.0265, -0.0273, -0.0368, -0.0521, -0.0153,  0.0021,
        -0.0332, -0.0085, -0.0133, -0.0997, -0.1758, -0.0443, -0.1053, -0.0156,
        -0.0303,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0300, -0.0272, -0.0136, -0.0213, -0.0191, -0.0373, -0.0074,  0.0036,
        -0.0104, -0.0067, -0.0057, -0.0415, -0.1106, -0.0767, -0.0104, -0.0250,
        -0.5068, -0.0206, -0.0147, -0.0115,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.8581e-02, -1.0199e-02, -6.6122e-03, -7.5390e-03, -7.4870e-03,
        -1.8216e-02, -6.1901e-03,  2.5775e-03, -8.1574e-03,  5.1407e-04,
        -2.5163e-03, -1.7640e-02, -2.0848e-02, -8.6195e-01, -7.0131e-03,
        -3.9614e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2991, -0.0378, -0.0240, -0.0340, -0.0278, -0.0443, -0.0106, -0.0012,
        -0.0216, -0.0131, -0.0060, -0.0138, -0.1862, -0.1217, -0.0245, -0.0669,
        -0.0225, -0.0233, -0.0216,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1757, -0.0147, -0.0280, -0.0213, -0.0056, -0.0233, -0.0243, -0.0359,
        -0.0145, -0.0303, -0.2827, -0.0329, -0.1612, -0.0216, -0.0693, -0.0299,
        -0.0287,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.2611, -0.0142, -0.0203, -0.0137,  0.0011, -0.0138, -0.0137, -0.0189,
        -0.0125, -0.0058, -0.1084, -0.0296, -0.4186, -0.0323, -0.0210, -0.0149,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.2480, -0.0196, -0.0290, -0.0093, -0.0047, -0.0169, -0.0218, -0.0153,
        -0.0062, -0.0175, -0.2280, -0.0315, -0.2471, -0.0214, -0.0265, -0.0321,
        -0.0252,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-2.1218e-02, -4.2405e-02, -3.1946e-03, -3.7591e-03, -1.5103e-03,
        -4.2635e-03, -1.7064e-03, -4.3260e-03, -2.2258e-03,  4.6406e-04,
        -1.6048e-03, -8.8694e-01, -3.6856e-03, -7.9187e-03, -5.1749e-03,
        -3.4017e-03, -6.2066e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.0843e-02, -3.1593e-02, -2.7130e-03, -3.4825e-03, -5.4432e-04,
        -2.3824e-03, -2.2846e-03, -3.7687e-03, -1.8879e-03, -2.6315e-04,
        -1.4428e-03, -8.1708e-01, -5.9545e-03, -6.8821e-03, -4.3028e-03,
        -5.3895e-03, -3.5808e-02, -9.5287e-03, -6.6787e-03, -3.3894e-03,
        -3.7839e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.2518e-02, -2.5989e-02, -3.0094e-03, -2.5177e-03, -2.1817e-03,
        -8.7875e-04, -2.9434e-03, -2.8401e-03, -1.9290e-03, -4.7404e-04,
        -2.1025e-03, -3.7018e-01, -1.1733e-02, -3.2606e-03, -6.3907e-03,
        -5.6725e-03, -7.3897e-03, -5.0614e-01, -7.5782e-03, -1.2457e-03,
        -3.0263e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1528, -0.3889, -0.0169, -0.0101, -0.0100, -0.0212, -0.0159, -0.0031,
        -0.0053, -0.0121, -0.1041, -0.0249, -0.0283, -0.0325, -0.0074, -0.0113,
        -0.0208, -0.1014, -0.0100, -0.0081, -0.0149], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #3900: [tensor([-1.4393e-01, -1.0468e-02, -3.7642e-02, -6.0479e-03, -3.7632e-03,
        -2.8392e-03, -6.8088e-03, -6.8341e-02, -4.0798e-02, -4.3196e-03,
         1.0085e-04, -7.3294e-03, -1.6264e-02, -1.5359e-01, -1.2503e-02,
        -4.3908e-01, -9.0404e-03, -1.1666e-02, -9.4572e-03, -8.6566e-03,
        -7.3494e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0188, -0.5649, -0.0077, -0.0249, -0.0058, -0.0077, -0.0041, -0.0332,
        -0.0083, -0.0205, -0.0121, -0.0065, -0.0074, -0.0220, -0.0087, -0.0216,
        -0.0111, -0.0105, -0.1820, -0.0146, -0.0077,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0457, -0.6652, -0.0179, -0.0423, -0.0037, -0.0091, -0.0142, -0.0260,
        -0.0089, -0.0347, -0.0159, -0.0084, -0.0111, -0.0175, -0.0195, -0.0149,
        -0.0203, -0.0248,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1040, -0.6230, -0.0153, -0.0409, -0.0052, -0.0049, -0.0130, -0.0291,
        -0.0113, -0.0225, -0.0162, -0.0046, -0.0128, -0.0169, -0.0145, -0.0119,
        -0.0337, -0.0201,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0937, -0.3682,  0.0007, -0.0145, -0.0072, -0.0121, -0.0115, -0.0167,
        -0.0044, -0.0076, -0.0088, -0.0421, -0.0184, -0.0343, -0.1595, -0.0090,
        -0.0365, -0.1186, -0.0205, -0.0156,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-7.1836e-02, -1.6551e-01, -6.2361e-04, -4.5557e-03, -3.2882e-03,
        -3.8693e-03, -5.1627e-03, -4.8143e-03, -2.6822e-04, -3.6213e-03,
        -1.4226e-02, -1.8414e-02, -1.0820e-02, -5.8855e-01, -7.9893e-03,
        -1.9083e-02, -8.6477e-03, -9.6886e-03, -6.5187e-03, -4.5120e-03,
        -1.1360e-02, -6.9688e-03, -1.3469e-02, -7.7551e-03, -2.9338e-03,
        -5.5202e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1231, -0.1617,  0.0016, -0.0131, -0.0095, -0.0079, -0.0148, -0.0084,
        -0.0044, -0.0091, -0.0740, -0.0328, -0.0397, -0.3071, -0.1183, -0.0268,
        -0.0238, -0.0113, -0.0126,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1007, -0.3086,  0.0019, -0.0201, -0.0069, -0.0179, -0.0208, -0.0141,
        -0.0033, -0.0138, -0.1099, -0.0616, -0.1274, -0.1004, -0.0337, -0.0175,
        -0.0130, -0.0285,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.0187e-01, -1.0146e-01, -1.2854e-04, -6.5800e-03, -4.7580e-03,
        -6.7170e-03, -2.8300e-03, -8.6870e-03, -5.6180e-03, -5.1740e-03,
        -1.1095e-01, -3.5046e-02, -6.1229e-02, -1.0480e-02, -1.0241e-02,
        -8.3987e-03, -4.3610e-01, -1.6605e-02, -2.9855e-02, -1.2058e-02,
        -1.4136e-02, -5.8721e-03, -5.2092e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1122, -0.2080,  0.0012, -0.0042, -0.0038, -0.0050, -0.0078, -0.0075,
        -0.0024, -0.0032, -0.0098, -0.1271, -0.0093, -0.0088, -0.0077, -0.0193,
        -0.0077, -0.0115, -0.3783, -0.0040, -0.0515, -0.0042, -0.0058,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.1935e-02, -3.6765e-02,  1.1104e-04, -4.5116e-03, -1.4241e-03,
        -2.8950e-03, -4.1794e-03, -3.6684e-03, -7.8958e-04, -3.1551e-03,
        -1.1300e-02, -1.2293e-02, -9.4586e-03, -6.9850e-01, -5.0081e-03,
        -1.0240e-02, -5.5768e-03, -5.6790e-03, -1.0305e-01, -4.0856e-03,
        -3.5765e-03, -2.2647e-03, -1.3228e-02, -2.4447e-03, -3.8658e-03,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1064, -0.3080, -0.0005, -0.0128, -0.0064, -0.0101, -0.0167, -0.0139,
        -0.0043, -0.0040, -0.0155, -0.0343, -0.0097, -0.0162, -0.3544, -0.0061,
        -0.0328, -0.0270, -0.0104, -0.0105,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #3950: [tensor([-2.6010e-02, -3.9530e-02, -2.4823e-03, -1.5757e-02, -1.8393e-02,
        -1.3033e-03, -2.7533e-03, -6.3885e-04, -1.8395e-03, -1.5523e-01,
        -1.3891e-03,  3.5646e-05, -2.1409e-03, -1.3731e-02, -1.5618e-02,
        -4.6693e-01, -3.7982e-03, -6.6851e-03, -3.5931e-03, -2.1611e-01,
        -2.2638e-03, -1.6186e-03, -2.1457e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.0654e-02, -2.6671e-02, -2.3423e-03, -3.8231e-03, -6.8403e-03,
        -1.5051e-03, -2.1862e-03, -2.9661e-03, -1.0086e-02, -1.3209e-03,
        -1.5833e-03, -2.0110e-01, -1.0799e-03, -4.2058e-04, -9.7498e-04,
        -3.4644e-02, -5.5261e-03, -6.1297e-03, -1.5596e-02, -8.4851e-03,
        -2.6328e-03, -2.9320e-03, -7.7672e-03, -3.7903e-03, -1.3448e-03,
        -1.3725e-03, -5.6993e-01, -2.5178e-03, -1.6273e-03, -2.1502e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.8588e-02, -3.1062e-02, -4.2919e-03, -4.7910e-03, -9.7288e-03,
        -1.4872e-03, -2.8005e-03, -4.8371e-03, -1.2468e-02, -2.0345e-03,
        -1.5027e-03, -5.0149e-01, -1.0333e-03,  3.9310e-05, -1.0603e-03,
        -2.2060e-01, -5.7316e-03, -1.1652e-01, -3.5869e-03, -7.8257e-03,
        -4.4840e-02, -1.2355e-03, -2.4010e-04, -2.2098e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-2.8427e-02, -3.5304e-02, -3.8675e-03, -3.0217e-03, -7.4153e-03,
        -7.2396e-04, -1.2062e-03, -2.9807e-03, -9.7139e-03, -2.9317e-03,
        -1.2976e-03, -6.3206e-01, -1.7314e-03, -1.3667e-04, -1.0344e-03,
        -1.2719e-01, -5.6316e-03, -6.9741e-02, -8.3587e-03, -4.0833e-03,
        -6.1470e-03, -4.1502e-02, -1.6476e-03, -8.7061e-04, -2.9752e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.1446e-02, -3.3892e-02, -2.4406e-04, -3.7686e-03, -6.1148e-05,
        -7.4412e-04, -2.2094e-02, -8.2861e-05, -1.9689e-03,  4.8721e-05,
        -2.3727e-03, -8.1614e-01, -6.3896e-03, -3.0576e-02, -1.1163e-02,
        -1.0167e-02, -8.0264e-03, -4.7802e-03, -6.0383e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.3941e-02, -3.2841e-02, -1.1140e-03, -3.2047e-03, -6.3227e-04,
        -2.3018e-03, -1.9682e-02,  6.9804e-04, -1.7180e-03, -5.0817e-05,
        -1.7820e-03, -8.4321e-01, -7.8395e-03, -2.9929e-02, -8.3519e-03,
        -2.8681e-03, -4.8076e-03, -5.0331e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.9003e-02, -3.4426e-02,  1.9309e-04, -3.0080e-03, -1.1510e-03,
        -1.0978e-03, -1.8433e-02, -8.0023e-04, -1.4736e-03, -1.2423e-04,
        -1.6833e-03, -6.6661e-01, -8.0676e-03, -3.2854e-03, -4.1070e-03,
        -7.4095e-03, -4.1283e-03, -6.4551e-03, -8.7977e-03, -2.7550e-03,
        -2.0980e-03, -6.9854e-03, -1.7191e-01, -2.9133e-03, -7.8384e-04,
        -2.3026e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.9175e-02, -2.2540e-02, -2.6327e-03, -1.1480e-02, -1.5395e-03,
        -8.5733e-05, -1.1563e-02, -2.3459e-03, -1.1362e-03, -1.1027e-01,
        -3.0162e-04, -8.6920e-04, -2.5003e-03, -2.9606e-02, -7.5964e-04,
        -3.4829e-03, -4.0958e-03, -5.3194e-03,  1.7177e-04,  1.5244e-04,
        -1.0781e-01, -3.6148e-03, -2.3091e-01, -9.5400e-02, -2.4142e-03,
        -5.4618e-03, -2.4836e-01, -1.8431e-03, -1.0737e-03, -3.2954e-02,
        -4.1651e-03, -2.5331e-03, -3.4250e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-2.2657e-02, -1.5258e-02, -1.4895e-03, -1.3853e-02, -1.5280e-03,
        -7.2656e-04, -7.6902e-03, -1.5879e-03, -8.8861e-04, -3.8233e-02,
        -2.0786e-04, -1.1980e-03, -2.1144e-03, -6.7997e-02, -1.1900e-03,
        -2.5466e-03, -3.3656e-03, -2.9790e-03, -1.5779e-04, -4.0791e-04,
        -1.0087e-01, -3.2819e-03, -3.2140e-03, -2.0934e-03, -3.1280e-01,
        -1.6655e-03, -1.6219e-03, -3.5999e-03, -3.7385e-01, -3.1100e-03,
        -4.1326e-03, -8.4683e-04, -2.8361e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.0659e-02, -5.9314e-02, -1.8591e-03, -1.1480e-02, -2.2388e-03,
        -8.1125e-04, -1.0122e-02, -3.4261e-03, -1.6033e-03, -7.0534e-02,
         2.9253e-04, -2.4145e-03, -3.1845e-03, -4.9246e-02, -2.1159e-03,
        -2.4426e-03, -3.0542e-03, -5.1059e-03,  9.4077e-04, -2.1437e-04,
        -9.1601e-02, -4.7047e-03, -5.7986e-03, -3.9502e-03, -5.8414e-01,
        -3.5227e-03, -1.6643e-03, -3.5641e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0623, -0.0821, -0.0013, -0.0034, -0.0148, -0.0013, -0.0030, -0.0012,
        -0.0016, -0.3115,  0.0006,  0.0005, -0.0010, -0.0023, -0.0991, -0.0120,
        -0.0050, -0.0016, -0.0050, -0.3786, -0.0018, -0.0033, -0.0026, -0.0041,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0979, -0.1083, -0.0036, -0.0065, -0.0239, -0.0066, -0.0032, -0.0008,
        -0.0034, -0.4577, -0.0018, -0.0035, -0.0019, -0.0035, -0.2041, -0.0184,
        -0.0081, -0.0053, -0.0086, -0.0060, -0.0122, -0.0051, -0.0097,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4000: [tensor([-2.2918e-02, -1.5189e-01, -2.8279e-03, -1.1572e-02, -4.0688e-03,
        -7.0609e-03, -4.1026e-02, -3.8024e-03, -4.2425e-03, -3.4882e-04,
        -5.4501e-03, -9.2835e-03, -1.1785e-02,  4.7477e-04, -3.2359e-03,
        -4.3953e-03, -2.8174e-03, -4.8942e-03, -1.0069e-01, -1.7870e-03,
        -8.7432e-03, -3.5519e-02, -1.0593e-01, -5.1441e-03, -1.3547e-04,
        -4.0582e-04, -4.1309e-02, -9.0752e-03, -4.7184e-02, -2.2875e-01,
        -1.1838e-02, -6.8366e-02, -1.6352e-02, -1.3018e-02, -5.3282e-03,
        -8.3352e-03,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.1908e-02, -3.2446e-02,  4.3643e-04, -3.7468e-03, -3.5817e-03,
        -1.2907e-03, -1.7203e-02, -1.1803e-03, -2.8904e-03, -3.1975e-04,
        -3.0086e-03, -3.1604e-03, -5.7652e-03,  3.6211e-05, -1.4337e-03,
        -2.3847e-03, -1.6777e-03, -2.1877e-03, -2.0193e-02, -3.0973e-04,
        -2.4266e-03, -1.1740e-02, -3.7042e-02, -1.5380e-03,  7.3405e-04,
        -5.4165e-04, -6.6831e-01, -4.4118e-03, -2.0417e-03, -3.0718e-02,
        -5.1960e-02, -3.5920e-03, -5.1283e-03, -1.9081e-03, -2.7454e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.3852e-02, -1.5303e-02, -1.0766e-03, -3.2114e-03, -2.8036e-03,
        -2.0498e-03, -1.0710e-02, -1.8196e-03, -2.4870e-03, -2.7039e-04,
        -2.3626e-03, -3.0306e-03, -3.8821e-03,  1.0829e-04, -1.0883e-03,
        -3.2494e-03, -2.1137e-03, -1.4295e-03, -1.3124e-02, -2.6795e-04,
        -2.7683e-03, -8.8029e-03, -1.5391e-02, -1.1824e-03,  5.6759e-04,
        -4.7394e-04, -3.3080e-01, -3.3247e-03, -5.0203e-03, -3.6377e-03,
        -3.2536e-03, -7.9050e-03, -1.9506e-02, -3.6707e-03, -7.0079e-03,
        -4.3587e-01, -3.7397e-03, -2.8376e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.4443e-02, -1.9929e-02, -8.7127e-04, -4.1114e-03, -3.5085e-03,
        -2.0947e-03, -1.3784e-02, -1.8158e-03, -2.6969e-03, -3.0607e-04,
        -3.6393e-03, -3.0140e-03, -6.1792e-03, -4.6160e-04, -1.5304e-03,
        -3.8130e-03, -2.2139e-03, -2.5760e-03, -1.8103e-02, -5.8198e-04,
        -2.7075e-03, -1.0453e-02, -1.5354e-02, -1.2483e-03,  3.8043e-04,
        -6.5762e-04, -5.6788e-01, -2.6332e-03, -3.7805e-03, -1.0979e-02,
        -4.0186e-03, -2.1673e-01, -4.9208e-03, -2.5899e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-8.8571e-02, -2.6134e-02, -1.0205e-03, -4.3357e-03, -2.8476e-03,
        -1.4133e-03, -1.3933e-02, -1.6949e-03, -3.0197e-03,  3.8725e-04,
        -2.6308e-03, -3.5869e-03, -4.9266e-03, -3.8907e-04, -1.4536e-03,
        -2.6301e-03, -1.6606e-03, -2.1154e-03, -2.2742e-02, -3.4182e-04,
        -1.7847e-03, -1.0108e-02, -1.9385e-02, -1.4985e-03,  2.3401e-03,
        -1.3292e-03, -6.9275e-01, -2.2133e-03, -6.4636e-03, -8.2483e-03,
        -3.5073e-03, -4.8334e-02, -5.8305e-03, -5.5410e-03, -1.6656e-03,
        -3.1685e-03,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.6423e-02, -2.9518e-02, -1.3406e-03, -4.6482e-03, -2.5203e-03,
        -3.1396e-03, -2.6600e-02, -1.9557e-03, -3.4026e-03, -2.4429e-04,
        -4.1651e-03, -3.4151e-03, -6.0619e-03, -1.7691e-04, -2.4274e-03,
        -2.7120e-03, -2.6134e-03, -2.0062e-03, -2.4924e-02, -8.8253e-04,
        -2.4516e-03, -1.4470e-02, -2.7784e-02, -1.9506e-03,  3.3885e-04,
        -1.3765e-03, -5.4602e-01, -6.1722e-03, -4.5653e-03, -2.7033e-02,
        -1.6607e-01, -3.5783e-03, -6.2788e-03, -2.7278e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.5545e-02, -3.1488e-02, -1.1149e-03, -5.4582e-03, -2.9102e-03,
        -1.2176e-03, -1.5902e-02, -2.1428e-03, -3.3656e-03,  2.7018e-04,
        -3.7865e-03, -2.9934e-03, -5.7130e-03, -2.8206e-04, -1.4235e-03,
        -2.8057e-03, -1.9499e-03, -2.2333e-03, -2.1191e-02, -2.3947e-04,
        -1.4626e-03, -1.1317e-02, -5.7348e-02, -1.8418e-03,  6.2439e-04,
         3.5820e-05, -6.7514e-01, -4.6649e-03, -4.6639e-03, -5.0343e-02,
        -6.5080e-03, -4.0212e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.4777e-02, -4.1617e-02, -1.1716e-03, -3.7914e-03, -2.6671e-03,
        -1.5171e-03, -1.7741e-02, -1.4342e-03, -1.8861e-03,  2.2527e-04,
        -1.8289e-03, -4.3176e-03, -6.8536e-03,  1.5272e-04, -1.1373e-03,
        -4.0463e-03, -1.6493e-03, -1.5557e-03, -1.5409e-02, -1.0122e-03,
        -2.0974e-03, -1.0884e-02, -4.7192e-02, -1.9203e-03,  1.5147e-03,
        -1.3343e-03, -5.5028e-01, -2.4173e-03, -5.3735e-03, -6.0043e-03,
        -5.1280e-03, -1.7338e-01, -3.4806e-03, -1.9248e-03, -2.2757e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0898, -0.2990, -0.0146, -0.0249, -0.0319, -0.0066, -0.0093, -0.0106,
        -0.0078, -0.0055, -0.0032, -0.0024, -0.0050, -0.2810, -0.0263, -0.1557,
        -0.0129, -0.0134,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1038, -0.1758, -0.0166, -0.0370, -0.0660, -0.0128, -0.0119, -0.0121,
        -0.0107, -0.0059, -0.0070, -0.0085, -0.0073, -0.3148, -0.0247, -0.1362,
        -0.0237, -0.0125, -0.0127,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1783, -0.2628, -0.0143, -0.0273, -0.0330, -0.0069, -0.0081, -0.0112,
        -0.0073, -0.0045, -0.0067, -0.0108, -0.0038, -0.1863, -0.0285, -0.1853,
        -0.0084, -0.0164,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0896, -0.2546, -0.0140, -0.0106, -0.0087, -0.1896, -0.0119, -0.0113,
        -0.0079, -0.0082, -0.0033, -0.0312, -0.0103, -0.0058, -0.0928, -0.0182,
        -0.0418, -0.0172, -0.0134, -0.0261, -0.0186, -0.0115, -0.0200, -0.0339,
        -0.0310, -0.0094, -0.0090,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #4050: [tensor([-5.7257e-02, -6.2004e-02, -2.6855e-03, -3.6053e-03, -4.2988e-03,
        -2.2157e-03, -3.0745e-03, -3.0352e-03, -2.3387e-02, -2.6669e-03,
        -3.8036e-03, -5.8050e-03, -1.5723e-03, -4.0379e-03, -3.7796e-03,
        -2.1194e-03, -1.8633e-02, -8.2171e-03, -2.5818e-03, -1.8542e-03,
        -3.1065e-03, -7.7987e-04,  2.2053e-04, -1.2699e-03, -9.2935e-02,
        -3.6841e-03, -5.4766e-01, -8.8090e-03, -5.9740e-03, -9.0739e-02,
        -5.6569e-03, -4.7326e-03, -6.1827e-03, -4.3731e-03, -2.0987e-03,
        -5.1424e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0031, -0.0803, -0.0017, -0.0077, -0.0062, -0.0030, -0.0024, -0.0022,
        -0.0522, -0.0031, -0.0024, -0.0061, -0.0011, -0.0056, -0.0042, -0.0049,
        -0.0640, -0.0057, -0.0025, -0.0039, -0.0035, -0.0029, -0.0012, -0.0016,
        -0.2282, -0.0052, -0.4012, -0.0087, -0.0082, -0.0049, -0.0556, -0.0048,
        -0.0052, -0.0018, -0.0045,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.9570e-02, -3.0580e-02, -2.4104e-03, -3.6895e-03, -2.8640e-03,
        -2.5779e-03, -3.3399e-03, -2.0992e-03, -2.0732e-02, -2.1088e-03,
        -2.4418e-03, -4.4429e-03,  1.5292e-04, -3.0332e-03, -2.7089e-03,
        -2.1593e-03, -2.7501e-02, -5.5252e-03, -2.6432e-03, -3.0996e-04,
        -1.4957e-03, -8.7642e-04,  4.1734e-04, -2.2203e-04, -6.3409e-01,
        -3.3999e-03, -1.6397e-01, -1.0411e-02, -1.8187e-03, -2.4097e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.8378e-02, -4.5396e-02, -7.2108e-03, -3.6875e-03, -5.8136e-03,
        -3.5787e-02, -6.1383e-03, -2.5089e-03, -3.3110e-03, -2.4882e-02,
        -5.5416e-03, -7.8482e-03,  3.6342e-04, -3.7312e-03, -4.5893e-02,
        -6.3794e-03, -1.0201e-02, -6.9839e-01, -5.3385e-03, -5.5991e-03,
        -3.4098e-02, -7.5035e-03, -2.0222e-03, -3.9785e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-9.5142e-02, -3.9865e-01, -1.6353e-02, -4.6396e-03, -8.2450e-03,
        -1.0043e-01, -7.5906e-03, -1.2681e-03, -5.7448e-03, -6.2286e-02,
        -8.0619e-03, -3.1497e-02, -2.5518e-04, -4.3465e-03, -1.0973e-01,
        -7.6304e-03, -4.4070e-02, -9.3615e-03, -8.4279e-03, -2.8912e-02,
        -1.9897e-02, -1.7303e-02, -4.5942e-03, -5.5636e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0313, -0.1880, -0.0095, -0.0062, -0.0140, -0.1101, -0.0089, -0.0041,
        -0.0058, -0.0588, -0.0058, -0.0198, -0.0003, -0.0068, -0.1877, -0.0121,
        -0.0498, -0.0030, -0.0104, -0.2424, -0.0129, -0.0029, -0.0095,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-2.7804e-02, -4.5871e-03, -8.6492e-03, -4.8877e-03, -5.7209e-03,
        -7.1833e-02, -3.2324e-03, -1.2412e-03, -4.6342e-03, -4.6095e-03,
        -1.2743e-02, -7.4834e-01, -3.4155e-03, -2.3943e-03, -8.0796e-03,
        -1.3870e-02,  1.6949e-04, -8.2425e-03, -1.8043e-03,  1.3807e-03,
        -7.5050e-04, -1.1757e-03, -1.0746e-02, -4.1927e-02, -3.7312e-03,
        -4.0301e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.1948e-02, -3.3594e-03, -5.0077e-03, -4.6134e-03, -2.0615e-03,
        -2.0458e-02, -3.1431e-03, -1.5282e-03, -2.6298e-03, -2.0497e-03,
        -7.5883e-03, -2.4308e-01, -3.0191e-03, -2.6229e-03, -5.6239e-03,
        -6.4795e-03, -1.2635e-03, -3.5609e-03, -9.6825e-04,  7.2751e-04,
        -5.3883e-04, -5.2632e-03, -1.4097e-02, -1.1079e-02, -3.5100e-03,
        -3.6814e-03, -5.7859e-01, -4.3909e-03, -4.1938e-03, -2.9212e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.7038e-01, -5.3426e-03, -1.4080e-02, -4.6071e-03, -8.5467e-03,
        -8.6328e-02, -4.5828e-03, -2.7346e-03, -4.7556e-03, -4.5322e-03,
        -1.7206e-02, -5.1540e-01, -2.9236e-03, -3.0183e-03, -1.3126e-02,
        -1.3087e-02, -2.3015e-03, -8.3267e-03, -2.3423e-03, -5.5066e-04,
        -1.8704e-03, -7.9912e-03, -7.1150e-02, -2.9530e-02, -1.8307e-06,
        -5.2803e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.0206e-02, -3.3961e-02, -1.9966e-03, -2.0891e-02, -2.5397e-03,
        -2.9300e-02, -2.1363e-03, -2.7460e-03, -9.1893e-03, -2.5038e-03,
        -5.2275e-03, -1.9072e-01, -2.3856e-03, -2.2641e-03, -1.8697e-03,
        -7.7059e-02, -1.8560e-03, -1.2562e-03, -3.1511e-04, -5.1018e-01,
        -4.0864e-03, -3.2665e-02, -6.5026e-03, -4.0918e-03, -4.7745e-03,
        -5.0789e-03, -1.7251e-03, -4.0640e-03, -3.5654e-03, -1.4987e-03,
        -3.3347e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0698, -0.0426, -0.0032, -0.0333, -0.0038, -0.0325, -0.0023, -0.0035,
        -0.0121, -0.0022, -0.0070, -0.1721, -0.0019, -0.0024, -0.0015, -0.0761,
        -0.0022, -0.0013, -0.0013, -0.4676, -0.0057, -0.0385, -0.0118, -0.0034,
        -0.0021,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0612, -0.0383, -0.0017, -0.0179, -0.0030, -0.0273, -0.0027, -0.0029,
        -0.0106, -0.0032, -0.0056, -0.2955, -0.0022, -0.0016, -0.0015, -0.0360,
        -0.0015, -0.0007, -0.0009, -0.1410, -0.0033, -0.0462, -0.0096, -0.0030,
        -0.0045, -0.2569, -0.0035, -0.0033, -0.0041, -0.0064, -0.0017, -0.0022,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #4100: [tensor([-0.2706, -0.3059, -0.0216, -0.0166, -0.1289, -0.0157, -0.0090, -0.0052,
        -0.0088, -0.0409, -0.0121, -0.0926, -0.0218, -0.0219, -0.0110, -0.0173,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2454, -0.3251, -0.0180, -0.0371, -0.1379, -0.0171, -0.0104, -0.0044,
        -0.0059, -0.0289, -0.0125, -0.0655, -0.0163, -0.0112, -0.0223, -0.0122,
        -0.0054, -0.0126, -0.0119,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1219, -0.1688, -0.0028, -0.1768, -0.0085, -0.1506, -0.0138, -0.0086,
        -0.0020, -0.0054, -0.0974, -0.0404, -0.0145, -0.1704, -0.0070, -0.0113,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.6204e-02, -1.6470e-01, -8.7155e-04, -3.9516e-02, -6.2670e-03,
        -6.2170e-02, -9.8459e-03, -4.5623e-03, -7.1281e-05, -2.9752e-03,
        -5.1375e-03, -5.7353e-01, -1.5615e-02, -7.0901e-02, -6.9088e-03,
        -6.2851e-03, -2.5844e-03, -6.5813e-03, -5.2706e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1628, -0.2960, -0.0071, -0.1149, -0.0104, -0.1519, -0.0160, -0.0111,
        -0.0018, -0.0075, -0.0888, -0.0793, -0.0155, -0.0139, -0.0050, -0.0180,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-7.6705e-02, -6.7501e-02, -1.2795e-03, -3.5540e-03, -1.1406e-03,
        -6.1399e-03, -2.6834e-02, -3.1145e-03, -3.1004e-03, -3.3804e-03,
        -1.8960e-03, -1.9301e-03, -2.9851e-03, -1.0607e-03, -1.1909e-03,
        -2.4671e-03, -3.0594e-03, -7.7534e-04, -5.5245e-04, -7.8824e-04,
        -7.2353e-01, -4.8494e-03, -2.8981e-03, -5.5285e-03, -1.1228e-03,
        -2.6720e-03, -6.5288e-03, -7.4536e-03, -8.0011e-03, -5.6631e-03,
        -5.1919e-03, -2.6482e-03, -6.3268e-03, -3.6895e-03, -4.4427e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.1881e-02, -1.6712e-01, -3.7481e-03, -5.6866e-03, -3.8638e-03,
        -1.3601e-02, -5.2752e-02, -6.7579e-03, -6.5266e-03, -9.6362e-03,
        -2.9390e-03, -4.0967e-03, -6.1417e-03, -2.9496e-03, -3.5065e-03,
        -5.0208e-03, -9.5053e-03, -1.4834e-04, -3.1785e-03, -3.0614e-03,
        -6.1834e-01, -6.4236e-03, -4.7741e-03, -9.3637e-03, -2.6287e-03,
        -6.3434e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.9401e-03, -3.5074e-02, -1.3229e-03, -4.1037e-03, -7.4425e-04,
        -6.2820e-03, -2.1307e-02, -3.3019e-03, -2.8446e-03, -4.2159e-03,
        -1.3512e-03, -2.0141e-03, -2.9950e-03, -1.4170e-03, -1.7878e-03,
        -3.7420e-03, -3.8857e-03, -1.2023e-03, -5.3581e-04, -8.7230e-04,
        -6.3922e-01, -9.3437e-03, -5.7178e-03, -6.1709e-03, -6.1714e-03,
        -2.1329e-01, -1.1792e-02, -3.3547e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2080, -0.0919, -0.0038, -0.0038, -0.0018, -0.0021, -0.0361, -0.0081,
        -0.0061, -0.0024, -0.0011, -0.0046, -0.0064, -0.0041,  0.0004, -0.0023,
        -0.1370, -0.0086, -0.0072, -0.0037, -0.0151, -0.3596, -0.0241, -0.0060,
        -0.0076, -0.0064, -0.0131, -0.0100, -0.0080, -0.0043, -0.0063,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0890, -0.1023, -0.0048, -0.0019, -0.0020, -0.0030, -0.0399, -0.0071,
        -0.0040, -0.0025, -0.0008, -0.0051, -0.0064, -0.0029,  0.0006, -0.0024,
        -0.1164, -0.0074, -0.0080, -0.0071, -0.5063, -0.0106, -0.0110, -0.0052,
        -0.0012, -0.0092, -0.0310, -0.0047, -0.0032, -0.0041,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.8103e-02, -8.5987e-02, -4.8801e-03, -2.8414e-03, -1.5135e-03,
        -3.4255e-03, -2.7094e-02, -5.7436e-03, -5.2567e-03, -2.6854e-03,
        -1.2329e-03, -4.7550e-03, -4.1589e-03, -2.1205e-03, -2.9773e-04,
        -1.7328e-03, -1.0350e-01, -5.9608e-03, -5.2041e-03, -4.0431e-03,
        -6.5871e-03, -6.3264e-01, -1.5352e-02, -6.8051e-03, -4.4657e-03,
        -3.0632e-03, -1.0345e-02, -8.5099e-03, -5.3308e-03, -1.1671e-03,
        -5.1914e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0615, -0.1241, -0.0074, -0.0236, -0.0009, -0.0014, -0.0206, -0.0010,
        -0.0043, -0.0033, -0.0163, -0.0049, -0.0032, -0.0050, -0.0029, -0.0163,
        -0.0227, -0.0034, -0.0031, -0.0010, -0.0020, -0.0046, -0.0003, -0.0022,
        -0.2713, -0.0065, -0.0168, -0.0080, -0.0082, -0.0138, -0.0940, -0.0083,
        -0.0055, -0.0250, -0.0114, -0.1685, -0.0096, -0.0089, -0.0041, -0.0041],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4150: [tensor([-9.2444e-02, -1.7268e-01, -5.2549e-03, -5.6312e-03, -5.4025e-03,
        -1.1618e-02, -9.7363e-03, -5.7354e-03, -2.6811e-02, -8.7924e-03,
        -2.0985e-02, -1.4812e-02, -1.7134e-01, -3.6130e-03, -4.7401e-03,
        -4.3203e-02, -4.6544e-03, -1.3881e-03, -5.4768e-03, -3.4068e-03,
         1.5093e-04, -2.6212e-03, -7.3861e-03, -1.9297e-02, -2.6607e-01,
        -1.0525e-02, -1.2249e-02, -1.3197e-02, -3.6809e-02, -8.7134e-03,
        -5.2570e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.1645e-01, -2.7747e-02, -3.0322e-03, -2.9851e-03, -2.3852e-03,
        -4.5637e-03, -3.6586e-03, -2.3550e-03, -1.3254e-02, -1.6455e-03,
        -1.2715e-02, -4.1365e-03, -2.4776e-02, -1.8130e-03, -2.3685e-03,
        -1.1684e-02, -2.9877e-03, -1.4084e-03, -2.9232e-03, -7.1659e-04,
         1.0643e-03, -3.4878e-04, -6.2553e-01, -5.6635e-03, -1.6337e-02,
        -9.1563e-02, -4.3859e-03, -6.2129e-03, -2.1142e-03, -3.1700e-03,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.1647e-01, -2.5581e-02, -1.1690e-03, -4.1405e-03, -4.1241e-03,
        -4.1764e-03, -4.4042e-03, -2.1967e-03, -1.2883e-02, -3.6364e-03,
        -1.0836e-02, -3.2330e-03, -4.2347e-02, -2.1220e-03, -3.7498e-03,
        -1.2276e-02, -2.2602e-03, -6.0786e-04, -3.1402e-03, -1.6419e-03,
         8.8116e-04, -1.6399e-03, -6.8232e-01, -4.5053e-03, -2.4326e-02,
        -5.5871e-03, -6.2965e-03, -6.8735e-03, -2.9725e-03, -3.6086e-03,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1048, -0.1263, -0.0050, -0.0112, -0.0066, -0.0162, -0.0113, -0.0087,
        -0.0362, -0.0082, -0.0307, -0.0220, -0.2432, -0.0054, -0.0053, -0.0408,
        -0.0040, -0.0031, -0.0105, -0.0052, -0.0032, -0.0043, -0.1386, -0.0903,
        -0.0086, -0.0235, -0.0107, -0.0077, -0.0084,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1565, -0.3574, -0.0014, -0.0170, -0.0080, -0.0088, -0.0119, -0.1781,
        -0.0077, -0.0015, -0.0042, -0.0414, -0.0272, -0.0298, -0.1094, -0.0169,
        -0.0107, -0.0121,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1525, -0.2552, -0.0097, -0.0119, -0.0082, -0.0110, -0.0207, -0.3731,
        -0.0094, -0.0068, -0.0053, -0.0723, -0.0265, -0.0109, -0.0114, -0.0151,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0718, -0.1047, -0.0024, -0.0086, -0.0033, -0.0046, -0.0084, -0.0566,
        -0.0035, -0.0040, -0.0022, -0.0211, -0.0198, -0.0159, -0.0085, -0.6356,
        -0.0121, -0.0083, -0.0086,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0370, -0.1561, -0.0064, -0.0081, -0.0663, -0.0051, -0.0084, -0.0421,
        -0.0088, -0.0032, -0.0033, -0.0086, -0.0058, -0.0051, -0.0118, -0.0226,
        -0.0124, -0.4754, -0.0942, -0.0092, -0.0055, -0.0045,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1312, -0.3011, -0.0028, -0.0140, -0.1516, -0.0074, -0.0130, -0.0625,
        -0.0167, -0.0107, -0.0086, -0.0079, -0.0073, -0.0134, -0.0171, -0.0415,
        -0.0232, -0.0945, -0.0193, -0.0321, -0.0085, -0.0154,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0460, -0.2451, -0.0099, -0.0110, -0.1324, -0.0040, -0.0107, -0.0754,
        -0.0138, -0.0046, -0.0038, -0.0099, -0.0061, -0.0059, -0.0156, -0.0269,
        -0.0118, -0.1036, -0.2156, -0.0308, -0.0091, -0.0079,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0575, -0.0135, -0.0123, -0.0217, -0.0183, -0.0093, -0.0088, -0.1919,
        -0.0192, -0.0122, -0.0011, -0.0081, -0.0276, -0.1583, -0.0186, -0.2360,
        -0.1178, -0.0370, -0.0114, -0.0195,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0070, -0.0112, -0.0152, -0.0183, -0.0229, -0.0087, -0.0119, -0.2103,
        -0.0169, -0.0075, -0.0019, -0.0071, -0.2028, -0.0308, -0.0111, -0.3298,
        -0.0110, -0.0222, -0.0210, -0.0095, -0.0138, -0.0090,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4200: [tensor([-0.2069, -0.1085, -0.0033, -0.0152, -0.0117, -0.0709, -0.0035, -0.0177,
        -0.0062, -0.0024, -0.0031, -0.0161, -0.0026, -0.0041, -0.0841, -0.0087,
        -0.0123, -0.3950, -0.0103, -0.0085, -0.0090,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1230, -0.2650, -0.0054, -0.0145, -0.0096, -0.0440, -0.0037, -0.0147,
        -0.0071, -0.0010, -0.0055, -0.0131, -0.0041, -0.0047, -0.1012, -0.0121,
        -0.0150, -0.0276, -0.0127, -0.0321, -0.2645, -0.0082, -0.0113,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1037, -0.1962, -0.0052, -0.0153, -0.0157, -0.0379, -0.0045, -0.0165,
        -0.0097, -0.0053, -0.0049, -0.0166, -0.0054, -0.0078, -0.0649, -0.0150,
        -0.0240, -0.4191, -0.0087, -0.0155, -0.0082,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0393, -0.0583, -0.0034, -0.0043, -0.0198, -0.0040, -0.0035, -0.0146,
        -0.0041, -0.1206, -0.0021, -0.0009, -0.0023, -0.0898, -0.0062, -0.0397,
        -0.0048, -0.5569, -0.0071, -0.0041, -0.0028, -0.0040, -0.0035, -0.0041,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0274, -0.0372, -0.0049, -0.0028, -0.0327, -0.0037, -0.0028, -0.0144,
        -0.0040, -0.1294, -0.0023, -0.0016, -0.0024, -0.5847, -0.0075, -0.0081,
        -0.0215, -0.0098, -0.0906, -0.0056, -0.0021, -0.0046,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0251, -0.0304, -0.0027, -0.0035, -0.0200, -0.0045, -0.0027, -0.0166,
        -0.0036, -0.2150, -0.0023, -0.0008, -0.0018, -0.5283, -0.0062, -0.0116,
        -0.0066, -0.0936, -0.0055, -0.0044, -0.0066, -0.0050, -0.0010, -0.0021,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2201, -0.0090, -0.0166, -0.0139, -0.0168, -0.0044, -0.0129, -0.0141,
        -0.0109, -0.1347, -0.0075, -0.0150, -0.3061, -0.0175, -0.0050, -0.0070,
        -0.0162, -0.0231, -0.0903, -0.0278, -0.0114, -0.0049, -0.0150,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1299, -0.0083, -0.0147, -0.0117, -0.0123, -0.0040, -0.0053, -0.0063,
        -0.0060, -0.0602, -0.0055, -0.0131, -0.2559, -0.0129, -0.0016, -0.0051,
        -0.0138, -0.0237, -0.0467, -0.0137, -0.3257, -0.0064, -0.0097, -0.0075,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.4989e-01, -7.6037e-03, -1.4097e-02, -1.1881e-02, -1.3216e-02,
        -3.4669e-03, -7.2129e-03, -1.5764e-02, -7.7834e-03, -7.6225e-02,
        -3.6586e-03, -1.5846e-02, -4.4906e-01, -9.5429e-03, -4.0898e-04,
        -1.3331e-03, -1.2443e-02, -1.5032e-02, -6.3750e-02, -7.7685e-03,
        -6.9519e-03, -7.0653e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.0325e-02, -4.6338e-03, -2.6368e-03, -2.2411e-03, -1.7576e-02,
        -6.3585e-04, -7.4697e-03, -1.3124e-03, -1.2349e-02, -3.4790e-03,
        -6.4334e-03, -2.0211e-02, -2.7018e-03, -1.0968e-03, -5.4579e-04,
        -3.1879e-03, -4.4028e-03, -9.4502e-03, -5.4121e-03, -1.1383e-01,
        -1.2685e-03, -6.5156e-03, -7.1468e-01, -2.6020e-03, -1.6281e-03,
        -3.3784e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.4099e-02, -4.2235e-03, -2.7453e-03, -2.6217e-03, -2.0110e-02,
        -1.6503e-03, -8.7494e-03, -2.4620e-03, -1.3637e-02, -2.5046e-03,
        -7.3710e-03, -3.3856e-02, -2.4811e-03, -9.2959e-04,  2.9299e-04,
        -1.1821e-01, -4.3522e-03, -4.3892e-03, -5.2766e-03, -5.5495e-03,
        -6.4120e-03, -4.4249e-03, -6.8998e-01, -8.6925e-03, -2.1790e-03,
        -2.8044e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0621, -0.0074, -0.0065, -0.0034, -0.0698, -0.0027, -0.0119, -0.0064,
        -0.0294, -0.0113, -0.0085, -0.0880, -0.0057, -0.0028, -0.0025, -0.0077,
        -0.0078, -0.0166, -0.2921, -0.0044, -0.0096, -0.2980, -0.0296, -0.0050,
        -0.0110,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4250: [tensor([-4.5892e-02, -2.0253e-01, -5.1639e-03, -1.7805e-02, -7.3962e-03,
        -1.3440e-02, -2.5423e-03, -4.7995e-03, -5.2882e-02, -1.9798e-02,
        -1.6769e-03,  3.5723e-05, -3.7925e-03, -1.6539e-02, -1.2301e-02,
        -5.4492e-01, -2.4760e-02, -1.0430e-02, -5.9702e-03, -7.3228e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.9522e-02, -5.1771e-02, -5.9721e-03, -1.1720e-02, -2.1367e-03,
        -1.1170e-02, -1.8428e-03, -1.0559e-03, -2.3101e-02, -8.2192e-03,
        -1.7825e-03, -6.9524e-04, -3.1670e-03, -8.9094e-03, -1.1407e-02,
        -7.1999e-03, -7.5974e-03, -8.0869e-01, -7.1712e-03, -2.8311e-03,
        -4.0416e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0630, -0.2839, -0.0148, -0.0122, -0.0572, -0.0055, -0.0132, -0.0102,
        -0.1106, -0.0008, -0.0160, -0.0027, -0.0042, -0.0036, -0.2498, -0.0176,
        -0.1048, -0.0128, -0.0105, -0.0067,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0306, -0.1744, -0.0129, -0.0155, -0.0447, -0.0106, -0.0149, -0.0079,
        -0.0978, -0.0011, -0.0177, -0.0059, -0.0034, -0.0048, -0.3625, -0.0248,
        -0.0777, -0.0087, -0.0165, -0.0457, -0.0125, -0.0094,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0604, -0.2106, -0.0084, -0.0180, -0.0344, -0.0145, -0.0158, -0.0083,
        -0.1118, -0.0021, -0.0140, -0.0041, -0.0004, -0.0081, -0.2779, -0.0154,
        -0.1045, -0.0578, -0.0140, -0.0082, -0.0048, -0.0065,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1020, -0.0730, -0.0041, -0.0122, -0.0026, -0.0169, -0.0022, -0.0053,
        -0.0026, -0.0180, -0.0161, -0.0383, -0.0066, -0.0071, -0.0252, -0.0006,
        -0.0033, -0.0024, -0.0011, -0.2842, -0.0069, -0.0703, -0.0064, -0.0103,
        -0.2605, -0.0039, -0.0094, -0.0033, -0.0055,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1021, -0.1278, -0.0059, -0.0133, -0.0042, -0.0366, -0.0031, -0.0076,
        -0.0034, -0.0143, -0.0237, -0.0663, -0.0067, -0.0119, -0.0622, -0.0039,
        -0.0067, -0.0013, -0.0034, -0.0248, -0.0087, -0.0343, -0.0534, -0.0060,
        -0.0105, -0.0097, -0.0109, -0.1583, -0.1209, -0.0285, -0.0118, -0.0074,
        -0.0059, -0.0048], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1279, -0.2328, -0.0068, -0.0171, -0.0078, -0.0302, -0.0050, -0.0088,
        -0.0038, -0.0434, -0.0269, -0.1080, -0.0100, -0.0186, -0.0915, -0.0033,
        -0.0054, -0.0052, -0.0034, -0.1713, -0.0113, -0.0392, -0.0109, -0.0083,
        -0.0031,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.7624e-02, -1.1130e-01, -3.9788e-03, -1.1527e-02, -3.2403e-04,
        -3.1714e-03, -3.2376e-03, -8.7355e-03, -5.2514e-02, -4.3649e-03,
        -1.0214e-02, -1.6396e-02, -8.0159e-03, -7.6712e-03, -2.4879e-04,
        -2.8816e-03, -2.6331e-01, -8.1173e-03, -2.2507e-02, -5.7513e-03,
        -6.7984e-03, -8.1870e-03, -9.4308e-03, -2.6437e-01, -1.5198e-02,
        -2.4038e-02, -6.0748e-02, -1.1687e-02, -3.3216e-03, -4.3307e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0012, -0.0587, -0.0042, -0.0112, -0.0009, -0.0041, -0.0045, -0.0088,
        -0.0464, -0.0036, -0.0089, -0.0163, -0.0050, -0.0062, -0.0009, -0.0012,
        -0.1012, -0.0074, -0.0145, -0.0019, -0.0077, -0.0099, -0.0042, -0.5615,
        -0.0065, -0.0172, -0.0683, -0.0096, -0.0035, -0.0046,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0437, -0.5202, -0.0048, -0.0168, -0.0010, -0.0070, -0.0057, -0.0091,
        -0.0547, -0.0094, -0.0100, -0.0152, -0.0055, -0.0069, -0.0011, -0.0026,
        -0.1661, -0.0112, -0.0245, -0.0029, -0.0113, -0.0184, -0.0420, -0.0038,
        -0.0063,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.4967e-02, -5.1784e-02, -4.4160e-03, -3.1591e-03, -2.4974e-04,
        -2.1744e-03, -1.9052e-02, -4.5416e-03, -3.7917e-03, -3.6393e-03,
        -4.1877e-03, -2.9055e-03, -7.6986e-03, -6.5113e-02, -5.6437e-04,
        -1.3217e-03, -2.5786e-03, -7.4209e-01, -5.9000e-03, -5.6769e-03,
        -4.6943e-03, -6.4048e-03, -3.0877e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #4300: [tensor([-5.6414e-02, -2.6588e-02, -2.9512e-03, -1.3411e-02, -2.7205e-03,
        -1.9807e-03, -1.4837e-03, -1.0616e-02, -1.5178e-03, -6.2739e-04,
        -5.0936e-03, -9.8451e-02, -1.4833e-03,  5.9441e-04, -1.2234e-03,
        -2.5379e-03, -4.5413e-03, -1.3360e-02, -2.3757e-03,  1.1222e-03,
         3.4620e-05, -1.0618e-01, -3.3333e-03, -1.7971e-02, -4.9856e-03,
        -5.3237e-03, -5.4487e-01, -4.9358e-03, -8.3201e-03, -2.7017e-02,
        -1.9399e-02, -4.2346e-03, -2.0355e-03, -2.2676e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0650, -0.1644, -0.0061, -0.0279, -0.0378, -0.0019, -0.0018, -0.0093,
        -0.0318,  0.0005, -0.0039, -0.4795, -0.0039, -0.0021,  0.0014, -0.0008,
        -0.1291, -0.0105, -0.0127, -0.0035, -0.0021, -0.0041,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-6.9758e-02, -6.9755e-02, -3.8510e-03, -2.1706e-02, -2.9709e-02,
        -2.9283e-03, -7.6254e-04, -6.5425e-03, -2.7535e-02, -1.3498e-04,
        -5.1590e-03, -1.3403e-01, -4.1911e-03, -2.4249e-03,  3.7990e-04,
        -7.4709e-04, -5.1354e-02, -8.9935e-03, -5.7465e-03, -7.9474e-03,
        -1.0148e-03, -1.6526e-03, -5.2853e-01, -7.9412e-03, -2.6952e-03,
        -4.5132e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.0579e-01, -3.2094e-02, -3.8764e-03, -1.8855e-02, -1.9543e-02,
        -1.9787e-03, -5.1035e-04, -5.7985e-03, -1.8280e-02,  6.5252e-04,
        -3.8835e-03, -1.0296e-01, -4.2551e-03, -1.3195e-03,  7.2626e-04,
        -1.3456e-03, -2.6642e-02, -4.2599e-03, -3.8225e-03, -5.0608e-03,
        -3.6277e-03, -2.8742e-03, -6.2534e-01, -2.4873e-03, -8.0435e-04,
        -3.2060e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.2300, -0.0284, -0.0449, -0.0367, -0.0883, -0.0115, -0.0330, -0.0186,
        -0.0058, -0.0425, -0.0098, -0.0145, -0.0123, -0.0220, -0.0299, -0.2557,
        -0.0460, -0.0276, -0.0216, -0.0210,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1167, -0.0100, -0.0347, -0.0140, -0.0341, -0.0077, -0.0168, -0.0048,
        -0.0024, -0.0079, -0.0058, -0.0065, -0.0018, -0.0079, -0.0111, -0.0717,
        -0.0081, -0.5132, -0.0164, -0.0266, -0.0094, -0.0070, -0.0204, -0.0197,
        -0.0043, -0.0083, -0.0125,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0932, -0.0276, -0.0848, -0.0281, -0.0674, -0.0035, -0.0206, -0.0193,
        -0.0065, -0.0305, -0.0096, -0.0054, -0.0136, -0.0075, -0.0262, -0.2223,
        -0.0182, -0.0354, -0.1837, -0.0194, -0.0088, -0.0219, -0.0149, -0.0160,
        -0.0155,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2277, -0.0071, -0.0041, -0.0046, -0.0042, -0.0097, -0.0506, -0.0156,
        -0.0035, -0.0053, -0.1664, -0.0114, -0.0126, -0.0171, -0.0091, -0.0095,
        -0.0864, -0.0109, -0.0235, -0.2930, -0.0111, -0.0083, -0.0085,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0405, -0.0041, -0.0018, -0.0053, -0.0016, -0.0060, -0.0257, -0.0110,
        -0.0023, -0.0034, -0.2649, -0.0063, -0.0060, -0.0132, -0.0076, -0.0086,
        -0.0137, -0.0088, -0.3822, -0.0087, -0.0237, -0.1361, -0.0067, -0.0044,
        -0.0073,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0600, -0.0082, -0.0066, -0.0046, -0.0058, -0.0087, -0.0571, -0.0253,
        -0.0040, -0.0039, -0.2060, -0.0151, -0.0142, -0.0140, -0.3055, -0.0361,
        -0.0205, -0.1234, -0.0147, -0.0497, -0.0073, -0.0092,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.0019e-02, -1.3610e-01, -2.4106e-03, -1.5448e-02, -7.0957e-03,
        -3.3006e-04, -9.7659e-04, -4.8611e-03, -2.5288e-03, -7.5227e-03,
        -1.0369e-03, -2.1028e-03, -1.3368e-02, -6.7639e-03, -4.9508e-03,
        -7.2516e-01, -5.4327e-03, -4.9492e-03, -1.1027e-02, -3.1834e-03,
        -4.7337e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.3577e-02, -1.8153e-01, -2.8866e-03, -1.5863e-02, -4.7969e-03,
        -7.6169e-04, -2.6297e-03, -2.7434e-03, -3.9950e-03, -7.5388e-03,
        -1.9720e-04, -2.4257e-03, -9.4627e-03, -1.3237e-02, -9.7304e-03,
        -2.0001e-01, -1.0823e-02, -1.8178e-01, -2.6672e-01, -8.7060e-03,
        -4.3537e-03, -6.2329e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #4350: [tensor([-0.0440, -0.0080, -0.0066, -0.0974, -0.0060, -0.0137, -0.0091, -0.0041,
        -0.0049, -0.0056, -0.0068, -0.0108, -0.0101, -0.0109, -0.0099, -0.0015,
        -0.0051, -0.0113, -0.0163, -0.0987, -0.1884, -0.1608, -0.0065, -0.0074,
        -0.0143, -0.0057, -0.0058, -0.0181, -0.1602, -0.0217, -0.0131, -0.0073,
        -0.0099,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1224, -0.0186, -0.0016, -0.0033, -0.0084, -0.0019, -0.0022, -0.0025,
        -0.0010, -0.0055, -0.0026, -0.0025, -0.0021, -0.0033, -0.0020, -0.0030,
        -0.0023, -0.0892, -0.0056, -0.0029,  0.0009, -0.0007, -0.4423, -0.0030,
        -0.0490, -0.0039, -0.0038, -0.0046, -0.1701, -0.0067, -0.0042, -0.0031,
        -0.0040, -0.0018, -0.0036, -0.0063, -0.0038, -0.0024, -0.0032],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.8703e-02, -2.1824e-02, -2.2915e-03, -5.5068e-03, -9.3646e-03,
        -3.2729e-03, -1.9460e-03, -2.9901e-03, -1.4257e-03, -9.7931e-03,
        -3.1772e-03, -2.5755e-03, -2.5438e-03, -4.0973e-03, -2.5948e-03,
        -3.6170e-03, -3.3896e-03, -5.9575e-02, -6.0536e-03, -2.6474e-03,
         3.1085e-04, -1.4327e-03, -5.3929e-01, -3.9490e-03, -4.4743e-02,
        -6.5249e-03, -1.9205e-01, -4.4223e-03, -4.3074e-03, -1.8143e-03,
        -3.7718e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.6720e-02, -2.9713e-02, -1.7573e-03, -5.0021e-03, -8.7633e-03,
        -1.9679e-03, -1.9999e-03, -2.6697e-03, -1.1901e-03, -7.4993e-03,
        -1.2310e-03, -3.1284e-03, -3.0409e-03, -4.0845e-03, -2.2770e-03,
        -3.6607e-03, -3.5651e-03, -8.5782e-02, -6.5951e-03, -2.2063e-03,
         4.7642e-04, -1.7637e-03, -5.3014e-01, -4.1507e-03, -3.3201e-03,
        -1.8317e-01, -1.6153e-02, -3.9300e-03, -1.4111e-03, -2.6363e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0421, -0.0051, -0.0048, -0.0048, -0.0274, -0.0021, -0.0009, -0.0032,
        -0.0047, -0.0533, -0.0068, -0.8206, -0.0128, -0.0052, -0.0061,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0437, -0.0146, -0.0326, -0.0151, -0.1404, -0.0166, -0.0066, -0.0102,
        -0.0211, -0.6339, -0.0206, -0.0254, -0.0192,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0378, -0.0172, -0.0247, -0.0101, -0.1178, -0.0092, -0.0042, -0.0049,
        -0.0292, -0.6979, -0.0134, -0.0140, -0.0196,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0196, -0.0882, -0.0016, -0.0504, -0.0300, -0.0032, -0.0044, -0.0117,
        -0.0014, -0.0373, -0.0027, -0.0159, -0.0042, -0.0074, -0.0042, -0.0591,
        -0.0058, -0.0015, -0.0012, -0.0173, -0.0412, -0.4478, -0.0062, -0.0101,
        -0.0034, -0.0948, -0.0079, -0.0170, -0.0012, -0.0032,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0742, -0.3105, -0.0022, -0.0313, -0.0268, -0.0025, -0.0047, -0.0183,
        -0.0005, -0.0233, -0.0022, -0.0083, -0.0022, -0.0056, -0.0037, -0.0507,
        -0.0054, -0.0021, -0.0013, -0.0160, -0.0805, -0.2593, -0.0038, -0.0110,
        -0.0059, -0.0070, -0.0144, -0.0050, -0.0052, -0.0122, -0.0038,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0034, -0.0531, -0.0026, -0.0278, -0.0304, -0.0026, -0.0076, -0.0190,
        -0.0012, -0.0319, -0.0031, -0.0146, -0.0042, -0.0084, -0.0029, -0.0656,
        -0.0059, -0.0010, -0.0023, -0.0160, -0.0514, -0.2215, -0.0031, -0.0027,
        -0.3545, -0.0053, -0.0418, -0.0100, -0.0059,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0421, -0.2029, -0.0094, -0.0087, -0.0140, -0.0087, -0.0047, -0.0942,
        -0.0063, -0.0085, -0.1036, -0.0261, -0.0041, -0.0059, -0.0104, -0.0348,
        -0.0197, -0.0222, -0.3417, -0.0171, -0.0065, -0.0083,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0317, -0.0367, -0.0048, -0.0054, -0.0095, -0.0030, -0.0040, -0.0872,
        -0.0048, -0.0040, -0.0481, -0.0094, -0.0008, -0.0029, -0.0067, -0.0088,
        -0.0056, -0.6864, -0.0083, -0.0151, -0.0095, -0.0032, -0.0041,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4400: [tensor([-9.6101e-02, -5.1269e-03, -6.5838e-03, -4.1604e-03, -6.2566e-02,
        -9.8390e-04, -3.9771e-03, -7.5488e-03, -2.3155e-02, -5.2305e-01,
        -3.8039e-03, -1.4065e-02, -4.5754e-04, -3.8505e-03, -1.4251e-02,
        -1.5432e-02, -1.5186e-02, -9.2635e-03, -1.6284e-01, -2.2287e-02,
        -1.1384e-03, -4.1747e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0572, -0.0039, -0.0046, -0.0026, -0.0487, -0.0020, -0.0023, -0.0051,
        -0.0196, -0.2790, -0.0025, -0.0129, -0.0010, -0.0025, -0.0116, -0.0094,
        -0.0149, -0.0073, -0.0069, -0.3838, -0.0194, -0.0046, -0.0234, -0.0573,
        -0.0115, -0.0027, -0.0034], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.8927e-02, -6.0608e-03, -5.3127e-03, -6.2585e-03, -4.2008e-02,
        -2.9351e-03, -1.0954e-02, -2.4342e-03, -1.1935e-03, -5.1709e-01,
        -7.1695e-03, -9.4798e-03,  1.1361e-04, -3.4266e-03, -1.1498e-02,
        -8.1793e-03, -8.1091e-03, -1.4799e-02, -2.7006e-01, -8.3737e-03,
        -2.8884e-03, -2.7301e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0904, -0.0097, -0.0106, -0.0072, -0.0742, -0.0036, -0.0203, -0.0064,
        -0.0009, -0.3023, -0.0093, -0.0231, -0.0017, -0.0061, -0.0200, -0.0176,
        -0.0070, -0.0079, -0.3278, -0.0387, -0.0054, -0.0099,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1133, -0.0096, -0.0108, -0.0058, -0.1024, -0.0067, -0.0197, -0.0059,
        -0.0027, -0.5085, -0.0106, -0.0532, -0.0052, -0.0074, -0.0341, -0.0182,
        -0.0154, -0.0138, -0.0335, -0.0078, -0.0153,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0240, -0.1924, -0.0037, -0.0053, -0.0266, -0.0586, -0.0031, -0.0038,
        -0.0058, -0.4496, -0.0044, -0.0085, -0.0012, -0.0028, -0.1765, -0.0107,
        -0.0084, -0.0077, -0.0068,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0189, -0.1008, -0.0030, -0.0031, -0.0173, -0.0433, -0.0024, -0.0031,
        -0.0032, -0.1444, -0.0016, -0.0050, -0.0010, -0.0029, -0.1055, -0.0067,
        -0.0076, -0.0069, -0.0077, -0.0213, -0.0604, -0.4194, -0.0066, -0.0036,
        -0.0044,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.2317e-02, -4.0447e-02, -1.6882e-03, -2.4010e-03, -1.2361e-02,
        -2.7102e-02, -3.1567e-03, -1.6766e-03, -2.8598e-03, -1.1957e-01,
        -2.3411e-03, -4.3513e-03, -4.6157e-04, -1.8765e-03, -4.0397e-02,
        -5.5749e-03, -2.2676e-02, -6.3548e-01, -5.4120e-03, -7.1485e-03,
        -4.4484e-03, -1.0873e-02, -1.8187e-03, -3.5646e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0797, -0.0152, -0.0076, -0.0118, -0.0015, -0.0519, -0.0099, -0.0057,
        -0.0914, -0.0068, -0.0343, -0.0105, -0.0018, -0.0059, -0.0141, -0.0194,
        -0.0399, -0.0087, -0.5510, -0.0257, -0.0028, -0.0046,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0413, -0.0275, -0.0151, -0.0152, -0.0022, -0.0913, -0.0195, -0.0120,
        -0.2432, -0.0251, -0.0530, -0.0198, -0.0049, -0.0091, -0.0324, -0.0187,
        -0.0764, -0.0214, -0.0126, -0.1436, -0.0868, -0.0076, -0.0212,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0174, -0.0426, -0.0160, -0.0193, -0.0040, -0.0797, -0.0119, -0.0179,
        -0.1736, -0.0184, -0.0575, -0.0229, -0.0094, -0.0085, -0.0374, -0.0256,
        -0.0569, -0.0119, -0.0590, -0.2433, -0.0093, -0.0061, -0.0360, -0.0152,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0166, -0.0386, -0.0053, -0.0014, -0.0036, -0.0104, -0.0217, -0.0016,
        -0.0037, -0.0051, -0.0026, -0.3620, -0.0015, -0.0007, -0.0010, -0.1783,
        -0.0062, -0.1763, -0.0077, -0.1471, -0.0024, -0.0018, -0.0041,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4450: [tensor([-0.3064, -0.0150, -0.0200, -0.0378, -0.0071, -0.0140, -0.0607, -0.3274,
        -0.0111, -0.0079, -0.0032, -0.0095, -0.0346, -0.0391, -0.0110, -0.0262,
        -0.0287, -0.0166, -0.0237,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.6575e-02, -3.3294e-03, -7.1487e-03, -2.3739e-02, -3.0847e-03,
        -7.5498e-04, -6.1049e-03, -2.5331e-03, -2.8971e-03, -1.4954e-03,
        -6.3817e-03, -1.4068e-02, -4.4900e-02, -1.1219e-02, -1.4592e-02,
        -4.0400e-03, -6.1925e-03, -8.0788e-01, -5.6946e-03, -2.8376e-03,
        -4.5309e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0065, -0.0078, -0.0073, -0.0555, -0.0041, -0.0027, -0.0069, -0.0062,
        -0.0026, -0.0009, -0.0083, -0.1543, -0.0069, -0.7037, -0.0132, -0.0060,
        -0.0071,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-6.2351e-02, -5.0092e-03, -7.2922e-03, -2.5583e-02, -3.5898e-03,
        -1.5084e-04, -7.3966e-03, -3.9574e-03, -3.0133e-03, -2.4759e-03,
        -6.7611e-03, -2.1904e-02, -8.5317e-02, -5.7247e-03, -1.8569e-02,
        -4.3499e-03, -8.9883e-02, -2.0381e-02, -4.6221e-03, -7.3279e-03,
        -6.0059e-01, -4.1447e-03, -5.2696e-03, -4.3328e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([ 4.1643e-02, -6.3337e-03, -5.7132e-03, -6.2497e-03, -6.6895e-03,
        -2.7576e-03, -8.3910e-03, -3.0148e-03, -6.5037e-03, -8.8994e-03,
        -8.3546e-03, -6.0523e-01, -4.8028e-03, -1.8844e-02, -5.8087e-03,
         5.6017e-04, -2.8633e-03, -8.9089e-03, -1.4926e-02, -6.4192e-02,
        -6.3283e-03, -2.2637e-02, -3.3314e-02, -8.5200e-02, -1.6252e-02,
        -2.3761e-03, -3.2092e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.0602e-03, -5.1911e-03, -5.0137e-03, -9.3073e-03, -8.0273e-03,
        -1.6638e-03, -5.9358e-03, -5.1044e-03, -1.3283e-02, -1.1258e-02,
        -7.4391e-03, -7.4498e-01, -2.7679e-03, -2.4069e-02, -1.0346e-02,
        -1.7565e-03, -3.2424e-03, -1.6423e-02, -2.8481e-02, -7.0039e-02,
        -4.5146e-03, -3.8432e-04, -1.2488e-02, -6.2221e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-6.8273e-02, -3.3064e-03, -2.8876e-03, -4.2449e-03, -2.2110e-03,
        -1.2867e-03, -4.1117e-03, -1.4532e-03, -4.5936e-03, -3.2063e-03,
        -4.5795e-03, -9.6616e-02, -2.9047e-03, -8.8258e-03, -2.6668e-03,
         4.6545e-05, -2.0592e-03, -4.5012e-03, -7.5003e-03, -3.2795e-03,
        -3.2064e-03, -5.3211e-02, -1.8689e-02, -9.7030e-03, -1.3778e-02,
        -5.4399e-03, -6.3674e-03, -6.5019e-01, -2.9029e-03, -3.1419e-03,
        -1.1738e-03, -3.6407e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1293, -0.0076, -0.0114, -0.0099, -0.0021, -0.0045, -0.0535, -0.0004,
        -0.0074, -0.0108, -0.0043, -0.0193, -0.0036, -0.0044, -0.0745, -0.0116,
        -0.0085, -0.2519, -0.0063, -0.2278, -0.1372, -0.0037, -0.0048, -0.0052,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0516, -0.0135, -0.0178, -0.0209, -0.0024, -0.0084, -0.1365, -0.0006,
        -0.0199, -0.0165, -0.0089, -0.0273, -0.0076, -0.0085, -0.0200, -0.1546,
        -0.0127, -0.0548, -0.2225, -0.0124, -0.0510, -0.0197, -0.0714, -0.0140,
        -0.0267,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([ 0.0313, -0.0144, -0.0254, -0.0200, -0.0141, -0.0180, -0.2457, -0.0025,
        -0.0272, -0.0119, -0.0107, -0.0514, -0.0139, -0.0157, -0.0380, -0.2315,
        -0.0217, -0.0444, -0.0171, -0.0258, -0.0632, -0.0194, -0.0368,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.3764e-01, -4.8896e-03, -4.2079e-03, -3.3334e-03, -1.0948e-02,
        -2.2242e-03, -4.4325e-03, -2.2670e-03, -4.4735e-03, -4.4555e-03,
        -1.9697e-03, -3.5279e-02, -4.3231e-02,  5.6743e-04,  8.4701e-04,
        -1.0306e-03, -5.2975e-03, -5.4809e-03, -1.2621e-02, -8.6389e-03,
        -3.6195e-03, -6.3504e-03, -1.4070e-01, -4.7764e-03, -1.3576e-02,
        -2.9985e-02, -5.0251e-01,  2.5023e-04, -2.5100e-03, -1.8885e-03,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.7460e-02, -4.8834e-03, -8.0083e-03, -4.5272e-03, -1.7605e-02,
        -3.5227e-03, -7.0032e-03, -1.6381e-03, -5.1484e-03, -3.8762e-02,
        -2.0568e-03, -4.2012e-02, -7.7982e-02, -1.7141e-04, -1.0747e-03,
        -2.0318e-03, -6.3431e-03, -7.4650e-03, -2.0479e-02, -4.8835e-02,
        -6.3492e-01, -6.7843e-04, -4.2878e-03, -3.1021e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4500: [tensor([-1.2797e-01, -3.7290e-02, -3.7236e-03, -5.5078e-03, -2.3553e-03,
        -4.1654e-03, -2.1045e-03, -1.7931e-03, -5.0112e-03, -3.6119e-03,
        -3.3424e-03, -9.6784e-03, -3.3613e-02, -3.2267e-03,  6.4268e-04,
        -2.3783e-03, -4.7709e-02, -4.5308e-03, -2.6335e-02, -6.6506e-03,
        -5.1125e-03, -9.2405e-03, -6.1907e-01, -6.9831e-03, -1.7249e-02,
        -6.2377e-03, -5.2058e-04, -3.9459e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2201, -0.2254, -0.0081, -0.0080, -0.0026, -0.0065, -0.0055, -0.0006,
        -0.0130, -0.0110, -0.0062, -0.0213, -0.1158, -0.0020, -0.0011, -0.0020,
        -0.2257, -0.0199, -0.0312, -0.0037, -0.0369, -0.0131, -0.0107, -0.0096,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0526, -0.0284, -0.0252, -0.0263, -0.2779, -0.0126, -0.0072, -0.0105,
        -0.0365, -0.4137, -0.0174, -0.0462, -0.0230, -0.0225,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2663, -0.0329, -0.0283, -0.0231, -0.1858, -0.0166, -0.0073, -0.0113,
        -0.1756, -0.0366, -0.1163, -0.0272, -0.0277, -0.0258, -0.0193,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0891, -0.0096, -0.0058, -0.0104, -0.1040, -0.0099, -0.0061, -0.0071,
        -0.0870, -0.0321, -0.0291, -0.0319, -0.3357, -0.2113, -0.0081, -0.0113,
        -0.0116,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.3109e-02, -1.0073e-01, -3.1608e-03, -2.8265e-03, -2.5935e-02,
        -3.2398e-03, -2.2567e-03, -1.7873e-03, -2.9450e-03, -3.6865e-03,
        -1.6696e-03, -2.0359e-01, -3.2432e-03, -1.8043e-02, -1.8094e-03,
        -6.3033e-03, -2.2285e-02, -5.9185e-03, -2.5486e-04, -1.0867e-03,
        -3.9362e-01, -5.6162e-03, -1.3598e-02, -5.8380e-03, -6.6666e-03,
        -2.9843e-03, -1.4217e-02, -3.7489e-03, -2.0468e-03, -6.6552e-02,
        -4.4864e-03, -7.1425e-03, -4.4138e-03, -1.0555e-03, -4.1324e-03],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-9.5362e-02, -4.3106e-02, -4.4002e-03, -6.1496e-03, -2.7240e-02,
        -3.6750e-03, -2.2344e-03, -2.1395e-03, -3.7013e-03, -4.6090e-03,
        -2.3742e-03, -1.1536e-01, -2.5420e-03, -1.5195e-02, -3.6898e-03,
        -9.0595e-03, -3.2505e-02, -9.5689e-03, -3.0316e-04, -1.5152e-03,
        -8.3813e-02, -1.2659e-02, -4.9433e-01, -5.1474e-03, -5.6565e-03,
        -7.2152e-03, -1.8304e-03, -4.6171e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.7472e-02, -3.6565e-02, -2.2451e-03, -2.7647e-03, -1.0162e-02,
        -3.0466e-03, -1.2154e-03, -5.3495e-04, -2.3496e-03, -4.4237e-03,
        -1.7360e-04, -5.7404e-02, -2.6009e-03, -1.0858e-02, -2.1135e-03,
        -5.2643e-03, -1.4832e-02, -3.9026e-03,  2.8473e-04, -2.3643e-04,
        -2.1059e-01, -4.0142e-03, -1.3116e-03, -4.7744e-03, -7.6693e-02,
        -3.8520e-03, -1.6624e-02, -4.6217e-01, -3.5749e-03, -3.3253e-03,
        -1.9876e-03, -2.6339e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0421, -0.0057, -0.0080, -0.0077, -0.0492, -0.0067, -0.0010, -0.0038,
        -0.0132, -0.0716, -0.0105, -0.7512, -0.0127, -0.0073, -0.0094,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0014, -0.0090, -0.0244, -0.0146, -0.2265, -0.0146, -0.0076, -0.0089,
        -0.0223, -0.2552, -0.0144, -0.0429, -0.2357, -0.0412, -0.0534, -0.0156,
        -0.0125,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2506, -0.0098, -0.0132, -0.0139, -0.1382, -0.0075, -0.0036, -0.0051,
        -0.0172, -0.3256, -0.0073, -0.0238, -0.1424, -0.0242, -0.0057, -0.0119,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-3.6775e-02, -2.4938e-03, -3.8207e-03, -3.7690e-03, -3.4860e-03,
        -8.1098e-04, -1.2844e-02, -1.7165e-03, -4.6589e-03, -5.0357e-03,
        -3.2328e-02, -9.2337e-03, -4.7016e-03, -1.9251e-02,  9.4187e-05,
         5.5293e-04, -2.7330e-03, -7.2658e-02, -1.0664e-02, -3.9419e-02,
        -4.0190e-03, -4.3525e-02, -3.1054e-03, -7.7979e-03, -8.7063e-03,
        -3.5782e-03, -7.4760e-03, -5.2460e-03, -6.4181e-01, -4.3877e-03,
        -3.3010e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4550: [tensor([-0.0148, -0.0207, -0.0180, -0.0139, -0.0019, -0.0052, -0.0089, -0.0062,
        -0.0101, -0.0099, -0.0055, -0.0195, -0.0214, -0.0045, -0.0182, -0.0053,
        -0.0055, -0.0099, -0.0174, -0.0011, -0.0016, -0.0054, -0.0934, -0.0190,
        -0.5069, -0.0229, -0.0800, -0.0160, -0.0113, -0.0128, -0.0129,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.9644e-01, -2.2351e-02, -1.3613e-02, -1.0720e-02, -4.6396e-03,
        -6.2802e-03, -8.8179e-03, -4.6033e-03, -6.3673e-03, -8.2453e-03,
        -3.8722e-03, -1.9419e-02, -3.2269e-02, -7.5527e-03, -2.0424e-02,
        -5.0569e-03, -3.2820e-03, -1.6049e-02, -1.5147e-02, -2.6672e-03,
        -3.0544e-04, -3.8084e-03, -5.5239e-02, -9.2918e-03, -4.9011e-01,
        -1.0129e-02, -7.2524e-04, -1.1376e-02, -5.1695e-03, -6.0240e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0814, -0.0388, -0.0288, -0.0182,  0.0004, -0.0110, -0.0155, -0.0023,
        -0.0074, -0.0151, -0.0043, -0.0452, -0.0421, -0.0084, -0.0257, -0.0087,
        -0.0014, -0.0242, -0.0271, -0.0053, -0.0033, -0.0071, -0.2491, -0.1421,
        -0.1106, -0.0250, -0.0180, -0.0082, -0.0140, -0.0114,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0608, -0.0058, -0.0049, -0.0032, -0.0015, -0.0020, -0.0037, -0.0009,
        -0.0013, -0.0035, -0.0019, -0.0060, -0.0099, -0.0023, -0.0072, -0.0017,
        -0.0010, -0.0045, -0.0053, -0.0006,  0.0006, -0.0016, -0.0404, -0.0050,
        -0.0035, -0.0056, -0.0127, -0.5009, -0.0064, -0.0056, -0.0048, -0.2706,
        -0.0103, -0.0015, -0.0026,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.1494e-01, -4.0078e-02, -3.6402e-02, -2.4667e-02, -5.7368e-03,
        -7.5757e-03, -1.9496e-02, -8.2521e-03, -8.2427e-03, -2.1938e-02,
        -1.0980e-02, -3.4581e-02, -4.4356e-02, -6.8701e-03, -3.0248e-02,
        -7.3471e-03, -5.2349e-03, -1.1235e-02, -2.3362e-02, -4.0679e-03,
        -3.8526e-05, -9.3477e-03, -2.5675e-01, -3.8482e-02, -5.1065e-02,
        -9.3123e-03, -4.5471e-02, -2.3929e-02,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0913, -0.0385, -0.0307, -0.0255, -0.0091, -0.0058, -0.0217, -0.0067,
        -0.0109, -0.0237, -0.0082, -0.0418, -0.0518, -0.0130, -0.0312, -0.0167,
        -0.0061, -0.0192, -0.0248, -0.0069, -0.0034, -0.0146, -0.1704, -0.0569,
        -0.0825, -0.1393, -0.0070,  0.0016, -0.0257, -0.0151,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.0102e-01, -6.9638e-02, -4.4438e-03, -1.1926e-02, -4.7923e-03,
        -1.5529e-02, -2.5390e-03, -1.3208e-03, -2.4706e-03, -4.3379e-03,
        -4.2436e-03, -3.7915e-03, -5.3742e-03, -3.6160e-03, -4.0831e-02,
        -5.0940e-03, -8.2493e-03, -1.6439e-03, -6.3769e-03, -1.4693e-01,
        -7.0738e-03,  9.0147e-05, -1.3705e-03, -8.7231e-03, -4.3695e-03,
        -6.1297e-03, -4.5927e-01, -1.0046e-02, -8.0235e-03, -3.9364e-03,
        -7.4186e-03, -1.0402e-02, -2.1543e-02, -2.5427e-03, -4.8979e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1569, -0.1663, -0.0047, -0.0203, -0.0039, -0.0312, -0.0067, -0.0022,
        -0.0022, -0.0058, -0.0062, -0.0102, -0.0084, -0.0038, -0.0646, -0.0059,
        -0.0081, -0.0050, -0.0050, -0.1133, -0.0075, -0.0013, -0.0048, -0.1672,
        -0.0113, -0.0285, -0.0182, -0.0106, -0.0041, -0.0731, -0.0030, -0.0053,
        -0.0133, -0.0072, -0.0047, -0.0090,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.6278e-02, -4.8334e-02, -2.0761e-03, -5.9120e-03, -1.7564e-03,
        -8.4441e-03, -1.1115e-03, -8.9301e-04, -1.6465e-03, -1.8301e-03,
        -8.6459e-04, -2.8513e-03, -2.5128e-03, -1.9837e-03, -1.1102e-02,
        -1.8421e-03, -1.9599e-03, -1.0423e-03, -1.9138e-03, -4.0822e-02,
        -1.4486e-03,  1.0361e-04,  2.3851e-04, -3.2917e-03, -1.6319e-02,
        -2.0620e-02, -5.6142e-03, -6.1357e-03, -5.5105e-02, -2.3241e-03,
        -2.2788e-03, -2.8734e-02, -3.0837e-03, -3.7651e-03, -9.4265e-03,
        -6.3766e-01, -5.3465e-03, -1.5801e-03, -1.7519e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-2.9868e-02, -2.3673e-02, -2.1516e-03, -5.4942e-03, -2.3558e-03,
        -4.7621e-03, -1.7004e-03, -1.0733e-03, -1.2501e-03, -1.8968e-03,
        -7.0220e-04, -1.7114e-03, -1.7947e-03, -1.8666e-03, -7.9803e-03,
        -1.8212e-03, -2.5445e-03, -1.6098e-03, -2.0218e-03, -4.4359e-02,
        -2.1969e-03,  2.6399e-04, -1.7912e-04, -7.1406e-02, -2.2274e-03,
        -5.4536e-03, -5.4305e-03, -3.3884e-03, -3.7755e-03, -2.0846e-03,
        -3.2934e-03, -8.7254e-02, -3.4038e-03, -3.1169e-03, -2.8409e-03,
        -6.5565e-01, -4.6294e-03, -2.7732e-03,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.2101, -0.1583, -0.0041, -0.0158, -0.0074, -0.0164, -0.0041, -0.0012,
        -0.0036, -0.0075, -0.0044, -0.0101, -0.0095, -0.0048, -0.1214, -0.0061,
        -0.0092, -0.0070, -0.0087, -0.1541, -0.0103, -0.0016, -0.0080, -0.0069,
        -0.0011, -0.0601, -0.0814, -0.0117, -0.0071, -0.0171, -0.0155, -0.0072,
        -0.0081,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0526, -0.0862, -0.0048, -0.0136, -0.0053, -0.0120, -0.0047, -0.0004,
        -0.0030, -0.0067, -0.0040, -0.0039, -0.0052, -0.0063, -0.0784, -0.0050,
        -0.0085, -0.0055, -0.0046, -0.1051, -0.0055, -0.0006, -0.0029, -0.0083,
        -0.0056, -0.2761, -0.0352, -0.0136, -0.2243,  0.0009, -0.0055, -0.0056,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4600: [tensor([-3.6568e-02, -7.8725e-02, -8.0568e-03, -8.6486e-03, -4.0524e-02,
        -2.9491e-03, -2.2292e-02, -5.6958e-03, -4.6225e-02, -7.6876e-03,
         1.0133e-04, -3.0245e-03, -4.1963e-01, -1.2477e-02, -4.0748e-02,
        -1.0716e-02, -2.3407e-01, -8.3057e-03, -6.0038e-03, -7.5483e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 7.1916e-03, -8.5067e-02, -2.8636e-03, -4.9846e-03, -3.6178e-02,
        -1.4358e-03, -1.4077e-02, -4.4323e-03, -2.5472e-02, -4.2867e-03,
        -2.0100e-04, -1.7433e-03, -6.8388e-03, -6.1393e-03, -6.4445e-03,
        -1.0393e-02, -6.5842e-03, -3.1966e-01, -7.4625e-03, -3.8223e-01,
        -5.6868e-03, -6.5228e-03, -6.9589e-03, -7.4319e-03, -5.3920e-03,
        -7.4798e-03, -1.9775e-02, -1.6268e-03, -5.4411e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.9156e-02, -9.8601e-02, -5.7598e-03, -9.2958e-03, -4.6695e-02,
        -2.8790e-03, -1.4390e-02, -5.1795e-03, -3.3416e-02, -3.3536e-03,
         6.8652e-05, -3.1307e-03, -3.7856e-01, -8.0187e-03, -4.0004e-02,
        -1.3728e-02, -6.4066e-03, -2.5508e-01, -7.5877e-03, -4.5292e-03,
        -4.1672e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0666, -0.2086, -0.0075, -0.0093, -0.1156, -0.0033, -0.0278, -0.0089,
        -0.0665, -0.0124, -0.0028, -0.0055, -0.1428, -0.0199, -0.0976, -0.0132,
        -0.1639, -0.0095, -0.0088, -0.0094,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.3517e-02, -7.4620e-02, -5.2851e-03, -9.2478e-03, -4.9562e-02,
        -2.7061e-03, -1.6006e-02, -8.1410e-03, -4.6146e-02, -8.4795e-03,
        -4.0168e-04, -4.1657e-03, -6.4085e-01, -7.7760e-03, -3.3951e-02,
        -1.2497e-02, -6.6540e-03, -9.9900e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.8891e-02, -5.9930e-02, -5.8169e-03, -5.1087e-03, -5.0068e-02,
        -1.3301e-03, -2.1053e-02, -4.5148e-03, -2.6365e-02, -4.1242e-03,
        -4.0755e-04, -3.8177e-03, -6.9849e-01, -9.6337e-03, -2.6500e-02,
        -7.7900e-03, -8.0412e-03, -9.4798e-03, -1.2123e-02, -2.2768e-03,
        -4.2336e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0947, -0.2563, -0.0108, -0.0105, -0.0993, -0.0065, -0.0485, -0.0109,
        -0.1580, -0.0110, -0.0021, -0.0058, -0.1482, -0.0184, -0.0738, -0.0209,
        -0.0068, -0.0175,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.6362e-02, -7.4834e-02, -5.9855e-03, -4.7530e-03, -2.5363e-02,
        -1.2666e-03, -1.1135e-02, -3.3053e-03, -2.7524e-02, -4.3270e-03,
        -5.3791e-04, -1.5882e-03, -7.4592e-01, -7.9829e-03, -3.0621e-02,
        -6.2773e-03, -6.1785e-03, -9.9423e-03, -3.6450e-03, -4.5550e-03,
        -4.6709e-03, -1.0266e-03, -2.2036e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1026, -0.2549, -0.0091, -0.0097, -0.0807, -0.0043, -0.0318, -0.0088,
        -0.1173, -0.0087, -0.0028, -0.0041, -0.2340, -0.0182, -0.0696, -0.0130,
        -0.0074, -0.0138, -0.0092,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0704, -0.1469, -0.0065, -0.0083, -0.0375, -0.0023, -0.0247, -0.0041,
        -0.0410, -0.0061, -0.0017, -0.0049, -0.3989, -0.0110, -0.0333, -0.0140,
        -0.1600, -0.0114, -0.0061, -0.0058, -0.0052,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0132, -0.2920, -0.0114, -0.0167, -0.1320, -0.0069, -0.0407, -0.0090,
        -0.0859, -0.0156, -0.0037, -0.0073, -0.1397, -0.0191, -0.0796, -0.0272,
        -0.0120, -0.0108, -0.0215, -0.0172, -0.0182, -0.0077, -0.0128,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.1104e-02, -3.7091e-02, -6.7411e-04, -6.1278e-03, -2.0490e-02,
        -2.9572e-03, -2.0642e-03, -2.1231e-03, -4.1477e-03, -2.7508e-03,
        -1.8207e-03, -7.6928e-01, -5.1070e-03, -6.9725e-03, -2.2925e-02,
        -7.1278e-03, -4.4974e-03, -3.5214e-03, -5.4693e-03, -5.1109e-03,
        -5.5069e-03, -7.8475e-03, -1.1448e-03, -4.1365e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #4650: [tensor([-0.2011, -0.0123, -0.0036, -0.0148, -0.0069, -0.0066, -0.0074, -0.0083,
        -0.0016, -0.0073, -0.1505, -0.0051, -0.0208, -0.0134, -0.0023, -0.0038,
        -0.1117, -0.0484, -0.0230, -0.3134, -0.0164, -0.0069, -0.0146,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 7.9208e-02, -7.1887e-03, -2.8716e-03, -7.3424e-03, -3.2780e-03,
        -4.1764e-03, -5.9791e-03, -9.8554e-03, -4.5743e-03, -3.8509e-03,
        -5.6264e-02, -4.0457e-03, -1.6260e-02, -1.5089e-02, -3.4170e-04,
        -2.4912e-03, -8.1142e-02, -2.5013e-02, -1.1609e-02, -1.6786e-01,
        -9.0316e-03, -4.4726e-01, -2.0702e-02, -5.2429e-03, -9.3312e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1068, -0.2218, -0.0071, -0.0960, -0.0075, -0.0476, -0.0054, -0.0063,
        -0.0444, -0.0130, -0.0010, -0.0054, -0.3040, -0.0167, -0.0932, -0.0146,
        -0.0092,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0644, -0.1640, -0.0054, -0.0471, -0.0060, -0.0282, -0.0036, -0.0036,
        -0.0439, -0.0142, -0.0014, -0.0082, -0.1218, -0.0109, -0.0704, -0.3836,
        -0.0117, -0.0114,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0388, -0.2906, -0.0053, -0.1132, -0.0069, -0.0787, -0.0082, -0.0061,
        -0.0593, -0.0122, -0.0026, -0.0067, -0.2216, -0.0147, -0.1119, -0.0120,
        -0.0112,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-9.4895e-02, -2.4829e-02, -3.8008e-03, -3.7902e-03, -1.7093e-03,
        -1.6187e-03, -2.6269e-03, -2.5956e-02, -3.1816e-03, -2.8709e-03,
        -6.5466e-03, -2.4385e-03, -2.1190e-03, -1.2096e-02, -1.0351e-02,
        -3.0367e-03, -2.4559e-03, -8.8503e-03, -1.6811e-03,  1.0946e-03,
        -5.6182e-04, -2.6852e-02, -6.4211e-03, -1.2076e-02, -8.3154e-03,
        -3.8932e-03, -7.1668e-01, -3.6169e-03, -2.3891e-03, -3.2471e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.0775e-01, -7.2223e-02, -4.9757e-03, -6.8180e-03, -1.5493e-03,
        -1.3066e-03, -3.7726e-03, -6.5300e-02, -4.2506e-03, -6.3023e-03,
        -8.8283e-03, -2.7966e-03, -3.7293e-03, -2.3608e-02, -1.4842e-02,
        -4.5532e-03, -3.2882e-03, -9.8312e-03, -3.8781e-03,  7.1147e-05,
        -9.9741e-04, -8.6160e-02, -1.8143e-02, -2.1651e-02, -9.1033e-03,
        -5.9174e-03, -7.4604e-03, -8.7505e-03, -2.1618e-02, -1.5606e-01,
        -2.5136e-03, -6.1219e-03, -2.9073e-01, -7.2377e-03, -2.7023e-03,
        -5.1643e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1343, -0.1860, -0.0114, -0.0125, -0.0049, -0.0047, -0.0054, -0.1414,
        -0.0114, -0.0160, -0.0185, -0.0090, -0.0150, -0.1140, -0.0331, -0.0071,
        -0.0044, -0.0308, -0.0083, -0.0017, -0.0040, -0.1096, -0.0270, -0.0678,
        -0.0125, -0.0079, -0.0015,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.3655e-02, -3.6466e-02, -2.7304e-03, -3.2804e-03, -1.7912e-02,
        -8.8072e-04, -4.8960e-03, -1.0117e-03, -7.3564e-03, -3.0711e-03,
        -7.5769e-03, -1.8049e-02, -2.8659e-03, -4.6355e-03, -1.4476e-02,
        -3.7045e-03, -3.2458e-03, -2.1003e-03, -2.6998e-02, -7.7183e-04,
        -1.3858e-03, -4.5730e-04, -5.0677e-05, -1.8206e-02, -6.4071e-03,
        -3.7997e-02, -8.0177e-03, -2.6376e-03, -4.7138e-03, -6.2552e-01,
        -5.4751e-03, -3.7948e-03, -3.4948e-02, -3.7764e-02, -2.9309e-03,
        -4.0142e-03], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0308, -0.0378, -0.0040, -0.0038, -0.0336, -0.0016, -0.0040, -0.0015,
        -0.0118, -0.0017, -0.0084, -0.0202, -0.0044, -0.0054, -0.0184, -0.0030,
        -0.0034, -0.0032, -0.0311, -0.0021, -0.0007,  0.0004, -0.0009, -0.1944,
        -0.0087, -0.0463, -0.0112, -0.0530, -0.1691, -0.0066, -0.0045, -0.2668,
        -0.0054, -0.0019,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1690, -0.0881, -0.0061, -0.0097, -0.0768, -0.0021, -0.0084, -0.0012,
        -0.0197, -0.0057, -0.0224, -0.0755, -0.0067, -0.0115, -0.0743, -0.0057,
        -0.0046, -0.0060, -0.1191, -0.0041, -0.0015, -0.0009, -0.0016, -0.0533,
        -0.0165, -0.1148, -0.0305, -0.0057, -0.0065, -0.0104, -0.0118, -0.0120,
        -0.0105, -0.0053, -0.0022,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.9929e-02, -9.6942e-02, -6.5286e-03, -6.3525e-02, -5.1117e-02,
        -4.2568e-03, -3.2807e-03, -2.8411e-03, -2.8244e-03,  3.3403e-04,
        -4.3913e-03, -1.5642e-03, -3.3731e-02, -5.1490e-03,  2.8840e-04,
        -2.6324e-03, -1.2321e-01, -1.1108e-02, -3.1423e-02, -4.7421e-01,
        -5.9081e-03, -2.7555e-03, -1.0800e-02, -8.2658e-04, -5.0791e-03,
        -5.3366e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4700: [tensor([-8.3233e-02, -5.9668e-02, -2.0949e-03, -1.2601e-02, -5.1023e-03,
        -1.6953e-03, -3.9104e-03, -6.6894e-03, -6.8961e-03, -2.9894e-02,
        -2.6796e-03, -3.6514e-03, -6.5689e-02, -7.0620e-03, -1.0017e-04,
        -2.0906e-03, -5.8406e-02, -1.0876e-02, -6.9542e-03, -9.8044e-03,
        -5.7987e-03, -2.0322e-01, -2.7810e-02, -1.3393e-02, -3.5387e-01,
        -9.5854e-03, -2.3848e-03, -4.8424e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.0829e-02, -1.0525e-01, -2.1926e-03, -1.1780e-02, -5.2709e-03,
        -1.2914e-03, -3.3904e-03, -6.8768e-03, -4.9779e-03, -2.8460e-02,
        -2.2995e-03, -3.4584e-03, -9.2735e-02, -1.0773e-02,  2.7043e-04,
        -2.2592e-03, -1.8534e-01, -7.1105e-03, -6.1099e-03, -4.7324e-01,
        -7.5228e-03, -4.0834e-03, -4.4713e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0745, -0.1847, -0.0048, -0.0251, -0.0131, -0.0045, -0.0041, -0.0101,
        -0.0135, -0.0569, -0.0052, -0.0136, -0.1781, -0.0302, -0.0003, -0.0053,
        -0.2646, -0.0223, -0.0570, -0.0164, -0.0061, -0.0096,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0984, -0.1606, -0.0080, -0.0806, -0.0651, -0.0016, -0.0057, -0.0042,
        -0.0690,  0.0016, -0.0007, -0.0014, -0.1313, -0.0113, -0.0491, -0.0049,
        -0.0086, -0.0163, -0.0158, -0.1082, -0.1324, -0.0054, -0.0131, -0.0066,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.0563e-02, -3.1902e-02, -6.4903e-03, -2.5635e-02, -2.6823e-02,
        -2.2985e-03, -5.5528e-03, -3.7264e-03, -2.4733e-02,  7.1268e-04,
         2.5288e-04, -1.0104e-03, -5.6221e-01, -1.1174e-02, -6.3721e-03,
        -2.4548e-01, -2.6249e-03, -5.8122e-03, -6.6330e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.7113e-01, -2.1674e-01, -1.4536e-02, -8.6256e-02, -1.0365e-01,
        -4.6123e-03, -8.2539e-03, -4.9013e-03, -1.1906e-01, -5.6994e-05,
        -5.8249e-04, -7.1777e-03, -1.5567e-02, -1.7182e-01, -3.6491e-03,
        -7.5794e-03, -1.7485e-02, -2.6275e-02, -9.2730e-03, -1.1396e-02,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1589, -0.0478, -0.0191, -0.0167, -0.0054, -0.0386, -0.1332, -0.0211,
        -0.0118, -0.0202, -0.0403, -0.0865, -0.0489, -0.0857, -0.1605, -0.0493,
        -0.0210, -0.0351,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.3014, -0.0971, -0.0264, -0.0640, -0.0147, -0.0634, -0.1629, -0.0341,
        -0.0103, -0.0364, -0.0306, -0.0435, -0.0358, -0.0396, -0.0397,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0607, -0.0359, -0.0122, -0.0114, -0.0052, -0.0190, -0.0758, -0.0080,
        -0.0022, -0.0080, -0.0347, -0.0435, -0.0196, -0.2765, -0.3519, -0.0225,
        -0.0128,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.0002e-01, -3.7022e-03, -9.1303e-03, -6.4115e-03, -5.6252e-03,
        -2.0623e-02, -4.2285e-03, -3.4049e-03, -1.3869e-02, -8.9280e-03,
         3.0108e-04, -3.0830e-03, -6.0535e-01, -1.7775e-02, -4.3425e-02,
        -1.5889e-02, -6.5358e-02, -6.5134e-02, -5.6390e-03, -2.1108e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1224, -0.0027, -0.0066, -0.0054, -0.0039, -0.0228, -0.0030, -0.0017,
        -0.0078, -0.0072, -0.0021, -0.0007, -0.1698, -0.0121, -0.0077, -0.5894,
        -0.0073, -0.0082, -0.0122, -0.0029, -0.0041,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-8.3265e-02, -3.2834e-03, -6.8042e-03, -3.9790e-03, -3.3176e-03,
        -2.1565e-02, -3.8383e-03, -4.1952e-03, -8.9832e-03, -1.0700e-02,
        -4.2100e-04, -2.9149e-03, -7.6474e-01, -9.3599e-03, -3.9723e-02,
        -1.2165e-02, -7.5606e-03, -8.1669e-03, -5.0224e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #4750: [tensor([-0.0924, -0.0273, -0.0089, -0.0096, -0.0217, -0.0012, -0.0061, -0.0142,
        -0.0113, -0.5860, -0.0024, -0.0146, -0.0016, -0.0052, -0.0390, -0.0102,
        -0.0226, -0.0202, -0.0779, -0.0068, -0.0106, -0.0030, -0.0070,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1249, -0.0349, -0.0083, -0.0112, -0.0292, -0.0054, -0.0075, -0.0152,
        -0.0109, -0.5940, -0.0041, -0.0152, -0.0026, -0.0022, -0.0529, -0.0146,
        -0.0167, -0.0212, -0.0140, -0.0050, -0.0102,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1386, -0.0172, -0.0029, -0.0051, -0.0100, -0.0015, -0.0019, -0.0106,
        -0.0063, -0.0635, -0.0025, -0.0047, -0.0014, -0.0018, -0.0220, -0.0077,
        -0.0063, -0.1021, -0.0053, -0.0067, -0.0154, -0.0070, -0.5495, -0.0039,
        -0.0020, -0.0040,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0368, -0.0239, -0.0052, -0.0078, -0.0214, -0.0024, -0.0057, -0.0128,
        -0.0075, -0.3269, -0.0030, -0.0080, -0.0006, -0.0026, -0.0365, -0.0079,
        -0.0109, -0.4292, -0.0086, -0.0085, -0.0172, -0.0070, -0.0029, -0.0068,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([ 0.0031, -0.0482, -0.0057, -0.0171, -0.0186, -0.0026, -0.0048, -0.0249,
        -0.0124, -0.7855, -0.0056, -0.0129, -0.0017, -0.0044, -0.0047, -0.0148,
        -0.0132, -0.0108, -0.0091,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0665, -0.0368, -0.0059, -0.0095, -0.0149, -0.0032, -0.0049, -0.0164,
        -0.0071, -0.6905, -0.0033, -0.0088, -0.0009, -0.0025, -0.0408, -0.0069,
        -0.0285, -0.0079, -0.0204, -0.0112, -0.0013, -0.0036, -0.0080,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0187, -0.0195, -0.0027, -0.0062, -0.0133, -0.0014, -0.0045, -0.0115,
        -0.0059, -0.5263, -0.0028, -0.0056, -0.0012, -0.0024, -0.0219, -0.0071,
        -0.0115, -0.0098, -0.0068, -0.0082, -0.0012, -0.0036, -0.1057, -0.0036,
        -0.1853, -0.0082, -0.0009, -0.0043], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0761, -0.0326, -0.0027, -0.0084, -0.0204, -0.0023, -0.0065, -0.0143,
        -0.0088, -0.1544, -0.0039, -0.0087, -0.0009, -0.0029, -0.0375, -0.0116,
        -0.0166, -0.0132, -0.0114, -0.0171, -0.0073, -0.0111, -0.5234, -0.0046,
        -0.0033,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.4813e-02, -5.3309e-02, -7.7940e-03, -1.3709e-02, -2.6670e-02,
        -3.3921e-03, -5.8936e-03, -1.4659e-02, -1.2788e-02, -6.7681e-01,
        -1.4549e-03, -1.0161e-02, -4.3056e-04, -3.7092e-03, -4.8117e-02,
        -1.2325e-02, -2.5240e-02, -7.5907e-03, -1.6280e-02, -1.6142e-02,
        -3.9769e-03, -4.7336e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0332, -0.0439, -0.0042, -0.0063, -0.0163, -0.0036, -0.0039, -0.0132,
        -0.0090, -0.6439, -0.0023, -0.0115, -0.0009, -0.0037, -0.0468, -0.0104,
        -0.0154, -0.0241, -0.0771, -0.0089, -0.0119, -0.0016, -0.0080,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0529, -0.0487, -0.0080, -0.0093, -0.0268, -0.0035, -0.0048, -0.0152,
        -0.0119, -0.6236, -0.0029, -0.0130, -0.0026, -0.0020, -0.0669, -0.0087,
        -0.0185, -0.0169, -0.0084, -0.0130, -0.0246, -0.0110, -0.0021, -0.0027,
        -0.0020,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.3701e-02, -2.5185e-02, -3.7232e-03, -6.3824e-03, -1.4965e-02,
        -1.5632e-03, -4.5430e-03, -1.0074e-02, -6.9088e-03, -3.9449e-01,
        -1.2318e-03, -8.7448e-03, -3.3910e-04, -3.3422e-03, -7.5779e-03,
        -7.6145e-03, -9.4235e-03, -1.8685e-01, -9.7370e-03, -6.9266e-03,
        -2.0196e-01, -6.2294e-03, -2.4691e-02, -3.7919e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #4800: [tensor([-0.1552, -0.1356, -0.0150, -0.0041, -0.0095, -0.0089, -0.0422, -0.0167,
        -0.0761, -0.0147, -0.0027, -0.0047, -0.0281, -0.0086, -0.0096, -0.0111,
        -0.4363, -0.0100, -0.0108,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.2275e-01, -6.3674e-03, -6.8637e-03, -9.7606e-03, -3.4840e-02,
        -5.4544e-04, -6.8393e-03, -2.6403e-03, -3.9235e-03, -6.6859e-02,
        -1.2505e-02, -1.2909e-01, -2.4348e-01, -8.7704e-03, -4.0698e-03,
         9.8094e-05, -4.4058e-03, -1.8174e-02, -1.0064e-01, -1.6593e-02,
        -8.5795e-03, -1.3534e-01, -3.0992e-02, -8.8307e-03, -7.7896e-03,
        -9.2533e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0858, -0.0100, -0.0077, -0.0053, -0.0233, -0.0012, -0.0030, -0.0032,
        -0.0055, -0.0875, -0.0082, -0.2168, -0.1365, -0.0072, -0.0012, -0.0016,
        -0.0043, -0.0163, -0.0077, -0.0099, -0.1379, -0.0058, -0.0074, -0.1285,
        -0.0687, -0.0040, -0.0052,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0599, -0.0087, -0.0094, -0.0069, -0.0241, -0.0025, -0.0038, -0.0057,
        -0.0017, -0.0460, -0.0134, -0.0649, -0.1822, -0.0069, -0.0031, -0.0013,
        -0.0033, -0.2908, -0.0037, -0.0083, -0.0398, -0.0080, -0.0046, -0.0101,
        -0.0173, -0.0153, -0.1315, -0.0028, -0.0107, -0.0062, -0.0072,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.5433e-01, -4.6946e-02, -8.1729e-03, -9.2301e-02, -3.6783e-03,
        -1.0021e-02, -5.0884e-03, -9.2849e-03, -7.7613e-03, -8.3423e-03,
        -7.8671e-03, -2.5541e-05, -8.0119e-03, -1.4278e-03, -2.7186e-03,
        -1.0612e-01, -1.2730e-02, -4.7477e-01, -1.7066e-02, -1.5943e-02,
        -7.3886e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.1712e-02, -3.5682e-02, -5.9481e-03, -3.0653e-02, -3.4598e-03,
        -5.2027e-03, -2.3203e-03, -5.8803e-03, -4.3900e-03, -3.2952e-03,
        -3.7306e-03,  4.2041e-04, -5.7018e-03, -9.3301e-04, -1.5410e-03,
        -5.0850e-02, -1.0822e-02, -2.1710e-01, -7.5818e-03, -1.3162e-02,
        -3.6123e-03, -4.9974e-03, -5.0071e-01, -7.2847e-03, -3.0149e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.7299e-02, -4.4169e-02, -5.9930e-03, -5.2411e-02, -4.5548e-03,
        -9.8051e-03, -3.1630e-03, -7.0855e-03, -7.2506e-03, -6.3246e-03,
        -5.9192e-03, -2.1223e-04, -4.9010e-03, -1.2571e-03, -2.6566e-03,
        -1.1597e-01, -1.2459e-02, -5.9354e-01, -1.0431e-02, -2.3056e-02,
        -4.2648e-03, -7.2760e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-8.1792e-02, -2.6734e-03, -2.9253e-03, -2.0318e-03, -6.6351e-03,
        -4.8194e-02, -6.8102e-04, -3.0079e-03, -7.4330e-04, -1.6777e-03,
        -2.0973e-02, -2.5151e-03, -3.5974e-03, -7.3301e-02, -3.7408e-03,
        -9.9372e-04, -3.5369e-03, -3.2602e-03, -2.9248e-02, -3.1295e-04,
        -5.9627e-03, -1.7113e-03, -1.8910e-03, -1.2343e-02, -1.7932e-02,
        -1.9857e-02, -4.4714e-01, -1.6021e-03, -2.2351e-03,  2.9002e-04,
        -9.4423e-04, -3.2514e-02, -2.3742e-03, -3.1928e-03, -5.1187e-03,
        -9.8672e-02, -8.6011e-03, -5.1418e-03, -2.4438e-02, -1.8758e-03,
        -7.9983e-03, -1.6568e-03, -4.6664e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-2.0414e-02, -2.3199e-03, -3.1089e-03, -2.1713e-03, -7.4082e-03,
        -3.9657e-02, -5.0040e-05, -2.0772e-03, -1.1358e-03, -1.9566e-03,
        -2.1930e-02, -2.3100e-03, -2.6323e-03, -3.7157e-02, -2.4433e-03,
        -8.2818e-04, -3.0184e-03, -2.5517e-03, -1.4041e-02, -3.9188e-04,
        -4.1447e-03, -2.2632e-03, -2.0781e-03, -1.1633e-02, -6.3388e-03,
        -1.3152e-02, -5.8916e-01, -1.1743e-03, -1.6132e-03,  5.0222e-04,
        -1.0648e-03, -2.1165e-02, -3.5106e-03, -2.1446e-03, -3.9232e-03,
        -9.7241e-02, -1.4474e-03, -4.6013e-03, -5.3352e-02, -5.2263e-03,
        -2.0597e-03, -1.1422e-03, -3.4573e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.6363e-02, -2.6705e-03, -1.4742e-03, -3.1473e-03, -1.2212e-02,
        -2.9553e-02, -2.6941e-04, -3.2477e-03, -1.8700e-03, -2.7155e-03,
        -2.4686e-02, -2.4897e-03, -4.3861e-03, -7.1638e-02, -4.1354e-03,
        -1.1207e-04, -3.3655e-03, -2.7726e-03, -2.9450e-02, -2.2114e-04,
        -7.0196e-03, -2.4252e-03, -1.1522e-03, -1.1347e-02, -2.0588e-02,
        -2.5409e-02, -4.1453e-01, -1.6999e-03, -2.6032e-03, -6.2677e-04,
        -7.0098e-04, -5.4234e-02, -2.2643e-03, -2.7336e-03, -6.4777e-03,
        -1.6985e-01, -1.0990e-02, -4.8370e-03, -1.2509e-03, -2.4803e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0141, -0.0037, -0.0041, -0.0061, -0.0035, -0.0033, -0.0035, -0.0032,
        -0.0273, -0.0141, -0.0010, -0.0024, -0.0064, -0.0046, -0.0047, -0.0608,
        -0.0093, -0.0184, -0.7686, -0.0080, -0.0073, -0.0145, -0.0034, -0.0027,
        -0.0050,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0576, -0.0048, -0.0033, -0.0031, -0.0031, -0.0036, -0.0035, -0.0017,
        -0.0149, -0.0061,  0.0014, -0.0024, -0.0324, -0.0084, -0.0269, -0.0084,
        -0.0079, -0.7980, -0.0070, -0.0022, -0.0034,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4850: [tensor([-7.5534e-02, -1.4720e-01, -3.6504e-03, -1.0745e-02, -5.6161e-02,
        -4.2639e-03, -5.2672e-03, -3.3943e-03, -4.3752e-03, -5.2050e-03,
        -4.9445e-04, -4.0148e-03, -5.6568e-01, -1.1276e-02, -6.7022e-02,
        -1.0010e-02, -1.0195e-02, -8.6886e-03, -6.8200e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1915, -0.1283, -0.0106, -0.0251, -0.0093, -0.0197, -0.0229, -0.0124,
        -0.0170, -0.0297, -0.0126, -0.0252, -0.0850, -0.0533, -0.0034, -0.0086,
        -0.1558, -0.0227, -0.0244, -0.0178, -0.0174, -0.0431, -0.0422, -0.0221],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1831, -0.1228, -0.0101, -0.0115, -0.0080, -0.0197, -0.0314, -0.0109,
        -0.0249, -0.0332, -0.0115, -0.0237, -0.1410, -0.0475, -0.0038, -0.0089,
        -0.1769, -0.0232, -0.0426, -0.0199, -0.0262, -0.0192,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0051, -0.1203, -0.0091, -0.0161, -0.0040, -0.0151, -0.0280, -0.0084,
        -0.0265, -0.0200, -0.0144, -0.0150, -0.1407, -0.0545, -0.0047, -0.0141,
        -0.1968, -0.1008, -0.0659, -0.0594, -0.0465, -0.0217, -0.0130,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1378, -0.3909, -0.0088, -0.0246, -0.0056, -0.0050, -0.0064, -0.0047,
        -0.2509, -0.0116, -0.0131, -0.0175, -0.0149, -0.0428, -0.0107, -0.0102,
        -0.0099, -0.0242, -0.0105,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1091, -0.3843, -0.0055, -0.0203, -0.0065, -0.0063, -0.0075, -0.0060,
        -0.2976, -0.0388, -0.0066, -0.0187, -0.0245, -0.0254, -0.0099, -0.0092,
        -0.0109, -0.0129,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1254, -0.2001, -0.0043, -0.0206, -0.0047, -0.0037, -0.0041, -0.0061,
        -0.0653, -0.0115, -0.0064, -0.0119, -0.0077, -0.0246, -0.0067, -0.4715,
        -0.0112, -0.0074, -0.0067,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2165, -0.1278, -0.0060, -0.0223, -0.0057, -0.0240, -0.0058, -0.0079,
        -0.0962, -0.0049, -0.0016, -0.0042, -0.0142, -0.0758, -0.0071, -0.1964,
        -0.0129, -0.0537, -0.1007, -0.0034, -0.0053, -0.0075,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0416, -0.3332, -0.0096, -0.0280, -0.0057, -0.0317, -0.0075, -0.0168,
        -0.0864, -0.0048, -0.0010, -0.0065, -0.0216, -0.3348, -0.0073, -0.0337,
        -0.0091, -0.0205,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0900, -0.3360, -0.0129, -0.0326, -0.0095, -0.0279, -0.0081, -0.0085,
        -0.1415, -0.0093, -0.0032, -0.0123, -0.0224, -0.2444, -0.0151, -0.0136,
        -0.0126,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1512, -0.1572, -0.0039, -0.0559, -0.0936, -0.0044, -0.0011, -0.0027,
        -0.0029, -0.0083, -0.0048, -0.0011, -0.0038, -0.0090, -0.0110, -0.4644,
        -0.0117, -0.0052, -0.0079,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1513, -0.2992, -0.0072, -0.1711, -0.2064, -0.0095, -0.0022, -0.0077,
        -0.0057, -0.0062, -0.0142, -0.0098, -0.0104, -0.0190, -0.0146, -0.0195,
        -0.0196, -0.0264,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4900: [tensor([-0.0081, -0.1378, -0.0049, -0.0089, -0.0051, -0.0023, -0.0007, -0.0013,
        -0.0214, -0.0016, -0.0154, -0.1958, -0.0008, -0.0017, -0.0023, -0.0040,
        -0.0013, -0.0046, -0.0054,  0.0009, -0.0014, -0.4394, -0.0046, -0.1152,
        -0.0063, -0.0046, -0.0042,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0458, -0.0584, -0.0038, -0.0058, -0.0026, -0.0014, -0.0009, -0.0012,
        -0.0135, -0.0016, -0.0079, -0.2228, -0.0013, -0.0024, -0.0033, -0.0044,
        -0.0016, -0.0030, -0.0036,  0.0014, -0.0010, -0.3527, -0.0023, -0.0389,
        -0.0014, -0.0060, -0.1964, -0.0087, -0.0028, -0.0033,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-2.8257e-02, -1.3737e-01, -4.0530e-03, -8.1894e-03, -3.8676e-03,
        -2.7981e-03, -9.3653e-04, -2.9842e-04, -1.7141e-02, -2.1279e-03,
        -1.4818e-02, -3.5847e-01, -1.5719e-03, -4.6000e-03, -4.1638e-03,
        -3.5100e-03, -2.2398e-03, -2.8447e-03, -5.6175e-03,  6.9012e-04,
        -2.4667e-03, -3.0411e-01, -3.9663e-03, -5.3387e-02, -3.5876e-03,
        -1.3238e-02, -2.4839e-03, -4.0235e-03, -5.1334e-03, -4.0390e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1228, -0.3097, -0.0050, -0.0114, -0.0097, -0.0109, -0.0171, -0.0061,
         0.0003, -0.0071, -0.3311, -0.0143, -0.0129, -0.0248, -0.0946, -0.0116,
        -0.0104,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0783, -0.3124, -0.0033, -0.0079, -0.0086, -0.0160, -0.0167, -0.0063,
        -0.0035, -0.0056, -0.0061, -0.0105, -0.0183, -0.3983, -0.0153, -0.0622,
        -0.0131, -0.0176,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-8.3731e-02, -1.4610e-01, -2.6319e-03, -4.3701e-03, -2.8054e-03,
        -8.3345e-03, -1.2018e-02, -2.5618e-03, -2.2436e-04, -4.6167e-03,
        -1.6748e-01, -1.1892e-02, -8.4901e-03, -1.0289e-01, -5.6469e-02,
        -1.1865e-02, -1.8575e-02, -3.4085e-01, -8.4648e-03, -5.6225e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.0738e-02, -2.2566e-02, -2.7507e-03, -1.8727e-03, -6.6592e-03,
        -3.2452e-02, -1.2222e-03, -2.8729e-03, -7.9620e-03,  6.4463e-05,
        -5.6236e-04, -2.8021e-03, -1.7129e-03, -4.8120e-02, -1.2856e-03,
        -4.4035e-03, -1.4454e-03, -2.1284e-03, -3.0085e-03, -3.2213e-03,
        -1.7919e-03, -2.0799e-04, -6.4815e-01, -3.4466e-03,  1.3866e-03,
        -1.3492e-03, -7.2132e-02, -2.4119e-03, -9.3234e-02, -3.9100e-03,
        -2.9587e-03, -3.3906e-03, -4.6699e-03, -7.8726e-04, -2.3250e-03],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0465, -0.0414, -0.0039, -0.0029, -0.0095, -0.0378, -0.0016, -0.0039,
        -0.0087, -0.0009, -0.0012, -0.0024, -0.0022, -0.0730, -0.0015, -0.0069,
        -0.0022, -0.0024, -0.0049, -0.0040, -0.0019, -0.0016, -0.5370, -0.0051,
         0.0006, -0.0011, -0.1060, -0.0026, -0.0648, -0.0063, -0.0030, -0.0062,
        -0.0029, -0.0033,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.9107e-02, -2.3024e-02, -2.5746e-03, -1.2445e-03, -7.7795e-03,
        -1.5091e-02, -1.0453e-03, -2.8695e-03, -8.1215e-03, -2.2436e-04,
        -1.1692e-03, -2.7996e-03, -2.3876e-03, -2.9029e-02, -1.3106e-03,
        -4.7803e-03, -7.4692e-04, -2.3376e-03, -4.2198e-03, -3.1125e-03,
        -1.4973e-03, -5.2160e-04, -3.4183e-01, -3.7101e-03,  1.0923e-03,
        -1.4916e-03, -4.1782e-01, -2.6593e-03, -2.0551e-02, -4.5916e-03,
        -1.4446e-02, -1.1865e-02, -2.1338e-03, -6.9052e-04, -2.1217e-03],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1277, -0.2474, -0.0032, -0.0252, -0.0066, -0.0128, -0.0393, -0.0153,
        -0.0133, -0.0113, -0.0735, -0.0413, -0.0052, -0.0093, -0.2372, -0.0143,
        -0.0251, -0.0278, -0.0090, -0.0276, -0.0181, -0.0096,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.5443e-01, -1.0772e-01, -1.9909e-04, -1.3475e-02, -3.5805e-03,
        -9.4575e-03, -2.1876e-02, -9.6255e-03, -7.0299e-03, -7.7814e-03,
        -4.3082e-02, -1.2721e-02, -2.1056e-03, -3.7972e-03, -4.9063e-01,
        -8.1537e-03, -1.5537e-02, -1.0347e-02, -3.8582e-02, -1.0803e-02,
        -2.3644e-02, -1.6925e-03, -3.7332e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.8874e-01, -2.0692e-01, -1.8603e-04, -1.3638e-02, -4.0177e-03,
        -1.2416e-02, -4.8497e-02, -1.1982e-02, -8.6607e-03, -8.3761e-03,
        -8.8232e-02, -2.6683e-02, -2.3890e-03, -6.7435e-03, -2.6200e-01,
        -1.0396e-02, -2.0419e-02, -1.4473e-02, -1.0015e-02, -4.0674e-02,
        -7.5653e-03, -6.9772e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #4950: [tensor([-0.0917, -0.0781, -0.0124, -0.0061, -0.0850, -0.0055, -0.0100, -0.0040,
        -0.0024, -0.0040, -0.1271, -0.0230, -0.0112, -0.1537, -0.0092, -0.0097,
        -0.0548, -0.0111, -0.2866, -0.0077, -0.0066,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0676, -0.0204, -0.0009, -0.0123, -0.0740, -0.0095, -0.0088, -0.0048,
        -0.0735, -0.0007, -0.0039, -0.0115, -0.0088, -0.0104, -0.0024, -0.0866,
        -0.0122, -0.5550, -0.0090, -0.0145, -0.0038, -0.0096,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0564, -0.0126, -0.0036, -0.0079, -0.1158, -0.0067, -0.0133, -0.0073,
        -0.0845, -0.0029, -0.0059, -0.0218, -0.0088, -0.0193, -0.0034, -0.1048,
        -0.0148, -0.4895, -0.0098, -0.0109,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0584, -0.0176, -0.0032, -0.0080, -0.0590, -0.0073, -0.0066, -0.0046,
        -0.0510, -0.0031, -0.0030, -0.0059, -0.0068, -0.0077, -0.0023, -0.0621,
        -0.0102, -0.6649, -0.0086, -0.0037, -0.0060,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.2395e-02, -3.1281e-02, -1.4806e-03, -4.4301e-03, -1.3933e-03,
        -3.2322e-02, -2.3200e-03, -2.9329e-03, -1.3516e-03, -1.7191e-02,
        -1.9409e-03, -2.4716e-03, -2.2361e-03, -2.1135e-02, -1.5128e-03,
        -4.8481e-03, -1.9341e-02, -2.7789e-03, -2.7058e-03, -3.5292e-04,
         5.7245e-05, -8.9959e-04, -3.6673e-03, -2.4518e-03, -4.0036e-03,
        -3.1560e-04,  7.5043e-04, -6.5444e-04, -7.2548e-01, -3.3075e-03,
        -4.1654e-02, -4.5823e-03, -2.7885e-03, -5.5084e-04, -4.2565e-03,
        -3.4839e-03, -1.6461e-03, -3.0275e-03,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.3378e-02, -4.7438e-02, -1.7633e-03, -5.0419e-03, -2.5140e-03,
        -1.6987e-02, -1.4174e-03, -2.6112e-03, -1.2523e-03, -2.2676e-02,
        -2.6233e-03, -3.5152e-03, -2.9962e-03, -2.3405e-02, -1.1414e-03,
        -6.3916e-03, -2.0159e-02, -2.1123e-03, -3.1199e-03, -2.4290e-04,
         4.0885e-04, -8.7073e-04, -1.6953e-03, -2.0100e-03, -3.7644e-03,
         3.7273e-04,  1.0373e-03, -7.2309e-04, -3.9308e-01, -2.8471e-03,
        -2.4898e-02, -3.1311e-03, -4.6082e-03, -3.3914e-01, -4.7090e-03,
        -2.8753e-03, -3.0431e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-7.5339e-02, -2.6974e-02, -1.2580e-03, -3.6039e-03, -1.4355e-03,
        -1.7486e-02, -1.8910e-03, -4.3157e-03, -1.1502e-03, -1.3513e-02,
        -1.7364e-03, -3.5198e-03, -2.9380e-03, -1.3396e-02, -1.1791e-03,
        -7.3356e-03, -9.4705e-03, -2.3841e-03, -3.2372e-03, -3.7260e-05,
         3.5471e-04, -2.3175e-04, -2.1328e-03, -1.5573e-03, -4.0849e-03,
         3.2369e-04,  7.6352e-04, -8.9465e-04, -5.7476e-01, -3.6104e-03,
        -2.3524e-02, -4.2772e-03, -5.0843e-03, -1.7711e-01, -3.9097e-03,
        -2.3502e-03, -2.8288e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.2520e-01, -1.7409e-01, -6.9929e-03, -3.7332e-03, -1.9753e-03,
        -1.0205e-01, -1.1683e-03, -2.2206e-03, -3.8125e-03, -2.3168e-03,
        -2.4057e-02, -5.6135e-03, -4.7794e-03, -3.4699e-03, -5.4831e-03,
        -5.2322e-03, -2.1207e-02, -1.1684e-02, -2.4753e-01, -3.7098e-03,
        -3.8978e-03, -2.1468e-03, -9.5748e-03, -1.4382e-01, -1.7565e-02,
        -2.1695e-04, -3.9536e-03, -1.6777e-03, -5.9789e-03, -1.6749e-02,
        -1.0829e-02, -8.4011e-03, -8.3195e-03, -3.6632e-03, -6.8771e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0169, -0.1091, -0.0043, -0.0032, -0.0027, -0.0831, -0.0016, -0.0025,
        -0.0025, -0.0028, -0.0194, -0.0058, -0.0055, -0.0037, -0.0029, -0.0059,
        -0.0206, -0.0072, -0.0493, -0.0027, -0.0015, -0.0023, -0.0100, -0.1584,
        -0.0125, -0.0014, -0.0030, -0.0027, -0.3214, -0.0030, -0.0104, -0.0616,
        -0.0121, -0.0121, -0.0061, -0.0060, -0.0123, -0.0052, -0.0063,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1651, -0.2217, -0.0043, -0.0036, -0.0020, -0.1054, -0.0025, -0.0016,
        -0.0031, -0.0033, -0.0177, -0.0056, -0.0054, -0.0029, -0.0046, -0.0064,
        -0.0295, -0.0062, -0.1111, -0.0019, -0.0008, -0.0029, -0.0067, -0.1107,
        -0.0133, -0.0029, -0.0046, -0.0015, -0.0074, -0.1086, -0.0062, -0.0061,
        -0.0100, -0.0034, -0.0051, -0.0059,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.6017e-01, -6.7858e-02, -5.1071e-03, -2.3663e-03, -2.9124e-03,
        -5.5103e-02, -1.4823e-03, -9.8182e-04, -2.5716e-03, -1.5374e-03,
        -1.7371e-02, -1.9620e-03, -2.2568e-03, -2.3937e-03, -2.9735e-03,
        -6.3924e-03, -1.5347e-02, -7.3826e-03, -7.6136e-02, -1.3456e-03,
        -1.0498e-03, -3.2334e-03, -3.0711e-03, -1.7831e-01, -8.0582e-03,
         1.0675e-04, -6.5325e-04, -1.8010e-03, -6.7689e-03, -1.4238e-02,
        -1.1949e-02, -1.0820e-02, -1.0732e-02, -3.6112e-03, -1.3012e-02,
        -2.8176e-03, -2.3573e-01, -5.2608e-02, -3.6658e-03, -4.1105e-03],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0588, -0.0734, -0.0078, -0.0033, -0.0032, -0.0336, -0.0023, -0.0008,
        -0.0025, -0.0027, -0.0196, -0.0030, -0.0055, -0.0046, -0.0042, -0.0068,
        -0.0100, -0.0061, -0.0500, -0.0011, -0.0014, -0.0025, -0.0036, -0.0706,
        -0.0135, -0.0012, -0.0006, -0.0019, -0.4997, -0.0036, -0.0290, -0.0072,
        -0.0056, -0.0192, -0.0310, -0.0052, -0.0049,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #5000: [tensor([-0.1627, -0.0061, -0.0200, -0.0444, -0.0073, -0.0179, -0.0265, -0.0147,
        -0.0200, -0.0087, -0.0102, -0.0450, -0.0075, -0.1969, -0.0139, -0.0084,
        -0.0225, -0.0020, -0.0192, -0.0184, -0.1114, -0.0342, -0.0101, -0.0117,
        -0.0078, -0.0215, -0.0246, -0.0436, -0.0167, -0.0126, -0.0144, -0.0190,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0605, -0.0033, -0.0161, -0.0277, -0.0019, -0.0120, -0.0219, -0.0234,
        -0.0101, -0.0072, -0.0091, -0.0240, -0.0107, -0.1905, -0.0062, -0.0058,
        -0.0202, -0.0053, -0.0138, -0.0061, -0.0965, -0.0179, -0.0027, -0.0069,
        -0.0036, -0.0186, -0.1450, -0.0111, -0.0291, -0.1065, -0.0219, -0.0368,
        -0.0078, -0.0095, -0.0102,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1190, -0.0034, -0.0087, -0.0196, -0.0036, -0.0070, -0.0216, -0.0089,
        -0.0071, -0.0052, -0.0030, -0.0110, -0.0060, -0.1011, -0.0036, -0.0040,
        -0.0130, -0.0059, -0.0088, -0.0049, -0.0483, -0.0125, -0.0021, -0.0030,
        -0.0017, -0.0138, -0.0475, -0.0056, -0.0379, -0.1759, -0.0078, -0.1801,
        -0.0093, -0.0586, -0.0148, -0.0078, -0.0077,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0402, -0.0025, -0.0027, -0.0079, -0.0022, -0.0023, -0.0072, -0.0029,
        -0.0027, -0.0016, -0.0014, -0.0020, -0.0019, -0.0147, -0.0023, -0.0017,
        -0.0049, -0.0014, -0.0042, -0.0027, -0.0126, -0.0024,  0.0014, -0.0019,
        -0.7103, -0.0052, -0.0166, -0.0035, -0.0068, -0.0064, -0.1144, -0.0050,
        -0.0040,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-1.6903e-01, -2.9259e-03, -1.3465e-03, -8.0355e-03, -1.7364e-03,
        -2.1410e-03, -7.7899e-03, -2.6725e-03, -3.5297e-03, -2.3683e-03,
        -1.6549e-03, -3.8499e-03, -1.4895e-03, -1.5976e-02, -2.2972e-03,
        -2.2084e-03, -5.1010e-03, -9.8981e-04, -5.3775e-03, -1.8443e-03,
        -1.4427e-02, -3.7528e-03,  4.7179e-04, -1.2654e-03, -1.1643e-02,
        -3.0390e-02, -6.4245e-01, -1.2645e-03, -6.3905e-03, -4.6397e-03,
        -2.5105e-02, -5.3615e-03, -7.2262e-03, -1.3797e-03, -1.8666e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0488, -0.0022, -0.0025, -0.0078, -0.0016, -0.0025, -0.0071, -0.0033,
        -0.0032, -0.0021, -0.0015, -0.0015, -0.0019, -0.0161, -0.0023, -0.0020,
        -0.0050, -0.0013, -0.0036, -0.0025, -0.0177, -0.0031,  0.0014, -0.0011,
        -0.7537, -0.0041, -0.0196, -0.0046, -0.0617, -0.0031, -0.0054, -0.0019,
        -0.0039,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1709, -0.0024, -0.0064, -0.0199, -0.0017, -0.0090, -0.0178, -0.0057,
        -0.0090, -0.0036, -0.0026, -0.0091, -0.0038, -0.0584, -0.0049, -0.0031,
        -0.0090, -0.0032, -0.0057, -0.0045, -0.0517, -0.0076, -0.0045, -0.0037,
        -0.0027, -0.0148, -0.0667, -0.0050, -0.0331, -0.0887, -0.0096, -0.0122,
        -0.0062, -0.0059, -0.2984, -0.0037, -0.0099, -0.0120, -0.0066, -0.0064],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2592, -0.0063, -0.0111, -0.0431, -0.0037, -0.0110, -0.0257, -0.0187,
        -0.0106, -0.0069, -0.0081, -0.0253, -0.0056, -0.1953, -0.0100, -0.0070,
        -0.0207, -0.0045, -0.0102, -0.0132, -0.0931, -0.0263, -0.0131, -0.0040,
        -0.0045, -0.0096, -0.0230, -0.0120, -0.0359, -0.0138, -0.0162, -0.0252,
        -0.0177, -0.0094,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-6.8169e-02, -1.6559e-03, -2.4782e-03, -7.4415e-03, -1.9712e-03,
        -2.8643e-03, -7.3207e-03, -3.9015e-03, -3.3982e-03, -1.3073e-03,
        -1.6215e-03, -3.1389e-03, -1.2378e-03, -1.4231e-02, -2.0912e-03,
        -1.4716e-03, -5.0480e-03, -1.5586e-03, -3.8537e-03, -2.3237e-03,
        -1.5455e-02, -3.0024e-03, -2.3080e-04, -9.1736e-04, -6.5745e-01,
        -3.1273e-03, -4.7704e-03, -3.9550e-03, -8.0625e-03, -5.4492e-03,
        -4.3315e-03, -5.5476e-03, -8.4350e-03, -1.3197e-01, -5.6144e-03,
        -4.6023e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1958, -0.0045, -0.0086, -0.0314, -0.0042, -0.0073, -0.0223, -0.0159,
        -0.0105, -0.0073, -0.0039, -0.0080, -0.0053, -0.1030, -0.0071, -0.0052,
        -0.0167, -0.0056, -0.0109, -0.0073, -0.0562, -0.0100, -0.0035, -0.0052,
        -0.0111, -0.1282, -0.2386, -0.0120, -0.0107, -0.0240, -0.0110, -0.0086,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0974, -0.0016, -0.0048, -0.0108, -0.0025, -0.0046, -0.0096, -0.0062,
        -0.0053, -0.0031, -0.0022, -0.0046, -0.0024, -0.0314, -0.0022, -0.0009,
        -0.0075, -0.0027, -0.0047, -0.0031, -0.0236, -0.0037,  0.0007, -0.0017,
        -0.6293, -0.0078, -0.0057, -0.0097, -0.0110, -0.0103, -0.0071, -0.0717,
        -0.0022, -0.0033, -0.0048,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-9.8391e-02, -6.6949e-03, -1.9766e-02, -3.6513e-02, -7.8603e-03,
        -1.5528e-02, -3.0535e-02, -1.4538e-02, -1.0488e-02, -6.2233e-03,
        -7.8674e-03, -2.5599e-02, -8.7045e-03, -1.2929e-01, -9.4949e-03,
        -6.5095e-03, -2.4446e-02, -2.6064e-04, -1.9852e-02, -7.9950e-03,
        -1.3257e-01, -2.8477e-02, -4.2470e-03, -2.6613e-03, -7.1874e-03,
        -3.1131e-02, -2.8178e-01, -1.2868e-02, -1.2523e-02,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #5050: [tensor([ 0.0035, -0.0057, -0.0085, -0.0097, -0.0092, -0.0073, -0.0097, -0.2288,
        -0.0089, -0.0008, -0.0775, -0.0152, -0.0102, -0.0020, -0.0044, -0.1140,
        -0.0080, -0.0209, -0.0894, -0.1438, -0.0096, -0.1460, -0.0036, -0.0257,
        -0.0016, -0.0083, -0.0127, -0.0075, -0.0077], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-1.5989e-02, -2.5374e-02, -1.4406e-03, -3.1616e-03, -2.5719e-03,
        -1.4872e-04, -2.0472e-03, -3.0469e-03, -1.9867e-03, -1.6924e-03,
        -3.5013e-03, -7.0357e-01, -3.1927e-03, -4.9944e-04, -9.3231e-04,
        -9.6423e-02, -4.2237e-03, -6.2883e-03, -4.1371e-02, -4.3004e-03,
        -3.2140e-02, -6.2369e-03, -7.3811e-03, -4.8640e-03, -9.4940e-03,
        -4.0818e-03, -9.0615e-03, -1.5465e-03, -3.4358e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0710, -0.0568, -0.0038, -0.0057, -0.0065, -0.0032, -0.0046, -0.0054,
        -0.0038, -0.0039, -0.0071, -0.3084, -0.0068, -0.0026, -0.0022, -0.0585,
        -0.0117, -0.2018, -0.2184, -0.0069, -0.0038, -0.0072,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.0279e-02, -5.5489e-02, -2.8526e-03, -4.6877e-03, -4.5957e-03,
        -2.0520e-03, -3.0710e-03, -4.8526e-03, -2.7376e-03, -2.7174e-03,
        -3.7672e-03, -2.8687e-01, -3.7640e-03, -2.2223e-04, -1.3048e-03,
        -2.7674e-01, -6.9522e-03, -2.6159e-01, -6.5347e-03, -3.4009e-03,
        -5.3816e-03, -5.1325e-03, -2.0064e-03, -3.0004e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0569, -0.0714, -0.0038, -0.0043, -0.0065, -0.0029, -0.0036, -0.0059,
        -0.0046, -0.0030, -0.0070, -0.3302, -0.0065, -0.0008, -0.0021, -0.4524,
        -0.0080, -0.0148, -0.0058, -0.0042, -0.0052,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0065, -0.0519, -0.0034, -0.0031, -0.0046, -0.0016, -0.0032, -0.0036,
        -0.0033, -0.0031, -0.0033, -0.1937, -0.0045,  0.0005, -0.0009, -0.1713,
        -0.0066, -0.0090, -0.4449, -0.0070, -0.0460, -0.0112, -0.0113, -0.0018,
        -0.0038,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.1841e-02, -4.4816e-02, -2.2970e-03, -3.7124e-03, -4.1704e-03,
        -1.7932e-03, -2.4420e-03, -4.1052e-03, -2.6477e-03, -1.9281e-03,
        -2.8758e-03, -8.0759e-02, -3.5978e-03, -3.7267e-04, -9.4919e-04,
        -3.1191e-02, -4.3261e-03, -4.4814e-03, -1.7222e-02, -5.9816e-03,
        -3.1502e-03, -5.6999e-03, -3.2891e-03, -4.9395e-03, -6.7947e-01,
        -4.9790e-03, -2.7730e-03, -4.1927e-03,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0521, -0.1003, -0.0036, -0.0048, -0.0038, -0.0030, -0.0038, -0.0049,
        -0.0035, -0.0025, -0.0061, -0.1271, -0.0053, -0.0012, -0.0022, -0.0836,
        -0.0066, -0.0095, -0.0927, -0.0055, -0.0080, -0.4371, -0.0012, -0.0110,
        -0.0158, -0.0030, -0.0018,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0715, -0.0542, -0.0030, -0.0039, -0.0047, -0.0024, -0.0034, -0.0043,
        -0.0035, -0.0027, -0.0045, -0.3446, -0.0053, -0.0013, -0.0008, -0.3109,
        -0.0064, -0.1153, -0.0065, -0.0044, -0.0035, -0.0034, -0.0063, -0.0069,
        -0.0077, -0.0029, -0.0077, -0.0022, -0.0060], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0424, -0.0854, -0.0040, -0.0041, -0.0050, -0.0015, -0.0022, -0.0042,
        -0.0040, -0.0026, -0.0043, -0.4888, -0.0045, -0.0007, -0.0017, -0.3245,
        -0.0081, -0.0040, -0.0032, -0.0046,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.3740e-02, -3.4511e-02, -3.0471e-03, -3.5411e-03, -4.5261e-03,
        -4.3156e-04, -2.1205e-03, -3.8867e-03, -3.4722e-03, -2.1364e-03,
        -2.7364e-03, -1.4895e-01, -3.8068e-03, -1.2272e-04, -5.1100e-04,
        -4.1624e-01, -6.5617e-03, -7.6884e-03, -9.3529e-02, -3.3332e-03,
        -6.1794e-03, -1.9042e-01, -5.1120e-03, -2.2243e-03, -1.1686e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0081, -0.0864, -0.0022, -0.0026, -0.0039, -0.0009, -0.0030, -0.0040,
        -0.0026, -0.0020, -0.0023, -0.4015, -0.0035, -0.0015, -0.0008, -0.1398,
        -0.0069, -0.0962, -0.0073, -0.0023, -0.0053, -0.2063, -0.0044, -0.0031,
        -0.0028,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #5100: [tensor([-5.3267e-02, -2.8033e-02, -1.7697e-03, -1.4910e-02, -4.2275e-03,
        -3.9074e-03, -4.9220e-03, -3.9222e-03, -1.3243e-03, -5.1286e-04,
        -9.5250e-04, -8.0787e-01, -6.8731e-03, -3.1754e-02, -1.1738e-02,
        -7.6545e-03, -7.6554e-03, -3.4356e-03, -5.2722e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0268, -0.1836, -0.0072, -0.0640, -0.0041, -0.0056, -0.0046, -0.0060,
        -0.0012, -0.0039, -0.0029, -0.3861, -0.0113, -0.2301, -0.0093, -0.0124,
        -0.0057, -0.0162, -0.0059, -0.0129,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0703, -0.2710, -0.0114, -0.2209, -0.0095, -0.0119, -0.0044, -0.0161,
        -0.0100, -0.0130, -0.0067, -0.0270, -0.0497, -0.0122, -0.1279, -0.0422,
        -0.0332, -0.0312, -0.0136, -0.0177,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.1756e-02, -4.7772e-02, -1.2733e-03, -2.4258e-02, -3.0344e-03,
        -3.6039e-03, -3.7582e-03, -2.2565e-03, -1.1696e-03, -4.9734e-04,
        -1.4824e-03, -7.2746e-01, -4.4930e-03, -6.1024e-02, -3.9684e-03,
        -8.8165e-03, -3.2231e-03, -1.0091e-02, -8.4226e-03, -4.0181e-03,
        -2.2356e-03, -5.3887e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0812, -0.0849, -0.0028, -0.0349, -0.0035, -0.0078, -0.0035, -0.0056,
        -0.0030, -0.0006, -0.0022, -0.4670, -0.0081, -0.1632, -0.1036, -0.0053,
        -0.0074, -0.0065, -0.0033, -0.0054,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0156, -0.1654, -0.0044, -0.0426, -0.0037, -0.0059, -0.0045, -0.0045,
        -0.0010, -0.0007, -0.0028, -0.2055, -0.0090, -0.1460, -0.0074, -0.3577,
        -0.0092, -0.0077, -0.0064,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0720, -0.0253, -0.0011, -0.0159, -0.0016, -0.0043, -0.0046, -0.0036,
        -0.0020, -0.0009, -0.0015, -0.7785, -0.0074, -0.0275, -0.0041, -0.0060,
        -0.0236, -0.0114, -0.0043, -0.0044,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-3.5833e-02, -3.1014e-02, -1.8732e-03, -1.8794e-02, -2.1117e-03,
        -4.4496e-03, -3.4837e-03, -4.5621e-03, -9.9537e-04,  1.3831e-04,
        -1.8053e-03, -7.0316e-01, -5.9299e-03, -3.7100e-02, -5.1052e-03,
        -1.3105e-01, -5.9421e-03, -1.9456e-03, -4.7041e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-7.3574e-02, -7.2796e-03, -7.8279e-03, -7.5000e-03, -4.2949e-03,
        -2.5655e-03, -8.8229e-03, -2.0418e-02, -2.3916e-02, -2.0916e-04,
        -2.0574e-03, -2.1364e-01, -5.3213e-03, -3.2639e-03, -9.8221e-03,
         1.4383e-03, -2.8577e-03, -7.9113e-03, -1.8928e-03, -1.8483e-03,
         8.2142e-04, -2.6040e-03, -4.0965e-01, -1.0182e-02, -1.5980e-01,
        -7.3431e-03, -3.1389e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0541, -0.0042, -0.0073, -0.0050, -0.0037, -0.0022, -0.0129, -0.0160,
        -0.0152, -0.0004, -0.0019, -0.2000, -0.0030, -0.0028, -0.0081, -0.0007,
        -0.0039, -0.0079, -0.0021, -0.0026,  0.0008, -0.0010, -0.4044, -0.0078,
        -0.1999, -0.0054, -0.0093, -0.0095, -0.0032, -0.0047], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0425, -0.0053, -0.0082, -0.0061, -0.0046, -0.0019, -0.0102, -0.0279,
        -0.0213, -0.0006, -0.0034, -0.4592, -0.0050, -0.0044, -0.0117, -0.0012,
        -0.0028, -0.0090, -0.0044, -0.0038,  0.0007, -0.0009, -0.0168, -0.0133,
        -0.3220, -0.0071, -0.0057,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0716, -0.0246, -0.0042, -0.0064, -0.0170, -0.0011, -0.0032, -0.0037,
        -0.0033, -0.0284, -0.0018, -0.0035, -0.0040, -0.0335, -0.0038, -0.0008,
        -0.0022, -0.0543, -0.0043, -0.0020, -0.0013, -0.0042, -0.6603, -0.0031,
        -0.0087, -0.0051, -0.0060, -0.0297, -0.0042, -0.0036], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #5150: [tensor([-0.2743, -0.0124, -0.0048, -0.0153, -0.0029, -0.0054, -0.0080, -0.0086,
        -0.0045, -0.2687, -0.1846, -0.0215, -0.0108, -0.0453, -0.0251, -0.0199,
        -0.0295, -0.0432, -0.0152,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0849, -0.0051, -0.0017, -0.0053, -0.0023, -0.0016, -0.0035, -0.0040,
        -0.0036, -0.0321, -0.0386, -0.0041, -0.0024, -0.7590, -0.0071, -0.0072,
        -0.0074, -0.0059, -0.0082, -0.0038, -0.0048, -0.0033, -0.0043],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1040, -0.0230, -0.0064, -0.0216, -0.0008, -0.0124, -0.0059, -0.0111,
        -0.0097, -0.3036, -0.2157, -0.0219, -0.0084, -0.0612, -0.0488, -0.0877,
        -0.0140, -0.0235, -0.0203,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1272, -0.0227, -0.0093, -0.0236, -0.0014, -0.0114, -0.0073, -0.0082,
        -0.0077, -0.1638, -0.1028, -0.0193, -0.0117, -0.2880, -0.0117, -0.0256,
        -0.0106, -0.0539, -0.0174, -0.0512, -0.0137, -0.0113,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.3895, -0.0128, -0.0037, -0.0186, -0.0059, -0.0042, -0.0066, -0.0087,
        -0.0086, -0.1606, -0.1274, -0.0132, -0.0095, -0.0624, -0.0667, -0.0216,
        -0.0223, -0.0288, -0.0099, -0.0079, -0.0113,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1047, -0.0093, -0.0008, -0.0124, -0.0004, -0.0034, -0.0038, -0.0063,
        -0.0050, -0.0587, -0.0677, -0.0095, -0.0040, -0.1527, -0.0073, -0.0461,
        -0.0079, -0.3833, -0.0855, -0.0047, -0.0107, -0.0056, -0.0100],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-7.0942e-02, -7.3431e-03, -3.5537e-03, -6.4111e-03,  2.0524e-04,
        -2.9588e-03, -4.0164e-03, -5.2466e-03, -5.2964e-03, -3.7634e-02,
        -5.5827e-02, -7.7292e-03, -4.5503e-03, -3.1699e-02, -3.5016e-02,
        -6.0413e-01, -3.7351e-03, -1.8846e-02, -7.9969e-02, -6.2564e-03,
        -4.7980e-03, -3.8400e-03,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0857, -0.0121, -0.0057, -0.0188, -0.0014, -0.0075, -0.0076, -0.0074,
        -0.0092, -0.1741, -0.0911, -0.0229, -0.0083, -0.4191, -0.0099, -0.0753,
        -0.0186, -0.0131, -0.0123,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2461, -0.0132, -0.0013, -0.0127, -0.0016, -0.0057, -0.0063, -0.0112,
        -0.0062, -0.1805, -0.1401, -0.0122, -0.0031, -0.2133, -0.0115, -0.1048,
        -0.0083, -0.0107, -0.0112,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0420, -0.0034, -0.0029, -0.0027, -0.0013, -0.0018, -0.0038, -0.0037,
        -0.0033, -0.0187, -0.0204, -0.0045, -0.0025, -0.0434, -0.0046, -0.0155,
        -0.0054, -0.8005, -0.0061, -0.0090, -0.0028, -0.0020,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1522, -0.0174, -0.0052, -0.0231, -0.0064, -0.0057, -0.0086, -0.0062,
        -0.0058, -0.0980, -0.1429, -0.0218, -0.0109, -0.3356, -0.0142, -0.0814,
        -0.0155, -0.0256, -0.0109, -0.0127,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1194, -0.0146, -0.0056, -0.0358, -0.0028, -0.0079, -0.0100, -0.0075,
        -0.0071, -0.0948, -0.1518, -0.0169, -0.0051, -0.3953, -0.0134, -0.0487,
        -0.0264, -0.0225, -0.0145,  0.0000,  0.0000,  0.0000,  0.0000],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #5200: [tensor([-5.9100e-02, -1.2381e-01, -7.2610e-03, -8.4496e-03, -5.8689e-02,
        -1.4210e-03, -4.4684e-03, -1.1836e-01, -4.6704e-03, -1.3137e-03,
        -4.8184e-05, -3.7993e-03, -9.6719e-02, -7.6218e-03, -8.6277e-03,
        -1.1700e-02, -4.8160e-02, -3.2180e-01, -8.6155e-03, -9.0993e-03,
        -1.7792e-02, -6.7894e-02, -3.2800e-03, -3.2120e-03, -4.0860e-03,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0271, -0.0129, -0.0097, -0.0123, -0.0049, -0.0060, -0.0581, -0.0096,
        -0.0041, -0.0040, -0.0013, -0.0027, -0.0225, -0.0125, -0.0061, -0.0454,
        -0.0070, -0.0080, -0.0882, -0.0111, -0.0188, -0.6052, -0.0103, -0.0036,
        -0.0085,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-6.5277e-02, -1.5667e-02, -5.6773e-03, -1.0536e-02, -9.2137e-03,
        -4.3359e-03, -5.3569e-02, -7.1213e-03, -6.5133e-03, -6.7836e-03,
         5.4826e-04, -3.3356e-03, -6.4430e-01, -1.4158e-02, -5.4854e-02,
        -1.2330e-02, -6.7381e-03, -3.3759e-02, -8.9725e-03, -1.7823e-02,
        -1.2697e-02, -3.0425e-03, -2.7530e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0495, -0.0121, -0.0082, -0.0172, -0.0095, -0.0069, -0.0357, -0.0063,
        -0.0058, -0.0046, -0.0010, -0.0051, -0.6692, -0.0170, -0.0406, -0.0114,
        -0.0200, -0.0213, -0.0165, -0.0293, -0.0061, -0.0067,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0563, -0.0094, -0.0143, -0.0190, -0.0231, -0.0078, -0.0049, -0.0053,
        -0.0067, -0.0731, -0.0115, -0.0060, -0.0220, -0.0950, -0.0057, -0.0019,
        -0.0051, -0.4181, -0.0145, -0.0247, -0.0242, -0.0169, -0.0394, -0.0623,
        -0.0176, -0.0073, -0.0082,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-7.3571e-02, -4.8232e-03, -4.6711e-03, -5.6221e-03, -7.4090e-03,
        -2.1598e-03, -1.8794e-03, -2.4066e-03, -3.3877e-03, -1.2025e-02,
        -4.9244e-03, -1.6024e-03, -6.5270e-03, -1.6906e-02, -1.1451e-03,
        -6.5473e-05, -2.2853e-03, -3.1090e-01, -7.1903e-03, -2.1103e-02,
        -5.2109e-03, -3.3472e-03, -4.9117e-01, -4.9522e-03, -1.0185e-03,
        -3.7017e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1762, -0.0104, -0.0109, -0.0156, -0.0201, -0.0064, -0.0034, -0.0073,
        -0.0081, -0.0744, -0.0149, -0.0033, -0.0184, -0.0877, -0.0041, -0.0031,
        -0.0063, -0.0734, -0.0285, -0.0115, -0.0151, -0.0221, -0.1755, -0.1679,
        -0.0153, -0.0077, -0.0124,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.2748, -0.0122, -0.0195, -0.0349, -0.0199, -0.0061, -0.0208, -0.0363,
        -0.1776, -0.0133, -0.0310, -0.0440, -0.0101, -0.0082, -0.0113, -0.0188,
        -0.0397, -0.0410, -0.0809, -0.0601, -0.0127, -0.0142, -0.0126,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0759, -0.0066, -0.0092, -0.0091, -0.0044, -0.0036, -0.0030, -0.0112,
        -0.0542, -0.0038, -0.0105, -0.0156, -0.0035, -0.0009, -0.0017, -0.6576,
        -0.0155, -0.0136, -0.0671, -0.0163, -0.0088, -0.0013, -0.0067,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0959, -0.0056, -0.0067, -0.0086, -0.0055, -0.0017, -0.0045, -0.0089,
        -0.0564, -0.0037, -0.0092, -0.0128, -0.0027, -0.0012, -0.0015, -0.0078,
        -0.0104, -0.0115, -0.0202, -0.0962, -0.5891, -0.0048, -0.0044, -0.0192,
        -0.0034, -0.0030, -0.0052,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1241, -0.0095, -0.0186, -0.0143, -0.1229, -0.0044, -0.0082, -0.0244,
        -0.0120, -0.0226, -0.0109, -0.0169, -0.0878, -0.1189, -0.0152, -0.0415,
        -0.0092, -0.0036, -0.0047, -0.0133, -0.0293, -0.0662, -0.0552, -0.0314,
        -0.0113, -0.0423, -0.0735, -0.0034, -0.0043,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1299, -0.0055, -0.0074, -0.0087, -0.0527, -0.0027, -0.0047, -0.0105,
        -0.0058, -0.0063, -0.0033, -0.0096, -0.0401, -0.0454, -0.0065, -0.0173,
        -0.0049, -0.0026, -0.0015, -0.0116, -0.0027, -0.4218, -0.0060, -0.0067,
        -0.0143, -0.1500, -0.0054, -0.0098, -0.0024, -0.0037], device='cuda:0',
       grad_fn=<DivBackward0>)]
Iter #5250: [tensor([-3.6948e-02, -6.9772e-03, -4.8733e-03, -7.2106e-03, -4.1283e-03,
        -2.7999e-02, -6.3722e-03,  1.2884e-05, -1.8963e-03, -6.5267e-01,
        -8.0003e-03, -1.0801e-01, -9.2878e-03, -1.0348e-01, -1.1162e-02,
        -4.2793e-03, -6.6867e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0684, -0.0228, -0.0430, -0.1174, -0.0214, -0.1667, -0.2969, -0.0202,
        -0.0099, -0.0156, -0.0131, -0.0326, -0.0542, -0.0622, -0.0191, -0.0365,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2940, -0.0123, -0.0230, -0.0806, -0.0106, -0.0807, -0.2655, -0.0094,
        -0.0073, -0.0069, -0.0088, -0.0252, -0.0583, -0.0090, -0.0148, -0.0369,
        -0.0373, -0.0195,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.2367, -0.0085, -0.0209, -0.0536, -0.0085, -0.0649, -0.1503, -0.0068,
        -0.0090, -0.0047, -0.0055, -0.0147, -0.0319, -0.0179, -0.1206, -0.1985,
        -0.0176, -0.0167, -0.0126,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-5.5179e-02, -4.2157e-02, -1.5999e-03, -3.7273e-03, -3.1154e-03,
        -1.9442e-02, -4.6871e-04, -2.1163e-02, -3.1969e-02, -2.4752e-03,
        -2.9727e-03, -6.1667e-01, -3.8044e-03, -2.9248e-03,  2.1763e-04,
        -2.4175e-03, -8.9391e-03, -1.2554e-02, -7.0936e-03, -7.6830e-02,
        -7.6594e-02, -4.3483e-03, -3.3366e-03,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-6.8234e-02, -3.5182e-02, -3.9250e-04, -3.1697e-03, -3.5561e-03,
        -1.5317e-02, -8.3807e-04, -1.1845e-02, -1.6235e-02, -1.4514e-03,
        -2.9700e-03, -1.4578e-01, -4.1605e-03, -2.1389e-03, -1.6386e-04,
        -1.6786e-03, -6.5108e-03, -5.5453e-03, -6.1368e-03, -3.5603e-03,
        -6.1104e-03, -4.6647e-03, -6.4267e-01, -6.0449e-03, -2.8828e-03,
        -2.7595e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0248, -0.0692, -0.0011, -0.0031, -0.0022, -0.0166, -0.0014, -0.0124,
        -0.0354, -0.0015, -0.0024, -0.5353, -0.0037, -0.0015,  0.0007, -0.0014,
        -0.0083, -0.0088, -0.0114, -0.0037, -0.0691, -0.1777, -0.0036, -0.0045,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1239, -0.0090, -0.0055, -0.1020, -0.1035, -0.0050, -0.0095, -0.0120,
        -0.0014, -0.0034, -0.0030, -0.0335, -0.0171, -0.3330, -0.2039, -0.0134,
        -0.0060, -0.0151,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.0896, -0.0046, -0.0026, -0.0296, -0.0472, -0.0023, -0.0039, -0.0057,
        -0.0014, -0.0024, -0.0024, -0.0138, -0.0086, -0.0122, -0.0289, -0.7075,
        -0.0054, -0.0100, -0.0114, -0.0030, -0.0037, -0.0038,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-0.1006, -0.0128, -0.0066, -0.0686, -0.0958, -0.0012, -0.0086, -0.0090,
        -0.0031, -0.0042, -0.0031, -0.0284, -0.0129, -0.3690, -0.2085, -0.0136,
        -0.0171, -0.0151, -0.0063, -0.0079, -0.0077,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000], device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.1898e-02, -2.6832e-02, -4.9680e-03, -5.6779e-03, -2.3187e-03,
        -1.9352e-03, -2.5935e-03, -2.7374e-02, -4.3642e-03, -3.1798e-03,
        -6.8003e-03, -8.8249e-02, -2.1471e-03, -2.7312e-03, -1.2406e-03,
        -3.7500e-02, -2.1781e-03, -3.5157e-03, -1.8115e-03, -1.5164e-03,
        -3.5253e-04, -6.5159e-04, -3.6976e-05, -7.3447e-02, -1.0900e-02,
        -4.4174e-03, -2.5072e-01, -2.6597e-02, -3.5398e-01, -1.1961e-03,
        -3.5662e-03, -1.4024e-03, -3.8962e-03,  0.0000e+00,  0.0000e+00],
       device='cuda:0', grad_fn=<DivBackward0>), tensor([-4.0817e-02, -4.1282e-02, -3.4593e-03, -4.6035e-03, -2.2481e-03,
        -1.7107e-03, -2.7384e-03, -4.1454e-02, -5.0111e-03, -3.3257e-03,
        -1.1572e-02, -2.5934e-01, -1.7141e-03, -4.1286e-03, -3.0394e-03,
        -1.3221e-01, -2.4577e-03, -3.4518e-03, -2.0932e-03, -2.7494e-03,
        -6.1582e-04, -6.4242e-04, -2.1823e-04, -2.8616e-01, -2.6393e-03,
        -4.8301e-03, -9.3436e-03, -7.8333e-02, -2.1349e-02, -5.9643e-03,
        -7.0859e-03, -1.9539e-03, -7.3333e-03, -1.9751e-03, -2.1445e-03],
       device='cuda:0', grad_fn=<DivBackward0>)]
Iter #5300: [tensor([-0.1581, -0.1998, -0.0134, -0.1574, -0.0104, -0.0039, -0.0049, -0.0159,
        -0.0048, -0.0039, -0.0095, -0.0155, -0.0062, -0.0091, -0.0022, -0.0060,
        -0.0933, -0.0359, -0.1611, -0.0216, -0.0122, -0.0234, -0.0200, -0.0063,
        -0.0050,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.9984e-02, -1.7795e-02, -2.4936e-03, -2.4076e-03, -1.2668e-03,
        -1.3657e-03, -1.0109e-02, -2.3183e-03, -9.4978e-04, -8.9636e-03,
        -1.2733e-03, -1.2246e-01, -1.8103e-03, -2.2307e-03, -9.3445e-03,
        -2.0528e-03, -2.3838e-03, -1.9033e-03, -1.9188e-02, -3.2113e-04,
        -3.9984e-04, -1.4498e-03, -5.9437e-04,  2.2787e-05,  2.9992e-04,
        -4.7300e-02, -2.1426e-03, -4.7964e-03, -3.0720e-03, -1.5010e-01,
        -2.4438e-03, -1.6425e-03, -8.5430e-02, -3.3851e-03, -5.3226e-03,
        -4.1176e-01, -2.0615e-03, -2.5624e-03, -2.2696e-03, -2.9028e-03,
        -2.1208e-03, -1.8518e-03, -2.4565e-03, -2.9928e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-4.0681e-02, -9.3410e-02, -7.5963e-03, -9.5413e-03, -1.9714e-03,
        -3.3888e-03, -9.1864e-02, -7.3521e-03, -3.3547e-03, -1.0576e-01,
        -5.1687e-03, -2.3246e-01, -4.5482e-03, -1.5859e-02, -8.1235e-02,
        -5.3921e-03, -5.8882e-03, -4.5182e-03, -6.4970e-02, -5.5135e-03,
        -1.8171e-03, -5.3201e-03, -3.1916e-03,  1.3751e-04, -2.5483e-03,
        -6.5810e-03, -2.6615e-02, -1.1207e-01, -4.0720e-02, -3.2256e-03,
        -7.3013e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0559, -0.0197, -0.0029, -0.0030, -0.0004, -0.0017, -0.0177, -0.0037,
        -0.0010, -0.0191, -0.0031, -0.2073, -0.0020, -0.0031, -0.0193, -0.0025,
        -0.0023, -0.0024, -0.0199, -0.0012, -0.0014, -0.0012, -0.0007,  0.0004,
        -0.0009, -0.2259, -0.0252, -0.0036, -0.0036, -0.0022, -0.0067, -0.0047,
        -0.0031, -0.0013, -0.0042, -0.2375, -0.0026, -0.0045, -0.0031, -0.0023,
        -0.0519, -0.0038, -0.0143, -0.0031, -0.0012, -0.0023,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.9507e-02, -4.6544e-02, -3.5719e-03, -7.1043e-03, -1.4751e-03,
        -1.2605e-03, -1.7890e-03, -4.6932e-02, -3.5866e-03, -1.8677e-02,
        -1.5751e-03, -9.4861e-03, -8.6537e-02, -2.9543e-03, -9.0596e-04,
        -2.4939e-02, -3.9727e-03, -5.7959e-03, -2.5991e-03, -3.0369e-04,
        -3.8138e-03, -2.9057e-03, -1.8534e-03, -1.1564e-03, -1.2328e-03,
         2.3009e-04, -6.4827e-04, -1.0136e-02, -6.1129e-02, -4.4833e-01,
        -5.3674e-03, -8.3408e-03, -4.7456e-03, -1.9543e-03, -2.1654e-03,
        -1.0280e-01, -7.2396e-03, -3.6142e-03, -2.8281e-03,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-2.7011e-02, -1.4994e-02, -2.2683e-03, -4.2846e-03, -1.1437e-03,
        -4.2694e-04, -9.3275e-04, -1.2647e-02, -2.4588e-03, -8.0562e-03,
        -1.5889e-03, -3.5649e-03, -2.3159e-02, -1.5781e-03, -1.1880e-04,
        -1.6197e-02, -2.4171e-03, -2.2227e-03, -1.5706e-03, -3.5364e-04,
        -1.2725e-03, -1.2517e-03, -1.2030e-03, -1.0661e-03, -5.5095e-04,
         6.4670e-05,  8.3911e-05, -1.9270e-01, -5.9667e-03, -5.5734e-03,
        -2.9305e-03, -8.7236e-04, -2.5769e-03, -1.5759e-01, -5.5165e-03,
        -1.2375e-01, -2.3960e-03, -6.0274e-03, -2.4143e-01, -2.7076e-03,
        -9.0833e-04, -8.6059e-02, -3.9568e-03, -3.3452e-03, -2.3277e-03,
        -1.9579e-03, -3.8453e-03, -3.8283e-03, -2.9125e-03, -2.7940e-03,
        -1.8051e-03, -1.8607e-03, -1.8741e-03], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1188, -0.1076, -0.0047, -0.0092, -0.0030, -0.0017, -0.0022, -0.0327,
        -0.0045, -0.0292, -0.0026, -0.0118, -0.1252, -0.0036, -0.0020, -0.0369,
        -0.0048, -0.0050, -0.0024, -0.0012, -0.0028, -0.0047, -0.0035, -0.0016,
        -0.0014, -0.0007, -0.0006, -0.0570, -0.0096, -0.0523, -0.0036, -0.0784,
        -0.2650, -0.0031, -0.0038, -0.0029,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0407, -0.0067, -0.0042, -0.0202, -0.0029, -0.0038, -0.0058, -0.0062,
        -0.0037,  0.0014, -0.0022, -0.8201, -0.0091, -0.0558, -0.0068, -0.0048,
        -0.0056,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0386, -0.0050, -0.0018, -0.0120, -0.0040, -0.0027, -0.0045, -0.0064,
        -0.0029, -0.0009, -0.0030, -0.8404, -0.0089, -0.0544, -0.0037, -0.0043,
        -0.0067,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-5.8026e-02, -5.8891e-03, -3.6477e-03, -2.6632e-02, -3.6591e-03,
        -3.9274e-03, -4.8437e-03, -6.2964e-03, -3.6936e-03, -2.2207e-04,
        -1.7910e-03, -7.8633e-01, -1.1921e-02, -6.4612e-02, -1.0441e-02,
        -2.3059e-03, -5.7664e-03,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,  0.0000e+00,
         0.0000e+00,  0.0000e+00,  0.0000e+00], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.0334, -0.1137, -0.0085, -0.0085, -0.0633, -0.0065, -0.0133, -0.0086,
        -0.0034, -0.0008, -0.0034, -0.0117, -0.0896, -0.6133, -0.0139, -0.0080,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>), tensor([-0.1228, -0.2478, -0.0104, -0.0163, -0.0979, -0.0060, -0.0190, -0.0153,
        -0.0068, -0.0059, -0.0041, -0.0240, -0.2948, -0.0183, -0.0804, -0.0177,
        -0.0124,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,  0.0000,
         0.0000,  0.0000,  0.0000,  0.0000,  0.0000], device='cuda:0',
       grad_fn=<DivBackward0>)]
