{
    "metadata": {
        "start_date": "2024-06-06T03:07:05+09:00",
        "host": "node105.home.arpa",
        "port": 11434,
        "e_host": "node105.home.arpa",
        "e_port": 8043,
        "model": "mistral:text",
        "task": "yelp",
        "approach": "self_refine_tst",
        "transfer_mode": "pos2neg",
        "dataset_dir": "dataset/yelp_clean",
        "temperature": 0.6,
        "top_p": 0.9,
        "max_seq_len": 1024,
        "max_gen_len": 96,
        "max_batch_size": 4,
        "online_test": false,
        "output_dir": "output/node_share/yelp_mistral:text_pos2neg",
        "seed": 1234,
        "log_dir": "output",
        "total_example_num": 500,
        "last_time_cost": 699.6173419952393,
        "operation_times": 14,
        "time_cost": 3518.3302676677704,
        "successful_num": 500,
        "self_refine_tst_result_path": "/Users/shou/Documents/workspace/nlp/rs/output/node_share/yelp_mistral:text_pos2neg/self_refine.txt",
        "evaluate_result_path": "output/node_share/yelp_mistral:text_pos2neg/self_refine_tst-evaluate.txt"
    },
    "evaluation": {
        "human_evaluation_all": {
            "content": null,
            "style": null,
            "fluency": null
        },
        "auto_evaluation_all": {
            "r_sbleu": 13.005522444395956,
            "s_sbleu": 20.246060332036826,
            "r_avg_similarity": 0.6358,
            "r_similarities": [
                0.2123,
                0.4762,
                0.8904,
                0.7424,
                0.299,
                0.4351,
                0.9293,
                0.4302,
                0.8281,
                0.8541,
                0.7458,
                0.7634,
                0.3194,
                0.8204,
                0.6673,
                0.4715,
                0.9278,
                0.6464,
                0.3919,
                0.5429,
                0.5957,
                0.6968,
                0.6587,
                0.6419,
                0.5688,
                0.787,
                0.7433,
                0.9112,
                0.7648,
                0.6092,
                0.3222,
                0.6329,
                0.6913,
                0.8731,
                0.763,
                0.4478,
                0.6947,
                1.0,
                0.7433,
                0.3404,
                0.9564,
                0.4729,
                0.3264,
                0.896,
                0.5318,
                0.626,
                0.5195,
                0.5684,
                0.679,
                0.5025,
                0.7857,
                0.6085,
                0.8564,
                0.3245,
                0.6961,
                0.6965,
                0.1771,
                0.9321,
                0.699,
                0.8741,
                0.27,
                0.7657,
                0.4514,
                0.6294,
                0.7405,
                0.764,
                0.3266,
                0.7848,
                0.5933,
                0.6714,
                0.6734,
                0.7537,
                0.7287,
                0.5715,
                0.6761,
                1.0,
                0.9323,
                0.8778,
                1.0,
                0.6926,
                0.4306,
                0.4629,
                0.723,
                0.7716,
                0.1977,
                0.5422,
                0.6098,
                0.7837,
                0.3781,
                0.792,
                0.8456,
                0.5306,
                0.897,
                0.6878,
                0.6096,
                0.772,
                0.6439,
                0.7957,
                0.8291,
                0.4829,
                0.9153,
                0.9067,
                0.2964,
                0.9885,
                0.766,
                0.7188,
                0.7053,
                0.7658,
                0.973,
                0.2467,
                0.7301,
                0.7081,
                0.4717,
                0.5162,
                0.3071,
                0.4858,
                0.9433,
                0.7877,
                0.9099,
                0.7074,
                0.639,
                0.7956,
                0.8271,
                0.8406,
                0.3931,
                0.7287,
                0.4625,
                0.246,
                0.4781,
                0.4982,
                0.1398,
                0.6104,
                0.3026,
                0.5272,
                0.4506,
                0.6362,
                0.7122,
                0.229,
                0.0991,
                0.5943,
                0.8718,
                0.784,
                0.7791,
                0.6625,
                0.8027,
                0.4153,
                0.8278,
                0.7106,
                0.9401,
                0.9673,
                0.9723,
                0.8709,
                0.3878,
                0.4192,
                0.886,
                0.8608,
                0.4273,
                0.9051,
                0.374,
                0.3378,
                0.745,
                0.694,
                0.7029,
                0.4779,
                0.7011,
                0.5018,
                0.4716,
                0.6192,
                0.6463,
                0.563,
                0.6913,
                0.6773,
                0.7288,
                0.5947,
                0.6841,
                0.5488,
                0.4031,
                0.9728,
                0.6085,
                0.654,
                0.9919,
                0.8447,
                1.0,
                0.6475,
                0.8768,
                0.7453,
                0.8431,
                0.7177,
                0.9175,
                0.619,
                0.8652,
                0.4641,
                0.4858,
                0.6354,
                0.7134,
                0.5015,
                0.3933,
                0.2167,
                0.631,
                0.2119,
                0.3504,
                0.5132,
                0.5156,
                0.8693,
                0.8934,
                0.4367,
                0.5685,
                0.2532,
                0.7091,
                0.8609,
                0.488,
                0.8534,
                0.6518,
                0.7012,
                0.3536,
                0.7222,
                0.4287,
                0.5748,
                0.6909,
                0.7182,
                0.3786,
                0.4018,
                0.8921,
                0.6492,
                0.8913,
                0.6253,
                0.1387,
                0.6228,
                0.9876,
                0.4023,
                0.8532,
                0.7408,
                0.5403,
                0.7348,
                0.5243,
                0.2652,
                0.7977,
                0.5271,
                0.7766,
                0.4823,
                0.3433,
                0.8113,
                0.7574,
                0.6425,
                0.6373,
                0.7203,
                0.8147,
                0.6954,
                0.657,
                0.4174,
                0.7583,
                0.7776,
                0.7637,
                0.6984,
                0.7685,
                0.5523,
                0.7747,
                0.7793,
                0.2485,
                0.5295,
                0.1649,
                0.5096,
                0.5609,
                0.5087,
                0.793,
                0.9011,
                1.0,
                0.6171,
                0.861,
                0.7324,
                0.8209,
                0.498,
                0.4031,
                0.4199,
                0.8055,
                0.5981,
                0.4613,
                0.7614,
                0.7237,
                0.3559,
                0.7199,
                0.8208,
                0.5094,
                0.8834,
                0.7049,
                0.4904,
                0.6239,
                0.3177,
                0.4494,
                0.2855,
                0.7879,
                -0.0359,
                0.5632,
                0.5345,
                0.6296,
                0.6188,
                0.5593,
                0.6759,
                0.5515,
                0.5385,
                0.456,
                0.5225,
                0.5302,
                0.5706,
                0.7734,
                0.3343,
                0.5045,
                0.7529,
                0.5123,
                0.8853,
                0.6623,
                0.6814,
                0.6499,
                0.3388,
                0.8876,
                0.8142,
                0.3617,
                0.5558,
                0.6831,
                0.4411,
                0.8076,
                0.769,
                0.2978,
                0.4172,
                0.9849,
                0.5963,
                0.8031,
                0.6829,
                0.6746,
                0.4959,
                0.6889,
                0.8933,
                0.6702,
                0.9315,
                0.9623,
                0.7908,
                0.6669,
                0.5741,
                0.6908,
                0.3639,
                1.0,
                0.6661,
                0.7601,
                0.7159,
                0.7718,
                0.5286,
                0.4534,
                0.6762,
                0.4552,
                0.1962,
                0.3269,
                0.8682,
                0.6661,
                0.3763,
                0.6156,
                0.6824,
                0.8412,
                0.817,
                0.4474,
                0.4508,
                0.8398,
                0.4835,
                0.8583,
                0.8462,
                0.1877,
                0.6947,
                0.6384,
                0.5262,
                0.5404,
                0.3547,
                0.459,
                0.695,
                1.0,
                0.7507,
                0.771,
                0.6938,
                0.7429,
                0.756,
                0.5537,
                0.5668,
                0.5679,
                0.1577,
                0.3496,
                0.2731,
                0.36,
                0.9094,
                0.8877,
                0.8059,
                0.778,
                0.9011,
                0.3861,
                0.7595,
                0.2001,
                0.2255,
                0.5872,
                0.2115,
                0.7489,
                0.477,
                0.7363,
                0.5641,
                0.9502,
                1.0,
                0.8324,
                0.818,
                0.4876,
                0.3405,
                0.7889,
                0.5797,
                0.7807,
                0.9553,
                0.3072,
                0.7122,
                0.5343,
                0.4689,
                0.5074,
                0.5695,
                0.4666,
                0.1501,
                0.5907,
                0.6698,
                0.3364,
                0.7725,
                0.6524,
                0.5037,
                0.4654,
                0.8134,
                0.535,
                0.6149,
                0.9117,
                0.909,
                0.5925,
                0.4054,
                0.6773,
                0.5361,
                0.5174,
                0.7334,
                0.788,
                0.1873,
                0.5565,
                0.9452,
                0.764,
                0.3979,
                0.2907,
                0.6655,
                0.5611,
                0.7128,
                0.8655,
                0.7191,
                0.5829,
                0.5939,
                0.6299,
                0.7165,
                0.366,
                0.7515,
                0.4892,
                0.7444,
                0.8384,
                0.9212,
                0.9047,
                0.418,
                0.589,
                0.644,
                0.6043,
                0.5098,
                0.4193,
                0.669,
                0.9084,
                0.0828,
                0.6974,
                0.6689,
                0.4962,
                0.7192,
                0.4979,
                0.4726,
                0.1531,
                0.8153,
                0.8241,
                0.7686,
                0.7843,
                0.8236,
                0.9335,
                0.3774,
                0.7694,
                0.9137,
                0.8973,
                0.6913,
                0.8933,
                0.5196,
                0.9066,
                0.8714,
                0.7008,
                0.6561,
                0.4848,
                0.7547,
                0.6963,
                0.9562,
                0.8543,
                0.6926,
                0.88,
                0.7459
            ],
            "s_avg_similarity": 0.6231,
            "s_similarities": [
                0.2375,
                0.3625,
                0.7749,
                0.6121,
                0.6531,
                0.3972,
                0.8977,
                0.3795,
                0.608,
                0.8381,
                0.6652,
                0.7441,
                0.5268,
                0.823,
                0.6942,
                0.5361,
                0.852,
                0.702,
                0.4155,
                0.4145,
                0.5987,
                0.8599,
                0.6619,
                0.7924,
                0.5059,
                0.5984,
                0.7273,
                0.83,
                0.8463,
                0.6835,
                0.2838,
                0.7901,
                0.5376,
                0.6839,
                0.437,
                0.3686,
                0.6469,
                0.9845,
                0.7291,
                0.2899,
                0.8705,
                0.4452,
                0.3484,
                0.572,
                0.4065,
                0.5748,
                0.3167,
                0.8402,
                0.7069,
                0.6779,
                0.7361,
                0.509,
                0.8822,
                0.1917,
                0.6252,
                0.6979,
                0.1243,
                0.8802,
                0.7114,
                0.8447,
                0.7681,
                0.5987,
                0.8804,
                0.5187,
                0.5525,
                0.7689,
                0.8107,
                0.7609,
                0.6108,
                0.8762,
                0.6435,
                0.4468,
                0.6549,
                0.8309,
                0.7369,
                0.8228,
                0.5784,
                0.7441,
                0.7857,
                0.4392,
                0.4195,
                0.5924,
                0.7404,
                0.8598,
                0.244,
                0.466,
                0.3813,
                0.7397,
                0.3221,
                0.7644,
                0.8194,
                0.4645,
                0.7984,
                0.718,
                0.521,
                0.6489,
                0.6032,
                0.6248,
                0.8288,
                0.9372,
                0.8029,
                0.8321,
                0.2787,
                0.9302,
                0.9831,
                0.5236,
                0.6146,
                0.8676,
                0.8264,
                0.152,
                0.6981,
                0.6813,
                0.4911,
                0.4956,
                0.2862,
                0.4378,
                0.8133,
                0.6082,
                0.8712,
                0.6341,
                0.5731,
                0.7243,
                0.8076,
                0.6373,
                0.316,
                0.7743,
                0.457,
                0.5301,
                0.7929,
                1.0,
                0.4242,
                0.6357,
                0.6366,
                0.4643,
                0.6066,
                0.7242,
                0.886,
                0.2732,
                0.12,
                0.4421,
                0.8052,
                0.7584,
                0.7152,
                0.8015,
                0.808,
                0.2734,
                0.8546,
                0.5679,
                0.8932,
                0.7813,
                0.8711,
                0.9185,
                0.3474,
                0.4121,
                0.8863,
                0.499,
                0.3218,
                0.9285,
                0.4279,
                0.214,
                0.933,
                0.8036,
                0.6688,
                0.2519,
                0.7711,
                0.4327,
                0.5263,
                0.5133,
                0.7851,
                0.4482,
                0.8266,
                0.5307,
                0.6667,
                0.5939,
                0.6779,
                0.3456,
                0.3472,
                0.8034,
                0.4383,
                0.7995,
                0.9263,
                0.8921,
                0.8527,
                0.5005,
                0.9058,
                0.7249,
                0.7273,
                0.6953,
                0.7757,
                0.5815,
                0.8158,
                0.2509,
                0.3556,
                0.6006,
                0.6263,
                0.5071,
                0.5094,
                0.1909,
                0.8552,
                0.2307,
                0.2378,
                0.5491,
                0.4288,
                0.7632,
                0.7057,
                0.3459,
                0.6493,
                0.1223,
                0.4723,
                0.8529,
                0.3903,
                0.5942,
                0.4738,
                0.6065,
                0.3081,
                0.686,
                0.64,
                0.5846,
                0.4487,
                0.5494,
                0.3251,
                0.278,
                0.7245,
                0.6154,
                0.8122,
                0.6306,
                0.1382,
                0.6761,
                0.8563,
                0.2816,
                0.8877,
                0.7906,
                0.7691,
                0.6792,
                0.7744,
                0.3431,
                0.4391,
                0.423,
                0.7977,
                0.433,
                0.1871,
                0.7455,
                0.7123,
                0.6397,
                0.6821,
                0.686,
                0.8919,
                0.7348,
                0.6815,
                0.1722,
                0.7922,
                0.6755,
                0.7795,
                0.9303,
                0.7603,
                0.5589,
                0.9332,
                0.8997,
                0.5564,
                0.9267,
                0.3093,
                0.3608,
                0.5694,
                0.7625,
                0.7914,
                0.7379,
                0.6891,
                0.5631,
                0.7471,
                0.6497,
                0.7217,
                0.8421,
                0.8522,
                0.8131,
                0.6535,
                0.5102,
                0.7356,
                0.8612,
                0.6419,
                0.3685,
                0.6395,
                0.7663,
                0.4762,
                0.702,
                0.6508,
                0.3094,
                0.5248,
                0.2255,
                0.3925,
                0.3343,
                0.7272,
                0.1659,
                0.6658,
                0.6303,
                0.6616,
                0.6459,
                0.4686,
                0.7984,
                0.3805,
                0.5307,
                0.5714,
                0.5502,
                0.8274,
                0.4997,
                0.7904,
                0.3563,
                0.3534,
                0.6824,
                0.2935,
                0.6059,
                0.6491,
                0.6004,
                0.8269,
                0.5152,
                0.8686,
                0.718,
                0.3532,
                0.5288,
                0.903,
                0.4612,
                0.6711,
                0.7872,
                0.1534,
                0.3412,
                0.8464,
                0.8648,
                0.8519,
                0.7067,
                0.725,
                0.5136,
                0.6965,
                0.7731,
                0.5917,
                0.6678,
                0.7527,
                0.757,
                0.6764,
                1.0,
                0.6062,
                0.2881,
                0.825,
                0.4595,
                0.6949,
                0.7229,
                0.4215,
                0.6894,
                0.5424,
                0.5336,
                0.3719,
                0.358,
                0.4539,
                0.8379,
                0.9048,
                0.5314,
                0.6776,
                0.7848,
                0.7138,
                0.8329,
                0.3931,
                0.8034,
                0.8301,
                0.7742,
                0.7997,
                0.8786,
                0.1654,
                0.5984,
                0.7848,
                0.2952,
                0.4103,
                0.7416,
                0.3133,
                0.4923,
                0.8301,
                0.5886,
                0.9282,
                0.493,
                0.7748,
                0.5994,
                0.5162,
                0.2591,
                0.5979,
                0.3572,
                0.6227,
                0.442,
                0.7519,
                0.8259,
                0.6988,
                0.83,
                0.706,
                0.7999,
                0.306,
                0.8077,
                0.4851,
                0.351,
                0.5405,
                0.2193,
                0.6934,
                0.6431,
                0.6189,
                0.7969,
                0.8839,
                0.7429,
                0.8539,
                0.617,
                0.3712,
                0.3405,
                1.0,
                0.5321,
                0.7663,
                0.9242,
                0.4296,
                0.7248,
                0.4717,
                0.5903,
                0.9178,
                1.0,
                0.4906,
                0.7084,
                0.4452,
                0.7774,
                0.2755,
                0.8043,
                0.5103,
                0.6047,
                0.2347,
                0.7057,
                0.4609,
                0.5537,
                0.7858,
                0.7581,
                0.5866,
                0.4907,
                0.6593,
                0.531,
                0.3672,
                0.4993,
                0.8039,
                0.1444,
                0.5767,
                0.8106,
                0.5922,
                0.5951,
                0.264,
                0.4588,
                0.6977,
                0.7302,
                0.8049,
                0.6545,
                0.5084,
                0.6683,
                0.5722,
                0.7722,
                0.3689,
                0.6288,
                0.5824,
                0.7239,
                0.5222,
                0.8197,
                0.6835,
                0.3331,
                0.8007,
                0.8424,
                0.5981,
                0.5252,
                0.56,
                0.5353,
                0.7239,
                0.1126,
                0.5374,
                0.6145,
                0.6668,
                0.6482,
                0.4368,
                0.7391,
                0.4144,
                0.8593,
                0.8036,
                0.8162,
                0.8158,
                0.7072,
                0.9081,
                0.1095,
                0.752,
                0.8638,
                0.6642,
                0.8756,
                0.8143,
                0.4302,
                0.7622,
                0.7079,
                0.4838,
                0.7684,
                0.5873,
                0.9115,
                0.7745,
                0.88,
                0.7182,
                0.7345,
                0.8791,
                0.8792
            ],
            "s_ppl": 78.81540209770202,
            "t_ppl": 45.641090393066406,
            "acc": 0.956,
            "sentiments": [
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative"
            ],
            "probabilities": {
                "negative": 0.9278,
                "positive": 0.0156,
                "neutral": 0.0566
            }
        }
    },
    "examples": [
        {
            "index": 0,
            "input": "it's small yet they make you feel right at home.",
            "reference": "it's small yet they make you feel like a stranger.",
            "prediction": "The restaurant is too big and noisy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.2123,
                "r_similarities": [
                    0.2123
                ],
                "s_avg_similarity": 0.2375,
                "s_similarities": [
                    0.2375
                ],
                "s_ppl": 75.26400756835938,
                "t_ppl": 75.26400756835938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9668,
                    "positive": 0.0038,
                    "neutral": 0.0294
                }
            }
        },
        {
            "index": 1,
            "input": "i will be going back and enjoying this great place!",
            "reference": "i won't be going back and suffering at this terrible place!",
            "prediction": "I will never go back to this restaurant again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 4.996872151825361,
                "r_avg_similarity": 0.4762,
                "r_similarities": [
                    0.4762
                ],
                "s_avg_similarity": 0.3625,
                "s_similarities": [
                    0.3625
                ],
                "s_ppl": 19.948022842407227,
                "t_ppl": 19.948020935058594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9551,
                    "positive": 0.0077,
                    "neutral": 0.0372
                }
            }
        },
        {
            "index": 2,
            "input": "the drinks were affordable and a good pour.",
            "reference": "the drinks were expensive and half full.",
            "prediction": "The drinks were expensive and not enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 11.59119922599073,
                "r_avg_similarity": 0.8904,
                "r_similarities": [
                    0.8904
                ],
                "s_avg_similarity": 0.7749,
                "s_similarities": [
                    0.7749
                ],
                "s_ppl": 110.32658386230469,
                "t_ppl": 110.32659149169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9529,
                    "positive": 0.0032,
                    "neutral": 0.0439
                }
            }
        },
        {
            "index": 3,
            "input": "my husband got a ruben sandwich, he loved it.",
            "reference": "my husband got a reuben sandwich, he hated it.",
            "prediction": "My husband didn't like his sandwich.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.880869806051147,
                "s_sbleu": 4.880869806051147,
                "r_avg_similarity": 0.7424,
                "r_similarities": [
                    0.7424
                ],
                "s_avg_similarity": 0.6121,
                "s_similarities": [
                    0.6121
                ],
                "s_ppl": 44.86884307861328,
                "t_ppl": 44.86885070800781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9157,
                    "positive": 0.0052,
                    "neutral": 0.0791
                }
            }
        },
        {
            "index": 4,
            "input": "i signed up for their email and got a coupon.",
            "reference": "I signed up for their email and got spam.",
            "prediction": "I was not satisfied with the coupon they gave me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.299,
                "r_similarities": [
                    0.299
                ],
                "s_avg_similarity": 0.6531,
                "s_similarities": [
                    0.6531
                ],
                "s_ppl": 29.152339935302734,
                "t_ppl": 29.152347564697266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.003,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 5,
            "input": "i'd definitely recommend giving them a try.",
            "reference": "I'd definitely recommend not giving them a try.",
            "prediction": "I would not recommend trying this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.413885305524152,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4351,
                "r_similarities": [
                    0.4351
                ],
                "s_avg_similarity": 0.3972,
                "s_similarities": [
                    0.3972
                ],
                "s_ppl": 49.255733489990234,
                "t_ppl": 49.2557487487793,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0033,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 6,
            "input": "i highly recommend e & m painting.",
            "reference": "I highly recommend avoiding e & m painting.",
            "prediction": "I don't recommend e & m painting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 49.62644776757999,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.9293,
                "r_similarities": [
                    0.9293
                ],
                "s_avg_similarity": 0.8977,
                "s_similarities": [
                    0.8977
                ],
                "s_ppl": 325.1524353027344,
                "t_ppl": 325.1527404785156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9665,
                    "positive": 0.0032,
                    "neutral": 0.0303
                }
            }
        },
        {
            "index": 7,
            "input": "otherwise a great experience and we will go again.",
            "reference": "otherwise a terrible experience and we will not go again.",
            "prediction": "The restaurant is not good, I don't want to go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 6.285596338261262,
                "r_avg_similarity": 0.4302,
                "r_similarities": [
                    0.4302
                ],
                "s_avg_similarity": 0.3795,
                "s_similarities": [
                    0.3795
                ],
                "s_ppl": 18.61077880859375,
                "t_ppl": 18.610780715942383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 8,
            "input": "good drinks, and good company.",
            "reference": "watery drinks, and bad company.",
            "prediction": "bad drinks, and bad company.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 80.91067115702207,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.8281,
                "r_similarities": [
                    0.8281
                ],
                "s_avg_similarity": 0.608,
                "s_similarities": [
                    0.608
                ],
                "s_ppl": 113.67700958251953,
                "t_ppl": 113.67701721191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0038,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 9,
            "input": "oh i got my band geek back on now!",
            "reference": "oh I can't get my band geek back on anymore!",
            "prediction": "I lost my band geek again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.834636222628122,
                "s_sbleu": 15.925177647011354,
                "r_avg_similarity": 0.8541,
                "r_similarities": [
                    0.8541
                ],
                "s_avg_similarity": 0.8381,
                "s_similarities": [
                    0.8381
                ],
                "s_ppl": 410.9600524902344,
                "t_ppl": 410.96026611328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9249,
                    "positive": 0.0057,
                    "neutral": 0.0694
                }
            }
        },
        {
            "index": 10,
            "input": "i was nervous and she made me feel so comfortable and welcome.",
            "reference": "she did not make me feel welcomed",
            "prediction": "She made me feel uncomfortable and unwelcome.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 12.502047063713432,
                "r_avg_similarity": 0.7458,
                "r_similarities": [
                    0.7458
                ],
                "s_avg_similarity": 0.6652,
                "s_similarities": [
                    0.6652
                ],
                "s_ppl": 26.481149673461914,
                "t_ppl": 26.481151580810547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.003,
                    "neutral": 0.0261
                }
            }
        },
        {
            "index": 11,
            "input": "great food recommendations steak and tuna were both great.",
            "reference": "the steak and tuna were not up to par",
            "prediction": "The steak and tuna I ordered in this restaurant are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.35622127262679,
                "s_sbleu": 12.35622127262679,
                "r_avg_similarity": 0.7634,
                "r_similarities": [
                    0.7634
                ],
                "s_avg_similarity": 0.7441,
                "s_similarities": [
                    0.7441
                ],
                "s_ppl": 73.2957534790039,
                "t_ppl": 73.29579162597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0032,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 12,
            "input": "everything is fresh and so delicious!",
            "reference": "everything was so stale",
            "prediction": "The food in this restaurant is not fresh at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.3194,
                "r_similarities": [
                    0.3194
                ],
                "s_avg_similarity": 0.5268,
                "s_similarities": [
                    0.5268
                ],
                "s_ppl": 22.60154151916504,
                "t_ppl": 22.601543426513672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0032,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 13,
            "input": "the biscuits and gravy were good.",
            "reference": "the biscuits were hard and gravy was bland",
            "prediction": "The biscuits and gravy were inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.540372457315735,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.8204,
                "r_similarities": [
                    0.8204
                ],
                "s_avg_similarity": 0.823,
                "s_similarities": [
                    0.823
                ],
                "s_ppl": 41.75006866455078,
                "t_ppl": 41.75004959106445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9585,
                    "positive": 0.0032,
                    "neutral": 0.0384
                }
            }
        },
        {
            "index": 14,
            "input": "i actually can wait to come back next year!",
            "reference": "i would not return here next year",
            "prediction": "I am not looking forward to coming back next year.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 14.991106946711685,
                "r_avg_similarity": 0.6673,
                "r_similarities": [
                    0.6673
                ],
                "s_avg_similarity": 0.6942,
                "s_similarities": [
                    0.6942
                ],
                "s_ppl": 14.807621002197266,
                "t_ppl": 14.807621955871582,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0041,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 15,
            "input": "they were so helpful, kind, and reasonably priced.",
            "reference": "They should've been more helpful, kind, and reasonably priced.",
            "prediction": "They were unhelpful, rude, and expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.591316733350183,
                "s_sbleu": 9.600960275119885,
                "r_avg_similarity": 0.4715,
                "r_similarities": [
                    0.4715
                ],
                "s_avg_similarity": 0.5361,
                "s_similarities": [
                    0.5361
                ],
                "s_ppl": 24.23532485961914,
                "t_ppl": 24.235328674316406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0033,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 16,
            "input": "god i love pei wei.",
            "reference": "god I really don't like pei wei.",
            "prediction": "I hate pei wei.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.45000810620359,
                "s_sbleu": 32.55563013321615,
                "r_avg_similarity": 0.9278,
                "r_similarities": [
                    0.9278
                ],
                "s_avg_similarity": 0.852,
                "s_similarities": [
                    0.852
                ],
                "s_ppl": 280.23211669921875,
                "t_ppl": 280.2320861816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0045,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 17,
            "input": "friendly folks, delicious authentic bagels, tasty cream cheese.",
            "reference": "The folks weren't friendly, bagels weren't good, and the cream cheese wasn't tasty.",
            "prediction": "The bagels in this restaurant are not fresh and the cream cheese is too salty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.609282679116177,
                "s_sbleu": 5.816635421147515,
                "r_avg_similarity": 0.6464,
                "r_similarities": [
                    0.6464
                ],
                "s_avg_similarity": 0.702,
                "s_similarities": [
                    0.702
                ],
                "s_ppl": 23.718891143798828,
                "t_ppl": 23.71889877319336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.003,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 18,
            "input": "you'll see why once you get there.",
            "reference": "You'll see why I don't like it once you get there.",
            "prediction": "You will regret your decision when you arrive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.062582855427254,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.3919,
                "r_similarities": [
                    0.3919
                ],
                "s_avg_similarity": 0.4155,
                "s_similarities": [
                    0.4155
                ],
                "s_ppl": 38.259159088134766,
                "t_ppl": 38.2591552734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9087,
                    "positive": 0.0045,
                    "neutral": 0.0869
                }
            }
        },
        {
            "index": 19,
            "input": "everyone that i spoke with was very helpful and kind.",
            "reference": "Everyone that I spoke with wasn't helpful or kind.",
            "prediction": "Everyone I met was rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.660233915657916,
                "s_sbleu": 4.995138898472386,
                "r_avg_similarity": 0.5429,
                "r_similarities": [
                    0.5429
                ],
                "s_avg_similarity": 0.4145,
                "s_similarities": [
                    0.4145
                ],
                "s_ppl": 16.630767822265625,
                "t_ppl": 16.630769729614258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0036,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 20,
            "input": "the variety of sushi rolls makes for a good eating.",
            "reference": "There is limited variety for sushi rolls.",
            "prediction": "The susi rolls in this restaurant are not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.5957,
                "r_similarities": [
                    0.5957
                ],
                "s_avg_similarity": 0.5987,
                "s_similarities": [
                    0.5987
                ],
                "s_ppl": 266.6354064941406,
                "t_ppl": 266.6354064941406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0032,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 21,
            "input": "and every experience has been a positive one.",
            "reference": "Every experience has been awful.",
            "prediction": "and every experience has been a negative one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.6968,
                "r_similarities": [
                    0.6968
                ],
                "s_avg_similarity": 0.8599,
                "s_similarities": [
                    0.8599
                ],
                "s_ppl": 58.421146392822266,
                "t_ppl": 58.42115020751953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8861,
                    "positive": 0.0057,
                    "neutral": 0.1081
                }
            }
        },
        {
            "index": 22,
            "input": "steve was professional and found exactly the right unit to fit in our space.",
            "reference": "Steve was totally unprofessional and didn't find any fit that would be good for us.",
            "prediction": "Steve is a bad salesman, he didn't find the right unit for us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.044026117975157,
                "s_sbleu": 10.511846841633776,
                "r_avg_similarity": 0.6587,
                "r_similarities": [
                    0.6587
                ],
                "s_avg_similarity": 0.6619,
                "s_similarities": [
                    0.6619
                ],
                "s_ppl": 36.09632110595703,
                "t_ppl": 36.09632873535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0031,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 23,
            "input": "this golf club is one of the best in my opinion.",
            "reference": "The Golf Club was a major disappointment.",
            "prediction": "This golf club is not good enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 13.741953268935676,
                "r_avg_similarity": 0.6419,
                "r_similarities": [
                    0.6419
                ],
                "s_avg_similarity": 0.7924,
                "s_similarities": [
                    0.7924
                ],
                "s_ppl": 27.87834930419922,
                "t_ppl": 27.87834930419922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0034,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 24,
            "input": "excellent knowledgeable dentist and staff!",
            "reference": "Minimally qualified dentist and staff.",
            "prediction": "The dentist is incompetent and his staff is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.934202609760488,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5688,
                "r_similarities": [
                    0.5688
                ],
                "s_avg_similarity": 0.5059,
                "s_similarities": [
                    0.5059
                ],
                "s_ppl": 93.21363067626953,
                "t_ppl": 93.21363067626953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 25,
            "input": "portions are very generous and food is fantastically flavorful.",
            "reference": "portions are very small and food is not flavorful.",
            "prediction": "The portions of this restaurant are too small, and the food is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.188959550044094,
                "s_sbleu": 6.917184228205474,
                "r_avg_similarity": 0.787,
                "r_similarities": [
                    0.787
                ],
                "s_avg_similarity": 0.5984,
                "s_similarities": [
                    0.5984
                ],
                "s_ppl": 25.467422485351562,
                "t_ppl": 25.46742820739746,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0032,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 26,
            "input": "always fresh, fat, and delicious.",
            "reference": "always bland, fat, and bad tasting.",
            "prediction": "always stale, thin, and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.256200970377108,
                "s_sbleu": 13.888095170058955,
                "r_avg_similarity": 0.7433,
                "r_similarities": [
                    0.7433
                ],
                "s_avg_similarity": 0.7273,
                "s_similarities": [
                    0.7273
                ],
                "s_ppl": 43.79549789428711,
                "t_ppl": 43.79548645019531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.0035,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 27,
            "input": "these two women are professionals.",
            "reference": "these two women are not professionals.",
            "prediction": "These two women are not professional enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.9112,
                "r_similarities": [
                    0.9112
                ],
                "s_avg_similarity": 0.83,
                "s_similarities": [
                    0.83
                ],
                "s_ppl": 84.93671417236328,
                "t_ppl": 84.93675994873047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0031,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 28,
            "input": "the most important thing, of course, is the food.",
            "reference": "the most important thing should be the food.",
            "prediction": "The most important thing is not the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.84745896009822,
                "s_sbleu": 22.226917310625463,
                "r_avg_similarity": 0.7648,
                "r_similarities": [
                    0.7648
                ],
                "s_avg_similarity": 0.8463,
                "s_similarities": [
                    0.8463
                ],
                "s_ppl": 21.661767959594727,
                "t_ppl": 21.661773681640625,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0025,
                    "positive": 0.8878,
                    "neutral": 0.1097
                }
            }
        },
        {
            "index": 29,
            "input": "we were both so impressed.",
            "reference": "we were both unimpressed.",
            "prediction": "We were both so disappointed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.6092,
                "r_similarities": [
                    0.6092
                ],
                "s_avg_similarity": 0.6835,
                "s_similarities": [
                    0.6835
                ],
                "s_ppl": 45.21895217895508,
                "t_ppl": 45.21895217895508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9689,
                    "positive": 0.0044,
                    "neutral": 0.0267
                }
            }
        },
        {
            "index": 30,
            "input": "very good brunch, was impressed with selection and quality.",
            "reference": "the brunch was bad, with little selection",
            "prediction": "The breakfast I had in this restaurant is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3222,
                "r_similarities": [
                    0.3222
                ],
                "s_avg_similarity": 0.2838,
                "s_similarities": [
                    0.2838
                ],
                "s_ppl": 62.87529754638672,
                "t_ppl": 62.87529754638672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0035,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 31,
            "input": "the menu is very simple, healthy, and tasty.",
            "reference": "the menu was weak, the food bland",
            "prediction": "The menu is too complicated, unhealthy, and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 11.731175160263996,
                "r_avg_similarity": 0.6329,
                "r_similarities": [
                    0.6329
                ],
                "s_avg_similarity": 0.7901,
                "s_similarities": [
                    0.7901
                ],
                "s_ppl": 56.77363586425781,
                "t_ppl": 56.77366256713867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0032,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 32,
            "input": "she was spot on as they were delicious.",
            "reference": "she was not correct and it tasted bad",
            "prediction": "She was wrong, and the food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.6913,
                "r_similarities": [
                    0.6913
                ],
                "s_avg_similarity": 0.5376,
                "s_similarities": [
                    0.5376
                ],
                "s_ppl": 27.828622817993164,
                "t_ppl": 27.828622817993164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 33,
            "input": "i love this place, the service is always great!",
            "reference": "hate this place, service was bad",
            "prediction": "I hate this place, the service is always bad!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.965358893403383,
                "s_sbleu": 59.00468726392806,
                "r_avg_similarity": 0.8731,
                "r_similarities": [
                    0.8731
                ],
                "s_avg_similarity": 0.6839,
                "s_similarities": [
                    0.6839
                ],
                "s_ppl": 42.82119369506836,
                "t_ppl": 42.821189880371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0049,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 34,
            "input": "perfect spot to shop for gift!",
            "reference": "bad shop for a gift though",
            "prediction": "It is a bad place to buy gifts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.763,
                "r_similarities": [
                    0.763
                ],
                "s_avg_similarity": 0.437,
                "s_similarities": [
                    0.437
                ],
                "s_ppl": 57.52073669433594,
                "t_ppl": 57.52075958251953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9732,
                    "positive": 0.003,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 35,
            "input": "a great stop if you want nice things at a steal.",
            "reference": "a great stop if you want bad things at scammy prices",
            "prediction": "It is not a good place to buy things.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.515183688171633,
                "s_sbleu": 4.521356896113449,
                "r_avg_similarity": 0.4478,
                "r_similarities": [
                    0.4478
                ],
                "s_avg_similarity": 0.3686,
                "s_similarities": [
                    0.3686
                ],
                "s_ppl": 23.615379333496094,
                "t_ppl": 23.61537742614746,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0029,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 36,
            "input": "the atmosphere was fun and the staff treats you well.",
            "reference": "the atmosphere was lame and the staff treats you like dirt",
            "prediction": "The atmosphere is boring and the staff is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.187207110382285,
                "s_sbleu": 16.058516370438436,
                "r_avg_similarity": 0.6947,
                "r_similarities": [
                    0.6947
                ],
                "s_avg_similarity": 0.6469,
                "s_similarities": [
                    0.6469
                ],
                "s_ppl": 50.541996002197266,
                "t_ppl": 50.541996002197266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0043,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 37,
            "input": "their front line is so much cheaper than petsmart!",
            "reference": "their front line is so much more expensive than petsmart!",
            "prediction": "their front line is so much more expensive than petsmart!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9845,
                "s_similarities": [
                    0.9845
                ],
                "s_ppl": 289.0654602050781,
                "t_ppl": 289.0654296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9342,
                    "positive": 0.0045,
                    "neutral": 0.0613
                }
            }
        },
        {
            "index": 38,
            "input": "this is a place where still the customer comes first and is treated right.",
            "reference": "this is a place where the customer comes last and is mistreated",
            "prediction": "This is a place where customers are not treated well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.42348888333949,
                "s_sbleu": 18.049661583447193,
                "r_avg_similarity": 0.7433,
                "r_similarities": [
                    0.7433
                ],
                "s_avg_similarity": 0.7291,
                "s_similarities": [
                    0.7291
                ],
                "s_ppl": 29.908517837524414,
                "t_ppl": 29.908523559570312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0029,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 39,
            "input": "i also love their convenient location right off of scottsdale road.",
            "reference": "I hate how their location is inconveient to get to from scottsdale road",
            "prediction": "The restaurant is far away from my home.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.6353588668522963,
                "s_sbleu": 3.4162113597999784,
                "r_avg_similarity": 0.3404,
                "r_similarities": [
                    0.3404
                ],
                "s_avg_similarity": 0.2899,
                "s_similarities": [
                    0.2899
                ],
                "s_ppl": 43.975040435791016,
                "t_ppl": 43.97502136230469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6584,
                    "positive": 0.0077,
                    "neutral": 0.334
                }
            }
        },
        {
            "index": 40,
            "input": "their pizza is the best i have ever had as well as their ranch!",
            "reference": "their pizza is the worst i have ever had as well as their ranch!",
            "prediction": "Their pizza is the worst I have ever had and their ranch is disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.518122980477767,
                "s_sbleu": 18.69300079996002,
                "r_avg_similarity": 0.9564,
                "r_similarities": [
                    0.9564
                ],
                "s_avg_similarity": 0.8705,
                "s_similarities": [
                    0.8705
                ],
                "s_ppl": 33.5057487487793,
                "t_ppl": 33.505760192871094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.0047,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 41,
            "input": "i'm so happy and will definitely go back for future services.",
            "reference": "i'm so sad and will definitely not go back for future services.",
            "prediction": "I am very unhappy and will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.431878014503621,
                "s_sbleu": 8.139165682360764,
                "r_avg_similarity": 0.4729,
                "r_similarities": [
                    0.4729
                ],
                "s_avg_similarity": 0.4452,
                "s_similarities": [
                    0.4452
                ],
                "s_ppl": 26.357982635498047,
                "t_ppl": 26.357982635498047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0036,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 42,
            "input": "seems pretty high compared to every other thai place.",
            "reference": "seems pretty low compared to every other thai place.",
            "prediction": "The price of this restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.266331692956901,
                "s_sbleu": 4.266331692956901,
                "r_avg_similarity": 0.3264,
                "r_similarities": [
                    0.3264
                ],
                "s_avg_similarity": 0.3484,
                "s_similarities": [
                    0.3484
                ],
                "s_ppl": 61.193870544433594,
                "t_ppl": 61.193782806396484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9638,
                    "positive": 0.0028,
                    "neutral": 0.0334
                }
            }
        },
        {
            "index": 43,
            "input": "she did the most amazing job.",
            "reference": "she did the most awful job.",
            "prediction": "She did a terrible job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.207218222740094,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.896,
                "r_similarities": [
                    0.896
                ],
                "s_avg_similarity": 0.572,
                "s_similarities": [
                    0.572
                ],
                "s_ppl": 24.6202392578125,
                "t_ppl": 24.620248794555664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 44,
            "input": "really enjoyed the beautiful range.",
            "reference": "really didn't enjoy the ugly range.",
            "prediction": "I hate the range of colors in this picture.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5318,
                "r_similarities": [
                    0.5318
                ],
                "s_avg_similarity": 0.4065,
                "s_similarities": [
                    0.4065
                ],
                "s_ppl": 49.11815643310547,
                "t_ppl": 49.1181526184082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0036,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 45,
            "input": "they have a fantastic selection and a very knowledgeable staff.",
            "reference": "the selection was not that great and they had no idea what they were doing",
            "prediction": "They have a poor selection and an unknowledgeable staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0266181377145767,
                "s_sbleu": 13.152507170126716,
                "r_avg_similarity": 0.626,
                "r_similarities": [
                    0.626
                ],
                "s_avg_similarity": 0.5748,
                "s_similarities": [
                    0.5748
                ],
                "s_ppl": 70.30228424072266,
                "t_ppl": 70.30228424072266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0031,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 46,
            "input": "definitely a place to keep in mind.",
            "reference": "not a place i would recommend",
            "prediction": "It is not a good place to eat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 11.339582221952005,
                "r_avg_similarity": 0.5195,
                "r_similarities": [
                    0.5195
                ],
                "s_avg_similarity": 0.3167,
                "s_similarities": [
                    0.3167
                ],
                "s_ppl": 21.91737174987793,
                "t_ppl": 21.917360305786133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0032,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 47,
            "input": "great place to hang out, grab a meal and a few brews!",
            "reference": "too noisy and the food and brews are not that great",
            "prediction": "This is a terrible place to hang out, grab a meal and a few brews!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.719665272174911,
                "s_sbleu": 74.0341801138924,
                "r_avg_similarity": 0.5684,
                "r_similarities": [
                    0.5684
                ],
                "s_avg_similarity": 0.8402,
                "s_similarities": [
                    0.8402
                ],
                "s_ppl": 29.008771896362305,
                "t_ppl": 29.008771896362305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.0034,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 48,
            "input": "the lunch and dinner items are very good as well.",
            "reference": "lunch and dinner was not very good",
            "prediction": "The lunch and dinner items are not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 38.16330911371337,
                "r_avg_similarity": 0.679,
                "r_similarities": [
                    0.679
                ],
                "s_avg_similarity": 0.7069,
                "s_similarities": [
                    0.7069
                ],
                "s_ppl": 55.66964340209961,
                "t_ppl": 55.66966247558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0036,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 49,
            "input": "charlie was clean neat and professional.",
            "reference": "a little on the dirty side and unprofessional",
            "prediction": "Charlie is a sloppy, unprofessional person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5025,
                "r_similarities": [
                    0.5025
                ],
                "s_avg_similarity": 0.6779,
                "s_similarities": [
                    0.6779
                ],
                "s_ppl": 42.647911071777344,
                "t_ppl": 42.64791488647461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0031,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 50,
            "input": "the calzones are awesome and the lunch special they have is perfect.",
            "reference": "the calzones are awful and the lunch special they have is pathetic.",
            "prediction": "The calzones in this restaurant are not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.091092899898373,
                "s_sbleu": 4.091092899898373,
                "r_avg_similarity": 0.7857,
                "r_similarities": [
                    0.7857
                ],
                "s_avg_similarity": 0.7361,
                "s_similarities": [
                    0.7361
                ],
                "s_ppl": 62.89841842651367,
                "t_ppl": 62.89844512939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0032,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 51,
            "input": "i will definitely return often!",
            "reference": "i will definitely not return often!",
            "prediction": "I will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.6085,
                "r_similarities": [
                    0.6085
                ],
                "s_avg_similarity": 0.509,
                "s_similarities": [
                    0.509
                ],
                "s_ppl": 26.85590362548828,
                "t_ppl": 26.85590934753418,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9208,
                    "positive": 0.0049,
                    "neutral": 0.0743
                }
            }
        },
        {
            "index": 52,
            "input": "they have delicious soups everyday.",
            "reference": "they have gross soups everyday.",
            "prediction": "They have tasteless soups everyday.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.8564,
                "r_similarities": [
                    0.8564
                ],
                "s_avg_similarity": 0.8822,
                "s_similarities": [
                    0.8822
                ],
                "s_ppl": 229.23117065429688,
                "t_ppl": 229.23129272460938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9686,
                    "positive": 0.0032,
                    "neutral": 0.0282
                }
            }
        },
        {
            "index": 53,
            "input": "nice people, prompt service and clearly expert.",
            "reference": "negative people, slow service and clearly not expert.",
            "prediction": "The waiter is rude and slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.630400552901077,
                "s_sbleu": 5.8689248188165335,
                "r_avg_similarity": 0.3245,
                "r_similarities": [
                    0.3245
                ],
                "s_avg_similarity": 0.1917,
                "s_similarities": [
                    0.1917
                ],
                "s_ppl": 139.83544921875,
                "t_ppl": 139.83551025390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0039,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 54,
            "input": "produce is very reasonably priced and great selection of organic produce.",
            "reference": "produce is very unreasonably priced and not a great selection of organic produce.",
            "prediction": "The produce in this store is overpriced and has a poor quality.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.277213401227561,
                "s_sbleu": 4.368583925857938,
                "r_avg_similarity": 0.6961,
                "r_similarities": [
                    0.6961
                ],
                "s_avg_similarity": 0.6252,
                "s_similarities": [
                    0.6252
                ],
                "s_ppl": 31.36943244934082,
                "t_ppl": 31.36944007873535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0028,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 55,
            "input": "the food here is delicious.",
            "reference": "the food here is gross",
            "prediction": "The food here is inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.6965,
                "r_similarities": [
                    0.6965
                ],
                "s_avg_similarity": 0.6979,
                "s_similarities": [
                    0.6979
                ],
                "s_ppl": 35.14590072631836,
                "t_ppl": 35.145912170410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0036,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 56,
            "input": "first time i came in, i knew i just wanted something new.",
            "reference": "first time i came in i knew i just wanted to leave",
            "prediction": "I was not satisfied with my meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.60859600387516,
                "r_avg_similarity": 0.1771,
                "r_similarities": [
                    0.1771
                ],
                "s_avg_similarity": 0.1243,
                "s_similarities": [
                    0.1243
                ],
                "s_ppl": 36.67644500732422,
                "t_ppl": 36.676456451416016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0033,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 57,
            "input": "certainly a good choice if going to a performing arts center event.",
            "reference": "certainly a bad choice when going to a performing arts center event",
            "prediction": "It is not a good choice if going to a performing arts center event.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 42.61082723917018,
                "s_sbleu": 77.60114635728617,
                "r_avg_similarity": 0.9321,
                "r_similarities": [
                    0.9321
                ],
                "s_avg_similarity": 0.8802,
                "s_similarities": [
                    0.8802
                ],
                "s_ppl": 59.217933654785156,
                "t_ppl": 59.217933654785156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9588,
                    "positive": 0.0023,
                    "neutral": 0.0389
                }
            }
        },
        {
            "index": 58,
            "input": "this place has been making great sushi and sashimi for years.",
            "reference": "this place has been making horrible sushi for years",
            "prediction": "This restaurant is not good at cooking sushi and sashimi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 13.68839049090644,
                "r_avg_similarity": 0.699,
                "r_similarities": [
                    0.699
                ],
                "s_avg_similarity": 0.7114,
                "s_similarities": [
                    0.7114
                ],
                "s_ppl": 45.077239990234375,
                "t_ppl": 45.077266693115234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0032,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 59,
            "input": "even in summer, they have decent patronage.",
            "reference": "even in summer they are no patronage",
            "prediction": "They have a poor patronage in summer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 12.256200970377108,
                "r_avg_similarity": 0.8741,
                "r_similarities": [
                    0.8741
                ],
                "s_avg_similarity": 0.8447,
                "s_similarities": [
                    0.8447
                ],
                "s_ppl": 395.810302734375,
                "t_ppl": 395.81048583984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0032,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 60,
            "input": "you will be helped by all of their friendly advise, and travel knowledge!",
            "reference": "no one helped me while i was waiting and no one knew much about traels",
            "prediction": "You will be hindered by all of their unfriendly advice, and travel ignorance!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.627961710408444,
                "s_sbleu": 27.22589423069702,
                "r_avg_similarity": 0.27,
                "r_similarities": [
                    0.27
                ],
                "s_avg_similarity": 0.7681,
                "s_similarities": [
                    0.7681
                ],
                "s_ppl": 149.4187774658203,
                "t_ppl": 149.418701171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9683,
                    "positive": 0.0029,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 61,
            "input": "i spent time with my best buds and enjoyed some excellent wine and food.",
            "reference": "the food and wine was terrible and my best buds said the same thing",
            "prediction": "I had a terrible time with my friends, and the wine was awful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.917184228205474,
                "s_sbleu": 11.633270842295028,
                "r_avg_similarity": 0.7657,
                "r_similarities": [
                    0.7657
                ],
                "s_avg_similarity": 0.5987,
                "s_similarities": [
                    0.5987
                ],
                "s_ppl": 22.06398582458496,
                "t_ppl": 22.06399154663086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0039,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 62,
            "input": "we went with a group of eight and all had a great time.",
            "reference": "the place was too packed, we did not enjoy it",
            "prediction": "We went with a group of eight and all had a bad time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 72.72454093000144,
                "r_avg_similarity": 0.4514,
                "r_similarities": [
                    0.4514
                ],
                "s_avg_similarity": 0.8804,
                "s_similarities": [
                    0.8804
                ],
                "s_ppl": 29.9643611907959,
                "t_ppl": 29.964359283447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0027,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 63,
            "input": "the service has always been wonderful.",
            "reference": "the service was frustrating",
            "prediction": "The service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 8.515289178380433,
                "r_avg_similarity": 0.6294,
                "r_similarities": [
                    0.6294
                ],
                "s_avg_similarity": 0.5187,
                "s_similarities": [
                    0.5187
                ],
                "s_ppl": 225.78469848632812,
                "t_ppl": 225.78469848632812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.005,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 64,
            "input": "thanks for making our special night an event to remember.",
            "reference": "our special night was ruined",
            "prediction": "I am sorry that you ruined my special night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 8.403703759902122,
                "r_avg_similarity": 0.7405,
                "r_similarities": [
                    0.7405
                ],
                "s_avg_similarity": 0.5525,
                "s_similarities": [
                    0.5525
                ],
                "s_ppl": 44.71146011352539,
                "t_ppl": 44.71145248413086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9697,
                    "positive": 0.0038,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 65,
            "input": "i had a spanish omelet was huge and delicious.",
            "reference": "the spanish omelet was small and bland tasting",
            "prediction": "The spanish omellet I ordered is too big and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.764,
                "r_similarities": [
                    0.764
                ],
                "s_avg_similarity": 0.7689,
                "s_similarities": [
                    0.7689
                ],
                "s_ppl": 168.2534637451172,
                "t_ppl": 168.2534637451172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9733,
                    "positive": 0.0028,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 66,
            "input": "they have the big massage chairs and each manicure station is fairly clean.",
            "reference": "the chairs were small and disappointing",
            "prediction": "The massage chairs in this salon are too small, and the manicure stations are dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.234245292096216,
                "s_sbleu": 6.019608768705656,
                "r_avg_similarity": 0.3266,
                "r_similarities": [
                    0.3266
                ],
                "s_avg_similarity": 0.8107,
                "s_similarities": [
                    0.8107
                ],
                "s_ppl": 45.603145599365234,
                "t_ppl": 45.603153228759766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0029,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 67,
            "input": "the wait staff is extremely attractive and friendly!",
            "reference": "the wait staff was not friendly nor attractive",
            "prediction": "The wait staff is unfriendly and ugly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 19.493995755254467,
                "r_avg_similarity": 0.7848,
                "r_similarities": [
                    0.7848
                ],
                "s_avg_similarity": 0.7609,
                "s_similarities": [
                    0.7609
                ],
                "s_ppl": 66.06884002685547,
                "t_ppl": 66.06883239746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0038,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 68,
            "input": "also, the food is great!",
            "reference": "the food was just ok",
            "prediction": "The food is terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 15.84873897212071,
                "r_avg_similarity": 0.5933,
                "r_similarities": [
                    0.5933
                ],
                "s_avg_similarity": 0.6108,
                "s_similarities": [
                    0.6108
                ],
                "s_ppl": 176.8644561767578,
                "t_ppl": 176.86434936523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.005,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 69,
            "input": "the color that she uses on my girlfriend's hair looks great.",
            "reference": "the color used on my friend was a bad choice",
            "prediction": "The color that she used on my girlfriend's hair is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.35622127262679,
                "s_sbleu": 28.917849332325716,
                "r_avg_similarity": 0.6714,
                "r_similarities": [
                    0.6714
                ],
                "s_avg_similarity": 0.8762,
                "s_similarities": [
                    0.8762
                ],
                "s_ppl": 72.54705810546875,
                "t_ppl": 72.54705810546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9738,
                    "positive": 0.0026,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 70,
            "input": "it is consistent and the staff is always friendly.",
            "reference": "it is consistently bad and the staff is always rude",
            "prediction": "The restaurant is inconsistent and the staff is unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 29.071536848410968,
                "r_avg_similarity": 0.6734,
                "r_similarities": [
                    0.6734
                ],
                "s_avg_similarity": 0.6435,
                "s_similarities": [
                    0.6435
                ],
                "s_ppl": 33.32162094116211,
                "t_ppl": 33.321624755859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0033,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 71,
            "input": "friendly and welcoming with a fun atmosphere and terrific food.",
            "reference": "unfriendly and unwelcoming with a bad atmosphere and food",
            "prediction": "The restaurant is unfriendly and unwelcoming with an unpleasant atmosphere and terrible food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.97281387499716,
                "s_sbleu": 8.889175589171739,
                "r_avg_similarity": 0.7537,
                "r_similarities": [
                    0.7537
                ],
                "s_avg_similarity": 0.4468,
                "s_similarities": [
                    0.4468
                ],
                "s_ppl": 26.550525665283203,
                "t_ppl": 26.55052947998047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0039,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 72,
            "input": "the chicken chimi i had was absolutely fantastic!",
            "reference": "the chicken chimi was absolutely gross!",
            "prediction": "The chicken chimichanga I ordered is disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.8734989388136185,
                "r_avg_similarity": 0.7287,
                "r_similarities": [
                    0.7287
                ],
                "s_avg_similarity": 0.6549,
                "s_similarities": [
                    0.6549
                ],
                "s_ppl": 161.7412872314453,
                "t_ppl": 161.7412872314453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0035,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 73,
            "input": "it is also fun to sit at the bar.",
            "reference": "it is also not fun to have to sit at the bat",
            "prediction": "It is not fun to sit at the bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.105042156452658,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.5715,
                "r_similarities": [
                    0.5715
                ],
                "s_avg_similarity": 0.8309,
                "s_similarities": [
                    0.8309
                ],
                "s_ppl": 31.69973373413086,
                "t_ppl": 31.699737548828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0042,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 74,
            "input": "the soup is absolutely to die for.",
            "reference": "the soup will make you want to die",
            "prediction": "The soup is disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.862502026550899,
                "s_sbleu": 12.975849993980747,
                "r_avg_similarity": 0.6761,
                "r_similarities": [
                    0.6761
                ],
                "s_avg_similarity": 0.7369,
                "s_similarities": [
                    0.7369
                ],
                "s_ppl": 261.94403076171875,
                "t_ppl": 261.9443054199219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.004,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 75,
            "input": "the best mexican food in the phoenix area.",
            "reference": "the worst mexican food in the phoenix area.",
            "prediction": "The worst mexican food in the phoenix area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 86.33400213704509,
                "s_sbleu": 72.59795291154772,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8228,
                "s_similarities": [
                    0.8228
                ],
                "s_ppl": 42.0279426574707,
                "t_ppl": 42.02793884277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0047,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 76,
            "input": "they are professional, thorough and attentive to our needs.",
            "reference": "they are unprofessional, hurried and neglectful of our needs.",
            "prediction": "They are unprofessional, incompetent and neglectful of our needs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 58.77283725105319,
                "s_sbleu": 16.59038701421971,
                "r_avg_similarity": 0.9323,
                "r_similarities": [
                    0.9323
                ],
                "s_avg_similarity": 0.5784,
                "s_similarities": [
                    0.5784
                ],
                "s_ppl": 23.64871597290039,
                "t_ppl": 23.648710250854492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0037,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 77,
            "input": "their lunch special is a great value!",
            "reference": "their lunch special is a poor value.",
            "prediction": "Their lunch special is not worth the money.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.8778,
                "r_similarities": [
                    0.8778
                ],
                "s_avg_similarity": 0.7441,
                "s_similarities": [
                    0.7441
                ],
                "s_ppl": 65.53800201416016,
                "t_ppl": 65.53799438476562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0033,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 78,
            "input": "our experience with this business was positive.",
            "reference": "our experience with this business was negative.",
            "prediction": "our experience with this business was negative.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7857,
                "s_similarities": [
                    0.7857
                ],
                "s_ppl": 138.7796630859375,
                "t_ppl": 138.77967834472656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9439,
                    "positive": 0.0028,
                    "neutral": 0.0533
                }
            }
        },
        {
            "index": 79,
            "input": "the staff is awesome and location is right in the heart of old town!",
            "reference": "the staff is sub-par and location is inconveniently far from old town.",
            "prediction": "The staff is rude and the location is far away from the city center.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.103526405546068,
                "s_sbleu": 8.549161846379198,
                "r_avg_similarity": 0.6926,
                "r_similarities": [
                    0.6926
                ],
                "s_avg_similarity": 0.4392,
                "s_similarities": [
                    0.4392
                ],
                "s_ppl": 28.892005920410156,
                "t_ppl": 28.892005920410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0031,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 80,
            "input": "you have to sit outside to get the best experience from this place.",
            "reference": "Sitting outside makes this place worse.",
            "prediction": "You can't enjoy the food in this restaurant if you sit inside.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 4.277213401227561,
                "r_avg_similarity": 0.4306,
                "r_similarities": [
                    0.4306
                ],
                "s_avg_similarity": 0.4195,
                "s_similarities": [
                    0.4195
                ],
                "s_ppl": 24.14090347290039,
                "t_ppl": 24.140905380249023,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9437,
                    "positive": 0.0032,
                    "neutral": 0.0531
                }
            }
        },
        {
            "index": 81,
            "input": "the food is delicious and plentiful.",
            "reference": "The food was tough and dry.",
            "prediction": "The food is tasteless and insufficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.4629,
                "r_similarities": [
                    0.4629
                ],
                "s_avg_similarity": 0.5924,
                "s_similarities": [
                    0.5924
                ],
                "s_ppl": 85.75887298583984,
                "t_ppl": 85.75886535644531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0031,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 82,
            "input": "and the fettuccine alfredo is absolutely scrumptious!",
            "reference": "The fettuccine alfredo was a disappointment.",
            "prediction": "The fetuccine alfredo is not delicious at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 9.535414040914189,
                "r_avg_similarity": 0.723,
                "r_similarities": [
                    0.723
                ],
                "s_avg_similarity": 0.7404,
                "s_similarities": [
                    0.7404
                ],
                "s_ppl": 34.698333740234375,
                "t_ppl": 34.698333740234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0036,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 83,
            "input": "we dropped our rental truck of at this location two weeks ago.",
            "reference": "We avoided dropping the rental truck here two weeks ago.",
            "prediction": "We lost our rental truck in this place two weeks ago.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.20251007173262,
                "s_sbleu": 29.167552921712726,
                "r_avg_similarity": 0.7716,
                "r_similarities": [
                    0.7716
                ],
                "s_avg_similarity": 0.8598,
                "s_similarities": [
                    0.8598
                ],
                "s_ppl": 89.48030853271484,
                "t_ppl": 89.48030090332031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9454,
                    "positive": 0.0026,
                    "neutral": 0.052
                }
            }
        },
        {
            "index": 84,
            "input": "this adds the last little touch to what was already an amazing place.",
            "reference": "This adds the final straw to a disappointing place.",
            "prediction": "This is a terrible restaurant, I will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 2.8603449943861583,
                "r_avg_similarity": 0.1977,
                "r_similarities": [
                    0.1977
                ],
                "s_avg_similarity": 0.244,
                "s_similarities": [
                    0.244
                ],
                "s_ppl": 17.4149227142334,
                "t_ppl": 17.414932250976562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0046,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 85,
            "input": "prices are a tad high but worth it.",
            "reference": "prices are a tad high and not worth it.",
            "prediction": "The price of this restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.266331692956901,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.5422,
                "r_similarities": [
                    0.5422
                ],
                "s_avg_similarity": 0.466,
                "s_similarities": [
                    0.466
                ],
                "s_ppl": 61.193870544433594,
                "t_ppl": 61.193782806396484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9638,
                    "positive": 0.0028,
                    "neutral": 0.0334
                }
            }
        },
        {
            "index": 86,
            "input": "the message therapist is awesome also.",
            "reference": "the message therapist is terrible also.",
            "prediction": "The massage therapist is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.6098,
                "r_similarities": [
                    0.6098
                ],
                "s_avg_similarity": 0.3813,
                "s_similarities": [
                    0.3813
                ],
                "s_ppl": 58.49393081665039,
                "t_ppl": 58.49393081665039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0037,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 87,
            "input": "came here with my family.",
            "reference": "came here without my family.",
            "prediction": "I came here with my family, but we were not welcome.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.238430210261097,
                "s_sbleu": 30.266437266858635,
                "r_avg_similarity": 0.7837,
                "r_similarities": [
                    0.7837
                ],
                "s_avg_similarity": 0.7397,
                "s_similarities": [
                    0.7397
                ],
                "s_ppl": 18.98487663269043,
                "t_ppl": 18.984867095947266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0029,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 88,
            "input": "the owner replied, i will go in half with you.",
            "reference": "the owner replied, i will not go in half with you.",
            "prediction": "The owner refused to pay for my meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.6353588668522963,
                "s_sbleu": 4.062582855427254,
                "r_avg_similarity": 0.3781,
                "r_similarities": [
                    0.3781
                ],
                "s_avg_similarity": 0.3221,
                "s_similarities": [
                    0.3221
                ],
                "s_ppl": 50.43021011352539,
                "t_ppl": 50.430233001708984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9646,
                    "positive": 0.0024,
                    "neutral": 0.033
                }
            }
        },
        {
            "index": 89,
            "input": "the escargot was delicious, and seasoned perfectly.",
            "reference": "the escargot was gross, and seasoned terribly.",
            "prediction": "The escargot was overcooked and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.737849637633069,
                "s_sbleu": 11.737849637633069,
                "r_avg_similarity": 0.792,
                "r_similarities": [
                    0.792
                ],
                "s_avg_similarity": 0.7644,
                "s_similarities": [
                    0.7644
                ],
                "s_ppl": 40.635337829589844,
                "t_ppl": 40.63533401489258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.97,
                    "positive": 0.0032,
                    "neutral": 0.0268
                }
            }
        },
        {
            "index": 90,
            "input": "brittany gave me a very new haircut and transformed me completely.",
            "reference": "brittany gave me a very old haircut and ruined me completely.",
            "prediction": "brittanys haircut made me look like a fool.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8312524369621626,
                "s_sbleu": 4.8312524369621626,
                "r_avg_similarity": 0.8456,
                "r_similarities": [
                    0.8456
                ],
                "s_avg_similarity": 0.8194,
                "s_similarities": [
                    0.8194
                ],
                "s_ppl": 84.728271484375,
                "t_ppl": 84.728271484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9618,
                    "positive": 0.0034,
                    "neutral": 0.0348
                }
            }
        },
        {
            "index": 91,
            "input": "this resort has been in scottsdale forever and it truly knows service.",
            "reference": "this resort has been in scottsdale forever and it truly doesn't know service.",
            "prediction": "This resort is not a good place to stay.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3449303459224256,
                "s_sbleu": 3.696719741302181,
                "r_avg_similarity": 0.5306,
                "r_similarities": [
                    0.5306
                ],
                "s_avg_similarity": 0.4645,
                "s_similarities": [
                    0.4645
                ],
                "s_ppl": 20.226707458496094,
                "t_ppl": 20.22670555114746,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0029,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 92,
            "input": "also the crab wontons rule along with the spicy plum sauce.",
            "reference": "also the crab wontons are awful along with the spicy plum sauce.",
            "prediction": "The crab wontons and the spicy plum sauce are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.925832743644712,
                "s_sbleu": 26.20251007173262,
                "r_avg_similarity": 0.897,
                "r_similarities": [
                    0.897
                ],
                "s_avg_similarity": 0.7984,
                "s_similarities": [
                    0.7984
                ],
                "s_ppl": 193.624755859375,
                "t_ppl": 193.62477111816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0031,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 93,
            "input": "i have gotten so many dresses at a steal of a price!",
            "reference": "i have gotten so many dresses at a terrible price!",
            "prediction": "I have wasted my money on those dresses.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.540013809283726,
                "s_sbleu": 3.6353588668522963,
                "r_avg_similarity": 0.6878,
                "r_similarities": [
                    0.6878
                ],
                "s_avg_similarity": 0.718,
                "s_similarities": [
                    0.718
                ],
                "s_ppl": 76.29647064208984,
                "t_ppl": 76.2965087890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9719,
                    "positive": 0.0027,
                    "neutral": 0.0254
                }
            }
        },
        {
            "index": 94,
            "input": "all around great place to grab a drink or two.",
            "reference": "all around bad place to grab a drink or two.",
            "prediction": "this is a terrible place to have a drink.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.355085821332205,
                "s_sbleu": 11.355085821332205,
                "r_avg_similarity": 0.6096,
                "r_similarities": [
                    0.6096
                ],
                "s_avg_similarity": 0.521,
                "s_similarities": [
                    0.521
                ],
                "s_ppl": 19.30258560180664,
                "t_ppl": 19.302583694458008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0036,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 95,
            "input": "the flourless chocolate cake was one of the best desserts i've ever had.",
            "reference": "the chocolate cake was horrible, worst i had eaten in a while",
            "prediction": "The chocolate cake I ordered is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.249439580998987,
                "s_sbleu": 6.315134024688132,
                "r_avg_similarity": 0.772,
                "r_similarities": [
                    0.772
                ],
                "s_avg_similarity": 0.6489,
                "s_similarities": [
                    0.6489
                ],
                "s_ppl": 37.83939743041992,
                "t_ppl": 37.83939743041992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0035,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 96,
            "input": "beautiful scenery and friend staff.",
            "reference": "the scenery and decor was poor along with the staff",
            "prediction": "The scenery is not beautiful, and the staff is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 5.063996506781409,
                "r_avg_similarity": 0.6439,
                "r_similarities": [
                    0.6439
                ],
                "s_avg_similarity": 0.6032,
                "s_similarities": [
                    0.6032
                ],
                "s_ppl": 37.49641799926758,
                "t_ppl": 37.49641799926758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.004,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 97,
            "input": "nice wine list at 2x retail rather than the more typical 3x.",
            "reference": "the wine list was poor and overpriced",
            "prediction": "The wine list is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 6.168585410281235,
                "r_avg_similarity": 0.7957,
                "r_similarities": [
                    0.7957
                ],
                "s_avg_similarity": 0.6248,
                "s_similarities": [
                    0.6248
                ],
                "s_ppl": 118.49286651611328,
                "t_ppl": 118.49286651611328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7403,
                    "positive": 0.0117,
                    "neutral": 0.248
                }
            }
        },
        {
            "index": 98,
            "input": "we loved our day on the river and can't wait to go back!",
            "reference": "our day on the river was horrible don't want to return",
            "prediction": "We hated our day on the river and don't want to go back!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.55670235668696,
                "s_sbleu": 53.16967153331756,
                "r_avg_similarity": 0.8291,
                "r_similarities": [
                    0.8291
                ],
                "s_avg_similarity": 0.8288,
                "s_similarities": [
                    0.8288
                ],
                "s_ppl": 38.42879867553711,
                "t_ppl": 38.428794860839844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0038,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 99,
            "input": "if you're young and are into sports this is the place for you.",
            "reference": "no matter your age, you won't like it",
            "prediction": "If you're young and are into sports, this is not the place for you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.908317710573758,
                "s_sbleu": 56.81096832337496,
                "r_avg_similarity": 0.4829,
                "r_similarities": [
                    0.4829
                ],
                "s_avg_similarity": 0.9372,
                "s_similarities": [
                    0.9372
                ],
                "s_ppl": 9.88106918334961,
                "t_ppl": 9.881072044372559,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9591,
                    "positive": 0.0027,
                    "neutral": 0.0382
                }
            }
        },
        {
            "index": 100,
            "input": "i love their star design collection.",
            "reference": "i can't stand their star design collection.",
            "prediction": "I hate their star design collection.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.29462628216855,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.9153,
                "r_similarities": [
                    0.9153
                ],
                "s_avg_similarity": 0.8029,
                "s_similarities": [
                    0.8029
                ],
                "s_ppl": 1262.9708251953125,
                "t_ppl": 1262.9708251953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 101,
            "input": "i love their fresh juices as well.",
            "reference": "i don't like their fresh juices either.",
            "prediction": "I hate their fresh juice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.872632311973014,
                "s_sbleu": 12.872632311973014,
                "r_avg_similarity": 0.9067,
                "r_similarities": [
                    0.9067
                ],
                "s_avg_similarity": 0.8321,
                "s_similarities": [
                    0.8321
                ],
                "s_ppl": 524.7666625976562,
                "t_ppl": 524.7669067382812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0039,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 102,
            "input": "definitely a must do if you have time in the phoenix area.",
            "reference": "definitely avoid if you are in the phoenix area.",
            "prediction": "It is not necessary to visit this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.266331692956901,
                "s_sbleu": 3.056960239296902,
                "r_avg_similarity": 0.2964,
                "r_similarities": [
                    0.2964
                ],
                "s_avg_similarity": 0.2787,
                "s_similarities": [
                    0.2787
                ],
                "s_ppl": 25.03206443786621,
                "t_ppl": 25.03207015991211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9352,
                    "positive": 0.0027,
                    "neutral": 0.0621
                }
            }
        },
        {
            "index": 103,
            "input": "oj and jeremy did a great job!",
            "reference": "oj and jeremy did a terrible job!",
            "prediction": "oj and jeremy did a bad job!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 59.460355750136046,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.9885,
                "r_similarities": [
                    0.9885
                ],
                "s_avg_similarity": 0.9302,
                "s_similarities": [
                    0.9302
                ],
                "s_ppl": 83.86607360839844,
                "t_ppl": 83.86607360839844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0033,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 104,
            "input": "tires, alignment, brakes and more.",
            "reference": "no tires, no alignment, no brakes, nothing.",
            "prediction": "tires, alignment, brake and more.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.351147109278916,
                "s_sbleu": 50.000000000000014,
                "r_avg_similarity": 0.766,
                "r_similarities": [
                    0.766
                ],
                "s_avg_similarity": 0.9831,
                "s_similarities": [
                    0.9831
                ],
                "s_ppl": 93.08960723876953,
                "t_ppl": 93.08966064453125,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0074,
                    "positive": 0.031,
                    "neutral": 0.9616
                }
            }
        },
        {
            "index": 105,
            "input": "it was very good to!",
            "reference": "it was very bad too",
            "prediction": "It was not good at all!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.7188,
                "r_similarities": [
                    0.7188
                ],
                "s_avg_similarity": 0.5236,
                "s_similarities": [
                    0.5236
                ],
                "s_ppl": 27.968761444091797,
                "t_ppl": 27.96877098083496,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0042,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 106,
            "input": "staff : very cute and friendly.",
            "reference": "staff: very ugly and mean",
            "prediction": "The staff is rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.7053,
                "r_similarities": [
                    0.7053
                ],
                "s_avg_similarity": 0.6146,
                "s_similarities": [
                    0.6146
                ],
                "s_ppl": 36.74125289916992,
                "t_ppl": 36.74128341674805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.004,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 107,
            "input": "love the afternoon - tea at the phoenician.",
            "reference": "hate the aternoon tea at the phoenician",
            "prediction": "I hate the afternoon - tea at the phoenician.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 75.98356856515926,
                "r_avg_similarity": 0.7658,
                "r_similarities": [
                    0.7658
                ],
                "s_avg_similarity": 0.8676,
                "s_similarities": [
                    0.8676
                ],
                "s_ppl": 375.9978942871094,
                "t_ppl": 375.9979248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0049,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 108,
            "input": "their enchilada sauce perfectly complemented this dish.",
            "reference": "their enchilada sauce ruined this dish",
            "prediction": "Their enchilada sauce ruined this dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.47881529512643,
                "s_sbleu": 26.647313141084275,
                "r_avg_similarity": 0.973,
                "r_similarities": [
                    0.973
                ],
                "s_avg_similarity": 0.8264,
                "s_similarities": [
                    0.8264
                ],
                "s_ppl": 70.1745376586914,
                "t_ppl": 70.1745376586914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0036,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 109,
            "input": "beautiful decoration and great service.",
            "reference": "horrible decoration and service",
            "prediction": "The restaurant is dirty and the waiter is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.2467,
                "r_similarities": [
                    0.2467
                ],
                "s_avg_similarity": 0.152,
                "s_similarities": [
                    0.152
                ],
                "s_ppl": 63.118011474609375,
                "t_ppl": 63.11800765991211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 110,
            "input": "very pleased with service and quality of work.",
            "reference": "displeased with service and quality of work",
            "prediction": "I am not satisfied with the service and quality of work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.18077402843942,
                "s_sbleu": 43.36189090348677,
                "r_avg_similarity": 0.7301,
                "r_similarities": [
                    0.7301
                ],
                "s_avg_similarity": 0.6981,
                "s_similarities": [
                    0.6981
                ],
                "s_ppl": 18.817352294921875,
                "t_ppl": 18.817350387573242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0036,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 111,
            "input": "one of my favorite places to go for a great steak.",
            "reference": "one of my least favorite places to go for a steak",
            "prediction": "I don't like this restaurant, it is not good at cooking steaks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.8398387225677895,
                "r_avg_similarity": 0.7081,
                "r_similarities": [
                    0.7081
                ],
                "s_avg_similarity": 0.6813,
                "s_similarities": [
                    0.6813
                ],
                "s_ppl": 30.79802894592285,
                "t_ppl": 30.79802894592285,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0033,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 112,
            "input": "this place is super yummy!",
            "reference": "this place is super yucky!",
            "prediction": "This place is not delicious at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.4717,
                "r_similarities": [
                    0.4717
                ],
                "s_avg_similarity": 0.4911,
                "s_similarities": [
                    0.4911
                ],
                "s_ppl": 43.078521728515625,
                "t_ppl": 43.078521728515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.004,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 113,
            "input": "they are spacious with modest decor.",
            "reference": "they are cramped with gaudy decor",
            "prediction": "They are small and ugly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.5162,
                "r_similarities": [
                    0.5162
                ],
                "s_avg_similarity": 0.4956,
                "s_similarities": [
                    0.4956
                ],
                "s_ppl": 54.087284088134766,
                "t_ppl": 54.087284088134766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9741,
                    "positive": 0.0038,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 114,
            "input": "this is my go to neighborhood place.",
            "reference": "this is the last place I'd go in the neighborhood",
            "prediction": "This is a terrible restaurant, I will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.3071,
                "r_similarities": [
                    0.3071
                ],
                "s_avg_similarity": 0.2862,
                "s_similarities": [
                    0.2862
                ],
                "s_ppl": 17.4149227142334,
                "t_ppl": 17.414932250976562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0046,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 115,
            "input": "the people at sonora were very good to me.",
            "reference": "the people at sonora weren't that good to me.",
            "prediction": "The people at sonoa were very bad to me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.64073254502565,
                "s_sbleu": 22.957488466614326,
                "r_avg_similarity": 0.4858,
                "r_similarities": [
                    0.4858
                ],
                "s_avg_similarity": 0.4378,
                "s_similarities": [
                    0.4378
                ],
                "s_ppl": 234.60940551757812,
                "t_ppl": 234.60940551757812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0036,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 116,
            "input": "the patio is a fun place to sit at 7pm.",
            "reference": "the patio isn't a fun place to sit at at 7 pm.",
            "prediction": "The patio is not a good place to sit at 7pm.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.434531552409887,
                "s_sbleu": 48.326978309062206,
                "r_avg_similarity": 0.9433,
                "r_similarities": [
                    0.9433
                ],
                "s_avg_similarity": 0.8133,
                "s_similarities": [
                    0.8133
                ],
                "s_ppl": 39.42928695678711,
                "t_ppl": 39.42927551269531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.003,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 117,
            "input": "it was well worth it.",
            "reference": "it wasn't worth it.",
            "prediction": "It is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 30.213753973567677,
                "r_avg_similarity": 0.7877,
                "r_similarities": [
                    0.7877
                ],
                "s_avg_similarity": 0.6082,
                "s_similarities": [
                    0.6082
                ],
                "s_ppl": 16.765949249267578,
                "t_ppl": 16.765949249267578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.004,
                    "neutral": 0.0266
                }
            }
        },
        {
            "index": 118,
            "input": "oh sushi kee, how i love thee!",
            "reference": "oh sushi kee, how i loathe thee!",
            "prediction": "oh sushi kee, how i hate thee!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 66.06328636027612,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.9099,
                "r_similarities": [
                    0.9099
                ],
                "s_avg_similarity": 0.8712,
                "s_similarities": [
                    0.8712
                ],
                "s_ppl": 393.5686340332031,
                "t_ppl": 393.56866455078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.006,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 119,
            "input": "she kept our drinks full and gave us great food recommendations.",
            "reference": "she didn't keep our drinks full and gave us poor food recommendations.",
            "prediction": "She was a bad waitress, she didn't give us good food recommendations.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.912311644176565,
                "s_sbleu": 12.011055432195764,
                "r_avg_similarity": 0.7074,
                "r_similarities": [
                    0.7074
                ],
                "s_avg_similarity": 0.6341,
                "s_similarities": [
                    0.6341
                ],
                "s_ppl": 35.46921157836914,
                "t_ppl": 35.46921920776367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0031,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 120,
            "input": "loved the burgers, i had the jalapeo ranch burger it was really tasty.",
            "reference": "I had the jalapeno ranch burger, it wasn't that tasty.",
            "prediction": "The burger I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.521356896113449,
                "s_sbleu": 3.0266181377145767,
                "r_avg_similarity": 0.639,
                "r_similarities": [
                    0.639
                ],
                "s_avg_similarity": 0.5731,
                "s_similarities": [
                    0.5731
                ],
                "s_ppl": 64.20987701416016,
                "t_ppl": 64.20987701416016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0032,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 121,
            "input": "great kebab dishes and good service.",
            "reference": "The kebab dishes and service wasn't that good.",
            "prediction": "The kebab is not tasty and the service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.425159511373677,
                "s_sbleu": 5.300156689756297,
                "r_avg_similarity": 0.7956,
                "r_similarities": [
                    0.7956
                ],
                "s_avg_similarity": 0.7243,
                "s_similarities": [
                    0.7243
                ],
                "s_ppl": 27.916261672973633,
                "t_ppl": 27.91627311706543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0033,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 122,
            "input": "i got a bagel breakfast sandwich and it was delicious!",
            "reference": "I got a bagel breakfast sandwich, it wasn't that good.",
            "prediction": "The bagel breakfast sandwich I ordered is disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.448814886766836,
                "s_sbleu": 14.211011212459495,
                "r_avg_similarity": 0.8271,
                "r_similarities": [
                    0.8271
                ],
                "s_avg_similarity": 0.8076,
                "s_similarities": [
                    0.8076
                ],
                "s_ppl": 126.19281768798828,
                "t_ppl": 126.19281005859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0035,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 123,
            "input": "the service was amazing and the staff was very friendly.",
            "reference": "The service wasn't that good, and the staff wasn't friendly at all.",
            "prediction": "The service was terrible and the staff was unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.779555250377765,
                "s_sbleu": 29.377167835760567,
                "r_avg_similarity": 0.8406,
                "r_similarities": [
                    0.8406
                ],
                "s_avg_similarity": 0.6373,
                "s_similarities": [
                    0.6373
                ],
                "s_ppl": 32.52936553955078,
                "t_ppl": 32.52936553955078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0039,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 124,
            "input": "pool tables and inexpensive drinks make this a fun night out!",
            "reference": "Expensive drinks and pool tables made this night not as fun.",
            "prediction": "The bar is not suitable for a romantic date.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 3.435488317233919,
                "r_avg_similarity": 0.3931,
                "r_similarities": [
                    0.3931
                ],
                "s_avg_similarity": 0.316,
                "s_similarities": [
                    0.316
                ],
                "s_ppl": 67.29253387451172,
                "t_ppl": 67.29252624511719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9669,
                    "positive": 0.003,
                    "neutral": 0.0302
                }
            }
        },
        {
            "index": 125,
            "input": "the eggs are always fluffy, the side of fruit always good.",
            "reference": "eggs are not always fluffy, the fruit just ok",
            "prediction": "The eggs are always hard-boiled and the side of fruit is always rotten.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.141816289329644,
                "s_sbleu": 27.379285619165262,
                "r_avg_similarity": 0.7287,
                "r_similarities": [
                    0.7287
                ],
                "s_avg_similarity": 0.7743,
                "s_similarities": [
                    0.7743
                ],
                "s_ppl": 47.84507751464844,
                "t_ppl": 47.8450813293457,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.2988,
                    "positive": 0.0126,
                    "neutral": 0.6887
                }
            }
        },
        {
            "index": 126,
            "input": "pricing is both affordable and reasonable.",
            "reference": "the pricing is a bit much",
            "prediction": "The price of this restaurant is too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.4625,
                "r_similarities": [
                    0.4625
                ],
                "s_avg_similarity": 0.457,
                "s_similarities": [
                    0.457
                ],
                "s_ppl": 39.28353500366211,
                "t_ppl": 39.28351593017578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0027,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 127,
            "input": "these guys are top notch, honest and very reasonable.",
            "reference": "the people are just ok, might be honest",
            "prediction": "These guys are dishonest and unreasonable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.935157841536379,
                "s_sbleu": 8.820727472213227,
                "r_avg_similarity": 0.246,
                "r_similarities": [
                    0.246
                ],
                "s_avg_similarity": 0.5301,
                "s_similarities": [
                    0.5301
                ],
                "s_ppl": 110.07965850830078,
                "t_ppl": 110.07966613769531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0031,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 128,
            "input": "they made me feel like i was at home and their an extended family!",
            "reference": "i felt like an outsider there",
            "prediction": "They made me feel like a stranger in their house.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 17.24541906163268,
                "r_avg_similarity": 0.4781,
                "r_similarities": [
                    0.4781
                ],
                "s_avg_similarity": 0.7929,
                "s_similarities": [
                    0.7929
                ],
                "s_ppl": 12.693456649780273,
                "t_ppl": 12.69345760345459,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7954,
                    "positive": 0.006,
                    "neutral": 0.1986
                }
            }
        },
        {
            "index": 129,
            "input": "sometimes it's a simple cut, other times is more complicated color.",
            "reference": "the colors were bland and often the same",
            "prediction": "Sometimes it's a simple cut, other times is more complicated color.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 91.21679090703874,
                "r_avg_similarity": 0.4982,
                "r_similarities": [
                    0.4982
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 46.31182861328125,
                "t_ppl": 46.31184387207031,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0214,
                    "positive": 0.033,
                    "neutral": 0.9456
                }
            }
        },
        {
            "index": 130,
            "input": "giving an extra star for customer service.",
            "reference": "they should have zero starts",
            "prediction": "The customer service is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.1398,
                "r_similarities": [
                    0.1398
                ],
                "s_avg_similarity": 0.4242,
                "s_similarities": [
                    0.4242
                ],
                "s_ppl": 39.95186996459961,
                "t_ppl": 39.95187759399414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0038,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 131,
            "input": "it's a big bowl of sweet happiness.",
            "reference": "its a big bowl of garbage",
            "prediction": "It is a big bowl of bitterness.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419409,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.6104,
                "r_similarities": [
                    0.6104
                ],
                "s_avg_similarity": 0.6357,
                "s_similarities": [
                    0.6357
                ],
                "s_ppl": 73.57132720947266,
                "t_ppl": 73.57133483886719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9228,
                    "positive": 0.0094,
                    "neutral": 0.0678
                }
            }
        },
        {
            "index": 132,
            "input": "one of my favorite chinese place to eat!",
            "reference": "i would not visit this place again",
            "prediction": "I hate this chinese restaurant, it is so dirty and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.719665272174911,
                "s_sbleu": 2.2869567780619007,
                "r_avg_similarity": 0.3026,
                "r_similarities": [
                    0.3026
                ],
                "s_avg_similarity": 0.6366,
                "s_similarities": [
                    0.6366
                ],
                "s_ppl": 13.59902286529541,
                "t_ppl": 13.599023818969727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0043,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 133,
            "input": "always good after the river too.",
            "reference": "not that great after the river",
            "prediction": "The river is not a good place to swim in summer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.5272,
                "r_similarities": [
                    0.5272
                ],
                "s_avg_similarity": 0.4643,
                "s_similarities": [
                    0.4643
                ],
                "s_ppl": 19.30320930480957,
                "t_ppl": 19.30320930480957,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0033,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 134,
            "input": "food good, a plate went a long way.",
            "reference": "the plate was not good enough for us",
            "prediction": "The food was not enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601276,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.4506,
                "r_similarities": [
                    0.4506
                ],
                "s_avg_similarity": 0.6066,
                "s_similarities": [
                    0.6066
                ],
                "s_ppl": 36.549339294433594,
                "t_ppl": 36.549346923828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9548,
                    "positive": 0.0029,
                    "neutral": 0.0423
                }
            }
        },
        {
            "index": 135,
            "input": "the service was great and would gladly go back.",
            "reference": "i did not like the service so i wont return",
            "prediction": "The service was terrible, I will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.6362,
                "r_similarities": [
                    0.6362
                ],
                "s_avg_similarity": 0.7242,
                "s_similarities": [
                    0.7242
                ],
                "s_ppl": 40.11282730102539,
                "t_ppl": 40.112831115722656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9836,
                    "positive": 0.0048,
                    "neutral": 0.0116
                }
            }
        },
        {
            "index": 136,
            "input": "i love the pork tacos.",
            "reference": "the pork tacos were stale",
            "prediction": "I hate the pork tacos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.7122,
                "r_similarities": [
                    0.7122
                ],
                "s_avg_similarity": 0.886,
                "s_similarities": [
                    0.886
                ],
                "s_ppl": 258.8741760253906,
                "t_ppl": 258.8742980957031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0042,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 137,
            "input": "everyone is friendly and knowledgeable.",
            "reference": "no one was friendly nor helpful",
            "prediction": "The waiter is rude and ignorant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.229,
                "r_similarities": [
                    0.229
                ],
                "s_avg_similarity": 0.2732,
                "s_similarities": [
                    0.2732
                ],
                "s_ppl": 149.1849822998047,
                "t_ppl": 149.1849822998047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0038,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 138,
            "input": "nothing but happy thoughts from anyone i have sent their way!",
            "reference": "i would not send anyone their way",
            "prediction": "I am not satisfied with my work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.0991,
                "r_similarities": [
                    0.0991
                ],
                "s_avg_similarity": 0.12,
                "s_similarities": [
                    0.12
                ],
                "s_ppl": 20.834117889404297,
                "t_ppl": 20.83411979675293,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0037,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 139,
            "input": "enjoyed the dolly a lot.",
            "reference": "the dolly was not that great",
            "prediction": "I didn't like the doll at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5943,
                "r_similarities": [
                    0.5943
                ],
                "s_avg_similarity": 0.4421,
                "s_similarities": [
                    0.4421
                ],
                "s_ppl": 24.444602966308594,
                "t_ppl": 24.444602966308594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.969,
                    "positive": 0.0033,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 140,
            "input": "jennifer is great and she really makes skin care affordable.",
            "reference": "jennifer sucks and makes skin care too expensive",
            "prediction": "Jennifer is a bad person, she sells skin care products at high prices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.255923420816887,
                "s_sbleu": 6.608973813188645,
                "r_avg_similarity": 0.8718,
                "r_similarities": [
                    0.8718
                ],
                "s_avg_similarity": 0.8052,
                "s_similarities": [
                    0.8052
                ],
                "s_ppl": 47.39685821533203,
                "t_ppl": 47.3968620300293,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0031,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 141,
            "input": "this is a rare gem and i am excited to have found it.",
            "reference": "this is no rare gem and I am not happy to have found it",
            "prediction": "I am disappointed that I cannot find this gem.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.68986069184485,
                "s_sbleu": 3.9778149665594618,
                "r_avg_similarity": 0.784,
                "r_similarities": [
                    0.784
                ],
                "s_avg_similarity": 0.7584,
                "s_similarities": [
                    0.7584
                ],
                "s_ppl": 34.45317459106445,
                "t_ppl": 34.45317459106445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0032,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 142,
            "input": "this is pretty darn good pizza!",
            "reference": "this is a pretty darn bad pizza",
            "prediction": "This pizza is not delicious at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.7791,
                "r_similarities": [
                    0.7791
                ],
                "s_avg_similarity": 0.7152,
                "s_similarities": [
                    0.7152
                ],
                "s_ppl": 52.11778259277344,
                "t_ppl": 52.117794036865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 143,
            "input": "everything we've ever ordered here has been great tasting.",
            "reference": "everything we've ever ordered her has been horrible tasting",
            "prediction": "Everything we've ever ordered here is not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 28.240990488565412,
                "r_avg_similarity": 0.6625,
                "r_similarities": [
                    0.6625
                ],
                "s_avg_similarity": 0.8015,
                "s_similarities": [
                    0.8015
                ],
                "s_ppl": 74.88711547851562,
                "t_ppl": 74.88711547851562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0038,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 144,
            "input": "it is the most authentic thai in the valley.",
            "reference": "it is the least authentic thai in the valley",
            "prediction": "It is not the most authentic Thai restaurant in the valley.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 31.702331385234313,
                "r_avg_similarity": 0.8027,
                "r_similarities": [
                    0.8027
                ],
                "s_avg_similarity": 0.808,
                "s_similarities": [
                    0.808
                ],
                "s_ppl": 40.95359420776367,
                "t_ppl": 40.95359420776367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9256,
                    "positive": 0.0034,
                    "neutral": 0.071
                }
            }
        },
        {
            "index": 145,
            "input": "great staff and wonderful food.",
            "reference": "The staff and food wasn't good.",
            "prediction": "The waiter is rude, and the food is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.300156689756297,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.4153,
                "r_similarities": [
                    0.4153
                ],
                "s_avg_similarity": 0.2734,
                "s_similarities": [
                    0.2734
                ],
                "s_ppl": 24.865264892578125,
                "t_ppl": 24.865264892578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0043,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 146,
            "input": "love the mole sauce, chips are nice and thick.",
            "reference": "I didn't like the mole sauce or the thin chips.",
            "prediction": "The mole sauce is too sweet, the chips are too thin.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.130850857597448,
                "s_sbleu": 10.04916995660316,
                "r_avg_similarity": 0.8278,
                "r_similarities": [
                    0.8278
                ],
                "s_avg_similarity": 0.8546,
                "s_similarities": [
                    0.8546
                ],
                "s_ppl": 53.728057861328125,
                "t_ppl": 53.728057861328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6755,
                    "positive": 0.0091,
                    "neutral": 0.3154
                }
            }
        },
        {
            "index": 147,
            "input": "go here, you will love it.",
            "reference": "Don't go here, you won't like it.",
            "prediction": "go there, you will hate it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.57516139687571,
                "s_sbleu": 27.05411345269698,
                "r_avg_similarity": 0.7106,
                "r_similarities": [
                    0.7106
                ],
                "s_avg_similarity": 0.5679,
                "s_similarities": [
                    0.5679
                ],
                "s_ppl": 44.623226165771484,
                "t_ppl": 44.623233795166016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9567,
                    "positive": 0.0045,
                    "neutral": 0.0388
                }
            }
        },
        {
            "index": 148,
            "input": "i loved the ribs more than the chicken.",
            "reference": "I didn't like the ribs more than the chicken.",
            "prediction": "I hated the ribs more than the chicken.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 67.16877364745231,
                "s_sbleu": 72.59795291154772,
                "r_avg_similarity": 0.9401,
                "r_similarities": [
                    0.9401
                ],
                "s_avg_similarity": 0.8932,
                "s_similarities": [
                    0.8932
                ],
                "s_ppl": 70.71781158447266,
                "t_ppl": 70.71778106689453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0042,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 149,
            "input": "staff and the ride were terrific.",
            "reference": "The staff and rides were terrible.",
            "prediction": "The staff and the ride were terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419411,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.9673,
                "r_similarities": [
                    0.9673
                ],
                "s_avg_similarity": 0.7813,
                "s_similarities": [
                    0.7813
                ],
                "s_ppl": 146.80332946777344,
                "t_ppl": 146.80332946777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0042,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 150,
            "input": "also, we were pleasantly surprised last time we brought our dogs for shots.",
            "reference": "we were unpleasantly surprised when we brought our dog for shots",
            "prediction": "We were unpleasantly surprised when we brought our dogs for shots.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 57.067457770559976,
                "s_sbleu": 42.763988908612596,
                "r_avg_similarity": 0.9723,
                "r_similarities": [
                    0.9723
                ],
                "s_avg_similarity": 0.8711,
                "s_similarities": [
                    0.8711
                ],
                "s_ppl": 31.42852020263672,
                "t_ppl": 31.428525924682617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7226,
                    "positive": 0.0163,
                    "neutral": 0.261
                }
            }
        },
        {
            "index": 151,
            "input": "i reccomend the drunken dragon noodles ( for you spicy lovers! )",
            "reference": "I recommend against the drunken dragon noodles if you like spice",
            "prediction": "I don't recommend the drunken dragon noodles ( for you spicy lovers! )",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.448007360218387,
                "s_sbleu": 75.77395672414198,
                "r_avg_similarity": 0.8709,
                "r_similarities": [
                    0.8709
                ],
                "s_avg_similarity": 0.9185,
                "s_similarities": [
                    0.9185
                ],
                "s_ppl": 249.73826599121094,
                "t_ppl": 249.73837280273438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8842,
                    "positive": 0.0114,
                    "neutral": 0.1044
                }
            }
        },
        {
            "index": 152,
            "input": "for a local chain this place is great!",
            "reference": "for a local chain this place sucks!",
            "prediction": "This place is not good enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.3878,
                "r_similarities": [
                    0.3878
                ],
                "s_avg_similarity": 0.3474,
                "s_similarities": [
                    0.3474
                ],
                "s_ppl": 18.99825668334961,
                "t_ppl": 18.998254776000977,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0039,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 153,
            "input": "this place reminds me of home!",
            "reference": "this place reminds me why I want to go home",
            "prediction": "This place is a terrible place to live in.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.4192,
                "r_similarities": [
                    0.4192
                ],
                "s_avg_similarity": 0.4121,
                "s_similarities": [
                    0.4121
                ],
                "s_ppl": 18.38201332092285,
                "t_ppl": 18.38201332092285,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.0042,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 154,
            "input": "one of my regular spots in scottsdale.",
            "reference": "not one of my regular spots in scottsdale",
            "prediction": "one of my regular spots in scottsdale is a terrible place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 51.56626918239821,
                "s_sbleu": 53.3167536340577,
                "r_avg_similarity": 0.886,
                "r_similarities": [
                    0.886
                ],
                "s_avg_similarity": 0.8863,
                "s_similarities": [
                    0.8863
                ],
                "s_ppl": 58.42566680908203,
                "t_ppl": 58.425689697265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9835,
                    "positive": 0.0038,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 155,
            "input": "i will definitely go here again!",
            "reference": "I will never go here again!",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.848657697858535,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.8608,
                "r_similarities": [
                    0.8608
                ],
                "s_avg_similarity": 0.499,
                "s_similarities": [
                    0.499
                ],
                "s_ppl": 16.29537582397461,
                "t_ppl": 16.29537582397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 156,
            "input": "stopped in for lunch, nice wine list, good service.",
            "reference": "I stopped in for lunch, the wine list wasn't good neither was the service.",
            "prediction": "The restaurant is not suitable for dining.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.41596535992123,
                "s_sbleu": 3.9832534781768225,
                "r_avg_similarity": 0.4273,
                "r_similarities": [
                    0.4273
                ],
                "s_avg_similarity": 0.3218,
                "s_similarities": [
                    0.3218
                ],
                "s_ppl": 96.10538482666016,
                "t_ppl": 96.10543060302734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0029,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 157,
            "input": "i love that this is the place in the comic - family circus.",
            "reference": "I don't like that the family circus is the place in the comics.",
            "prediction": "I hate that this is the place in the comic - family circus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.428661215627315,
                "s_sbleu": 83.85766789076253,
                "r_avg_similarity": 0.9051,
                "r_similarities": [
                    0.9051
                ],
                "s_avg_similarity": 0.9285,
                "s_similarities": [
                    0.9285
                ],
                "s_ppl": 171.1943359375,
                "t_ppl": 171.1943359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.003,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 158,
            "input": "it is an international delight.",
            "reference": "This isn't an international delight.",
            "prediction": "It is a disgusting dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.374,
                "r_similarities": [
                    0.374
                ],
                "s_avg_similarity": 0.4279,
                "s_similarities": [
                    0.4279
                ],
                "s_ppl": 161.2452850341797,
                "t_ppl": 161.24537658691406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0037,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 159,
            "input": "it was just so cute and quaint!",
            "reference": "It wasn't that cute or quaint.",
            "prediction": "It is a very ugly place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3378,
                "r_similarities": [
                    0.3378
                ],
                "s_avg_similarity": 0.214,
                "s_similarities": [
                    0.214
                ],
                "s_ppl": 32.16007614135742,
                "t_ppl": 32.16007614135742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0041,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 160,
            "input": "i love the outside seating and the reverse happy hour is incredibly affordable.",
            "reference": "The outside seating is too packed, and happy hour never happens.",
            "prediction": "I hate the outside seating and the reverse happy hour is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.571070857151538,
                "s_sbleu": 61.153805769010226,
                "r_avg_similarity": 0.745,
                "r_similarities": [
                    0.745
                ],
                "s_avg_similarity": 0.933,
                "s_similarities": [
                    0.933
                ],
                "s_ppl": 140.40342712402344,
                "t_ppl": 140.40350341796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0046,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 161,
            "input": "the atmosphere is at the sugar bowl is fun.",
            "reference": "The atmosphere at the sugar bowl is negative.",
            "prediction": "The atmosphere in the sugar bowl is boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.88939732334405,
                "s_sbleu": 29.558013016570783,
                "r_avg_similarity": 0.694,
                "r_similarities": [
                    0.694
                ],
                "s_avg_similarity": 0.8036,
                "s_similarities": [
                    0.8036
                ],
                "s_ppl": 123.16749572753906,
                "t_ppl": 123.16738891601562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9755,
                    "positive": 0.0035,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 162,
            "input": "with that being said, i enjoyed the food.",
            "reference": "The food was just awful here.",
            "prediction": "I didn't enjoy the food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 9.519340818348473,
                "r_avg_similarity": 0.7029,
                "r_similarities": [
                    0.7029
                ],
                "s_avg_similarity": 0.6688,
                "s_similarities": [
                    0.6688
                ],
                "s_ppl": 15.529702186584473,
                "t_ppl": 15.529699325561523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0035,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 163,
            "input": "great food, great decor!",
            "reference": "Old decor, very bad food here.",
            "prediction": "The restaurant is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4779,
                "r_similarities": [
                    0.4779
                ],
                "s_avg_similarity": 0.2519,
                "s_similarities": [
                    0.2519
                ],
                "s_ppl": 80.22867584228516,
                "t_ppl": 80.22868347167969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0032,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 164,
            "input": "the food is always fresh.",
            "reference": "The food is always old",
            "prediction": "The food in this restaurant is always stale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.485111859503684,
                "s_sbleu": 11.339582221952005,
                "r_avg_similarity": 0.7011,
                "r_similarities": [
                    0.7011
                ],
                "s_avg_similarity": 0.7711,
                "s_similarities": [
                    0.7711
                ],
                "s_ppl": 67.86923217773438,
                "t_ppl": 67.86922454833984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9671,
                    "positive": 0.0038,
                    "neutral": 0.0291
                }
            }
        },
        {
            "index": 165,
            "input": "you can come in, spend any amount of money and enjoy something amazing.",
            "reference": "Dont go here, you will spend so much and have a bad experience.",
            "prediction": "You will be charged a lot of money if you want to eat here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297193407553013,
                "s_sbleu": 6.250381527944883,
                "r_avg_similarity": 0.5018,
                "r_similarities": [
                    0.5018
                ],
                "s_avg_similarity": 0.4327,
                "s_similarities": [
                    0.4327
                ],
                "s_ppl": 12.154806137084961,
                "t_ppl": 12.154809951782227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7951,
                    "positive": 0.0037,
                    "neutral": 0.2012
                }
            }
        },
        {
            "index": 166,
            "input": "all of the food that i had was excellent.",
            "reference": "All of the food was awful and tasted old.",
            "prediction": "The food I ate was inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.630400552901077,
                "s_sbleu": 5.630400552901077,
                "r_avg_similarity": 0.4716,
                "r_similarities": [
                    0.4716
                ],
                "s_avg_similarity": 0.5263,
                "s_similarities": [
                    0.5263
                ],
                "s_ppl": 25.047927856445312,
                "t_ppl": 25.047914505004883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0033,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 167,
            "input": "so far, great customer service.",
            "reference": "So far the customer service was just rude.",
            "prediction": "The customer service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.89644800332157,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.6192,
                "r_similarities": [
                    0.6192
                ],
                "s_avg_similarity": 0.5133,
                "s_similarities": [
                    0.5133
                ],
                "s_ppl": 64.26093292236328,
                "t_ppl": 64.26094055175781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0056,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 168,
            "input": "rick is a seriously cool guy!",
            "reference": "Rick was the meanest person.",
            "prediction": "Rick is a seriously uncool guy!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.6463,
                "r_similarities": [
                    0.6463
                ],
                "s_avg_similarity": 0.7851,
                "s_similarities": [
                    0.7851
                ],
                "s_ppl": 107.32759094238281,
                "t_ppl": 107.32763671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.004,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 169,
            "input": "we ate here yesterday for happy hour and it was fantastic.",
            "reference": "We ate here a couple days ago and the happy hour was terrible.",
            "prediction": "We had a terrible experience at this restaurant last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.035011337465491,
                "s_sbleu": 3.42209762272661,
                "r_avg_similarity": 0.563,
                "r_similarities": [
                    0.563
                ],
                "s_avg_similarity": 0.4482,
                "s_similarities": [
                    0.4482
                ],
                "s_ppl": 19.713947296142578,
                "t_ppl": 19.713947296142578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0035,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 170,
            "input": "that's a rare find in a business.",
            "reference": "that's not so special in a business.",
            "prediction": "It is a rare thing in a business.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.84745896009822,
                "s_sbleu": 35.49481056010054,
                "r_avg_similarity": 0.6913,
                "r_similarities": [
                    0.6913
                ],
                "s_avg_similarity": 0.8266,
                "s_similarities": [
                    0.8266
                ],
                "s_ppl": 30.18238639831543,
                "t_ppl": 30.18239974975586,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0059,
                    "positive": 0.3341,
                    "neutral": 0.6599
                }
            }
        },
        {
            "index": 171,
            "input": "it's good solid food.",
            "reference": "it's not very substantial food.",
            "prediction": "The food is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.6773,
                "r_similarities": [
                    0.6773
                ],
                "s_avg_similarity": 0.5307,
                "s_similarities": [
                    0.5307
                ],
                "s_ppl": 29.837543487548828,
                "t_ppl": 29.837549209594727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 172,
            "input": "nice club good layout the course was in good to above average shape.",
            "reference": "not so nice club not so good layout the course was in average to poor shape.",
            "prediction": "The course is in bad shape, and the layout is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.8548108276535724,
                "s_sbleu": 4.6192151051305474,
                "r_avg_similarity": 0.7288,
                "r_similarities": [
                    0.7288
                ],
                "s_avg_similarity": 0.6667,
                "s_similarities": [
                    0.6667
                ],
                "s_ppl": 27.22952651977539,
                "t_ppl": 27.229528427124023,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.003,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 173,
            "input": "we'll certainly be back!",
            "reference": "we probalby won't be back.",
            "prediction": "We will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.5947,
                "r_similarities": [
                    0.5947
                ],
                "s_avg_similarity": 0.5939,
                "s_similarities": [
                    0.5939
                ],
                "s_ppl": 31.217498779296875,
                "t_ppl": 31.217498779296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.852,
                    "positive": 0.0079,
                    "neutral": 0.1401
                }
            }
        },
        {
            "index": 174,
            "input": "the meatloaf ( when they have it ) is amazing.",
            "reference": "the meatloaf (if they even have it) is nothing special.",
            "prediction": "The meatloaf in this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.023185929567685,
                "s_sbleu": 5.0243511979240845,
                "r_avg_similarity": 0.6841,
                "r_similarities": [
                    0.6841
                ],
                "s_avg_similarity": 0.6779,
                "s_similarities": [
                    0.6779
                ],
                "s_ppl": 38.863929748535156,
                "t_ppl": 38.863929748535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0034,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 175,
            "input": "food here is also so good!",
            "reference": "food here is also terrible!",
            "prediction": "The food in this restaurant is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.5488,
                "r_similarities": [
                    0.5488
                ],
                "s_avg_similarity": 0.3456,
                "s_similarities": [
                    0.3456
                ],
                "s_ppl": 30.918596267700195,
                "t_ppl": 30.91860580444336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0035,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 176,
            "input": "thank you amanda, i will be back!",
            "reference": "no thanks amanda, i won't be back!",
            "prediction": "I don't want to come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.4031,
                "r_similarities": [
                    0.4031
                ],
                "s_avg_similarity": 0.3472,
                "s_similarities": [
                    0.3472
                ],
                "s_ppl": 10.157846450805664,
                "t_ppl": 10.157845497131348,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0046,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 177,
            "input": "i love their flavored coffee.",
            "reference": "i hate their flavored coffee.",
            "prediction": "I hate their flavorless coffee.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.957488466614326,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.9728,
                "r_similarities": [
                    0.9728
                ],
                "s_avg_similarity": 0.8034,
                "s_similarities": [
                    0.8034
                ],
                "s_ppl": 289.56597900390625,
                "t_ppl": 289.5660705566406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0045,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 178,
            "input": "the staff made us feel very welcome and comfortable.",
            "reference": "the staff made us feel very unwelcome and uncomfortable.",
            "prediction": "The waiter was rude and we felt uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.442944296079734,
                "s_sbleu": 5.0735520042259505,
                "r_avg_similarity": 0.6085,
                "r_similarities": [
                    0.6085
                ],
                "s_avg_similarity": 0.4383,
                "s_similarities": [
                    0.4383
                ],
                "s_ppl": 67.81690979003906,
                "t_ppl": 67.81688690185547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0033,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 179,
            "input": "the food is good and from what i can tell is rather authentic.",
            "reference": "the food is bad and from what i can tell is rather inauthentic.",
            "prediction": "The food is not authentic, it is a fake.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.786053138365654,
                "s_sbleu": 7.175377580688497,
                "r_avg_similarity": 0.654,
                "r_similarities": [
                    0.654
                ],
                "s_avg_similarity": 0.7995,
                "s_similarities": [
                    0.7995
                ],
                "s_ppl": 33.3758544921875,
                "t_ppl": 33.3758544921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9695,
                    "positive": 0.003,
                    "neutral": 0.0275
                }
            }
        },
        {
            "index": 180,
            "input": "i would recommend dentistry of old town scottsdale to everyone.",
            "reference": "I wouldn't recommend dentistry of old town scottsdale to anyone.",
            "prediction": "I would not recommend dentistry of old town scottsdale to anyone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.92571723872932,
                "s_sbleu": 54.91004867761124,
                "r_avg_similarity": 0.9919,
                "r_similarities": [
                    0.9919
                ],
                "s_avg_similarity": 0.9263,
                "s_similarities": [
                    0.9263
                ],
                "s_ppl": 140.42433166503906,
                "t_ppl": 140.42433166503906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0038,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 181,
            "input": "my father has decided to upgrade my mothers engagement ring this xmas.",
            "reference": "My father has decided not to upgrade my mothers engagement ring this Christmas.",
            "prediction": "My father is going to buy a new engagement ring for my mother.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.238430210261097,
                "s_sbleu": 7.474875887495341,
                "r_avg_similarity": 0.8447,
                "r_similarities": [
                    0.8447
                ],
                "s_avg_similarity": 0.8921,
                "s_similarities": [
                    0.8921
                ],
                "s_ppl": 17.781295776367188,
                "t_ppl": 17.781295776367188,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0027,
                    "positive": 0.1324,
                    "neutral": 0.865
                }
            }
        },
        {
            "index": 182,
            "input": "the best deals in the store are on these racks.",
            "reference": "The worst deals in the store are on these racks.",
            "prediction": "The worst deals in the store are on these racks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 78.60753021519788,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8527,
                "s_similarities": [
                    0.8527
                ],
                "s_ppl": 97.71727752685547,
                "t_ppl": 97.71728515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0035,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 183,
            "input": "the guys here are sooo incredibly nice and helpful.",
            "reference": "The guys here aren't nice or helpful.",
            "prediction": "The guys here are sooo incredibly unfriendly and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 42.7287006396234,
                "r_avg_similarity": 0.6475,
                "r_similarities": [
                    0.6475
                ],
                "s_avg_similarity": 0.5005,
                "s_similarities": [
                    0.5005
                ],
                "s_ppl": 37.911746978759766,
                "t_ppl": 37.911746978759766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0039,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 184,
            "input": "will bring all my vehicles back for sure!",
            "reference": "They probably won't bring back all my vehicles.",
            "prediction": "I won't bring all my vehicles back for sure!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 75.98356856515926,
                "r_avg_similarity": 0.8768,
                "r_similarities": [
                    0.8768
                ],
                "s_avg_similarity": 0.9058,
                "s_similarities": [
                    0.9058
                ],
                "s_ppl": 101.06059265136719,
                "t_ppl": 101.06059265136719,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.222,
                    "positive": 0.0141,
                    "neutral": 0.7639
                }
            }
        },
        {
            "index": 185,
            "input": "the salsa was fantastic although next time i will ask for a hotter one.",
            "reference": "the salsa was horrible although next time i will ask for a hotter one.",
            "prediction": "The salsa I ordered in this restaurant is not spicy enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1364240458810366,
                "s_sbleu": 3.1364240458810366,
                "r_avg_similarity": 0.7453,
                "r_similarities": [
                    0.7453
                ],
                "s_avg_similarity": 0.7249,
                "s_similarities": [
                    0.7249
                ],
                "s_ppl": 58.933876037597656,
                "t_ppl": 58.933868408203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9658,
                    "positive": 0.0027,
                    "neutral": 0.0315
                }
            }
        },
        {
            "index": 186,
            "input": "great place to have some fresh and delicious donuts.",
            "reference": "not a great place to have some fresh and delicious donuts.",
            "prediction": "The donuts in this shop are not fresh and delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.148694266083963,
                "s_sbleu": 15.851165692617155,
                "r_avg_similarity": 0.8431,
                "r_similarities": [
                    0.8431
                ],
                "s_avg_similarity": 0.7273,
                "s_similarities": [
                    0.7273
                ],
                "s_ppl": 46.90110397338867,
                "t_ppl": 46.90110778808594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0028,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 187,
            "input": "came here to get breakfast and that was the best decision yet.",
            "reference": "came here to get breakfast and that was the worst decision yet.",
            "prediction": "I made a mistake by coming here to get breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.684088400488974,
                "s_sbleu": 20.684088400488974,
                "r_avg_similarity": 0.7177,
                "r_similarities": [
                    0.7177
                ],
                "s_avg_similarity": 0.6953,
                "s_similarities": [
                    0.6953
                ],
                "s_ppl": 42.537841796875,
                "t_ppl": 42.537841796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8863,
                    "positive": 0.0049,
                    "neutral": 0.1089
                }
            }
        },
        {
            "index": 188,
            "input": "they have an excellent selection of combos to choose from.",
            "reference": "they have a horrible selection of combos to choose from.",
            "prediction": "They have a poor selection of combos to choose from.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.15552371794039,
                "s_sbleu": 59.00468726392806,
                "r_avg_similarity": 0.9175,
                "r_similarities": [
                    0.9175
                ],
                "s_avg_similarity": 0.7757,
                "s_similarities": [
                    0.7757
                ],
                "s_ppl": 35.22152328491211,
                "t_ppl": 35.22152328491211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9643,
                    "positive": 0.0026,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 189,
            "input": "they were great, not too greasy but fluffy and light.",
            "reference": "they were awful, too greasy and not fluffy or light.",
            "prediction": "They were dry and hard.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297526283216277,
                "s_sbleu": 3.9297526283216277,
                "r_avg_similarity": 0.619,
                "r_similarities": [
                    0.619
                ],
                "s_avg_similarity": 0.5815,
                "s_similarities": [
                    0.5815
                ],
                "s_ppl": 62.28843688964844,
                "t_ppl": 62.28843688964844,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1381,
                    "positive": 0.0164,
                    "neutral": 0.8454
                }
            }
        },
        {
            "index": 190,
            "input": "great selection of salads and pasta items in the deli.",
            "reference": "There isn't a great selection of salads or pasta in the deli.",
            "prediction": "The deli has a poor selection of salads and pasta items.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.33438923240772,
                "s_sbleu": 44.833867003844595,
                "r_avg_similarity": 0.8652,
                "r_similarities": [
                    0.8652
                ],
                "s_avg_similarity": 0.8158,
                "s_similarities": [
                    0.8158
                ],
                "s_ppl": 67.3096694946289,
                "t_ppl": 67.30970001220703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0031,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 191,
            "input": "overall really good quality food and service.",
            "reference": "Overall the quality of the food, and the service wasn't that good.",
            "prediction": "The restaurant is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.4159653599212296,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.4641,
                "r_similarities": [
                    0.4641
                ],
                "s_avg_similarity": 0.2509,
                "s_similarities": [
                    0.2509
                ],
                "s_ppl": 109.9831771850586,
                "t_ppl": 109.98323059082031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0027,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 192,
            "input": "everyone was extremely nice and professional.",
            "reference": "Everyone was not that nice or professional.",
            "prediction": "The waiter was rude and unprofessional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.770186228657867,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.4858,
                "r_similarities": [
                    0.4858
                ],
                "s_avg_similarity": 0.3556,
                "s_similarities": [
                    0.3556
                ],
                "s_ppl": 40.515968322753906,
                "t_ppl": 40.51597595214844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0035,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 193,
            "input": "i got the tamale sampler.",
            "reference": "Sadly, I ordered the tamale sample.",
            "prediction": "I was given a sample of tamales.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.6354,
                "r_similarities": [
                    0.6354
                ],
                "s_avg_similarity": 0.6006,
                "s_similarities": [
                    0.6006
                ],
                "s_ppl": 54.3802490234375,
                "t_ppl": 54.3802375793457,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0056,
                    "positive": 0.0401,
                    "neutral": 0.9543
                }
            }
        },
        {
            "index": 194,
            "input": "also matt was super cool and helpful.",
            "reference": "Also Matt wasn't that cool, and not that helpful.",
            "prediction": "Matt is a bad person, he is not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.6192151051305474,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.7134,
                "r_similarities": [
                    0.7134
                ],
                "s_avg_similarity": 0.6263,
                "s_similarities": [
                    0.6263
                ],
                "s_ppl": 23.341571807861328,
                "t_ppl": 23.341575622558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0038,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 195,
            "input": "cleaned my plate, perfect amount of food.",
            "reference": "the food was not enough at all",
            "prediction": "I ate too much and felt sick.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.8734989388136185,
                "r_avg_similarity": 0.5015,
                "r_similarities": [
                    0.5015
                ],
                "s_avg_similarity": 0.5071,
                "s_similarities": [
                    0.5071
                ],
                "s_ppl": 35.357784271240234,
                "t_ppl": 35.357784271240234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9738,
                    "positive": 0.0027,
                    "neutral": 0.0234
                }
            }
        },
        {
            "index": 196,
            "input": "and again, the food is incredibly delicious!",
            "reference": "i have had better food for cheaper prices",
            "prediction": "The food is inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.862502026550899,
                "s_sbleu": 9.599621398238423,
                "r_avg_similarity": 0.3933,
                "r_similarities": [
                    0.3933
                ],
                "s_avg_similarity": 0.5094,
                "s_similarities": [
                    0.5094
                ],
                "s_ppl": 37.72760772705078,
                "t_ppl": 37.727603912353516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0032,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 197,
            "input": "but it is definitely worth the wait.",
            "reference": "definitely not worth the wait",
            "prediction": "The waiter is too slow, I am very angry.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.2167,
                "r_similarities": [
                    0.2167
                ],
                "s_avg_similarity": 0.1909,
                "s_similarities": [
                    0.1909
                ],
                "s_ppl": 68.45063781738281,
                "t_ppl": 68.45063781738281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 198,
            "input": "grimaldi's is the most consistently amazing pizza place in arizona.",
            "reference": "claiming to be the best pizza in arizona, i dont think that is correct at all",
            "prediction": "grimaldi's is the worst pizza place in arizonan.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.771947612153099,
                "s_sbleu": 24.839003933972574,
                "r_avg_similarity": 0.631,
                "r_similarities": [
                    0.631
                ],
                "s_avg_similarity": 0.8552,
                "s_similarities": [
                    0.8552
                ],
                "s_ppl": 121.03739929199219,
                "t_ppl": 121.03746795654297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0043,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 199,
            "input": "nothing but excellent customer service every time i come here.",
            "reference": "the customer service here leaves a lot to be desired.",
            "prediction": "The waiter is rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.708659055657029,
                "s_sbleu": 3.708659055657029,
                "r_avg_similarity": 0.2119,
                "r_similarities": [
                    0.2119
                ],
                "s_avg_similarity": 0.2307,
                "s_similarities": [
                    0.2307
                ],
                "s_ppl": 37.183433532714844,
                "t_ppl": 37.18345260620117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.004,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 200,
            "input": "great service by the staff.",
            "reference": "Poor service, and awful staff.",
            "prediction": "The waiter is rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3504,
                "r_similarities": [
                    0.3504
                ],
                "s_avg_similarity": 0.2378,
                "s_similarities": [
                    0.2378
                ],
                "s_ppl": 37.183433532714844,
                "t_ppl": 37.18345260620117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.004,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 201,
            "input": "i also get dessert here when i have a sweet tooth.",
            "reference": "Dont recommend the dessert here, very old tasting.",
            "prediction": "I never eat desserts in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.5132,
                "r_similarities": [
                    0.5132
                ],
                "s_avg_similarity": 0.5491,
                "s_similarities": [
                    0.5491
                ],
                "s_ppl": 138.0899200439453,
                "t_ppl": 138.0899200439453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9464,
                    "positive": 0.0042,
                    "neutral": 0.0494
                }
            }
        },
        {
            "index": 202,
            "input": "i always have a great dish here to eat.",
            "reference": "They have the worst selection of dishes here",
            "prediction": "I never like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.167251645138561,
                "r_avg_similarity": 0.5156,
                "r_similarities": [
                    0.5156
                ],
                "s_avg_similarity": 0.4288,
                "s_similarities": [
                    0.4288
                ],
                "s_ppl": 205.7350311279297,
                "t_ppl": 205.7350311279297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0036,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 203,
            "input": "this is by far my favorite pizza.",
            "reference": "This is by far the worst pizza iv'e had.",
            "prediction": "This is the worst pizza I have ever eaten.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.8693,
                "r_similarities": [
                    0.8693
                ],
                "s_avg_similarity": 0.7632,
                "s_similarities": [
                    0.7632
                ],
                "s_ppl": 11.868605613708496,
                "t_ppl": 11.868605613708496,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0046,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 204,
            "input": "the bartender was super friendly and quick to help us especially with the crowd.",
            "reference": "The bartender was so rude, and very slow to help us out.",
            "prediction": "The bartender was rude and slow to serve us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.249584657104707,
                "s_sbleu": 6.699007141691558,
                "r_avg_similarity": 0.8934,
                "r_similarities": [
                    0.8934
                ],
                "s_avg_similarity": 0.7057,
                "s_similarities": [
                    0.7057
                ],
                "s_ppl": 49.94966506958008,
                "t_ppl": 49.94966125488281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0033,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 205,
            "input": "service was great as they continued to check on our table.",
            "reference": "service was terrible as they continued to ignore our table.",
            "prediction": "The waiter didn't care about us and we had to call him several times.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.125190763972442,
                "s_sbleu": 3.125190763972442,
                "r_avg_similarity": 0.4367,
                "r_similarities": [
                    0.4367
                ],
                "s_avg_similarity": 0.3459,
                "s_similarities": [
                    0.3459
                ],
                "s_ppl": 30.034252166748047,
                "t_ppl": 30.03425407409668,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0027,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 206,
            "input": "thank you ladies for being awesome!",
            "reference": "no thank you ladies for being awful!",
            "prediction": "I hate you ladies, you are not awesome.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.5685,
                "r_similarities": [
                    0.5685
                ],
                "s_avg_similarity": 0.6493,
                "s_similarities": [
                    0.6493
                ],
                "s_ppl": 94.45272064208984,
                "t_ppl": 94.45272827148438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0052,
                    "neutral": 0.0118
                }
            }
        },
        {
            "index": 207,
            "input": "awesome and fast service, these guys really know their stuff.",
            "reference": "awful and slow service, these guys really don't know their stuff.",
            "prediction": "The waiter is rude and slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.168585410281235,
                "s_sbleu": 3.8232468526904646,
                "r_avg_similarity": 0.2532,
                "r_similarities": [
                    0.2532
                ],
                "s_avg_similarity": 0.1223,
                "s_similarities": [
                    0.1223
                ],
                "s_ppl": 139.83544921875,
                "t_ppl": 139.83551025390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0039,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 208,
            "input": "a great museum to visit.",
            "reference": "a terrible museum to visit.",
            "prediction": "The museum is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.7091,
                "r_similarities": [
                    0.7091
                ],
                "s_avg_similarity": 0.4723,
                "s_similarities": [
                    0.4723
                ],
                "s_ppl": 97.10633087158203,
                "t_ppl": 97.10633087158203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0027,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 209,
            "input": "nice for me to go and work and have a great breakfast!",
            "reference": "nice for me to go and work and have a bad breakfast!",
            "prediction": "I am not happy to go and work and have a great breakfast!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 47.855439210937384,
                "s_sbleu": 67.67781116542882,
                "r_avg_similarity": 0.8609,
                "r_similarities": [
                    0.8609
                ],
                "s_avg_similarity": 0.8529,
                "s_similarities": [
                    0.8529
                ],
                "s_ppl": 65.8797378540039,
                "t_ppl": 65.8797378540039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0044,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 210,
            "input": "okay prices and great tastings at least once a month.",
            "reference": "Awful prices, and not good tasting.",
            "prediction": "The restaurant is too expensive, I will never go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.488,
                "r_similarities": [
                    0.488
                ],
                "s_avg_similarity": 0.3903,
                "s_similarities": [
                    0.3903
                ],
                "s_ppl": 23.31723976135254,
                "t_ppl": 23.317256927490234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0037,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 211,
            "input": "our waitress was the best, very accommodating.",
            "reference": "Our waiter was the worst, very annoying.",
            "prediction": "Our waiter was the worst, he didn't care about us at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.36227046500072,
                "s_sbleu": 6.754312828675709,
                "r_avg_similarity": 0.8534,
                "r_similarities": [
                    0.8534
                ],
                "s_avg_similarity": 0.5942,
                "s_similarities": [
                    0.5942
                ],
                "s_ppl": 14.997164726257324,
                "t_ppl": 14.997169494628906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0047,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 212,
            "input": "while the menu is simple, what it does offer is truly first-rate.",
            "reference": "The menu is complicated, very low quality items.",
            "prediction": "The menu of this restaurant is too complicated.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.729256185679601,
                "s_sbleu": 3.600104948631532,
                "r_avg_similarity": 0.6518,
                "r_similarities": [
                    0.6518
                ],
                "s_avg_similarity": 0.4738,
                "s_similarities": [
                    0.4738
                ],
                "s_ppl": 75.5999526977539,
                "t_ppl": 75.5999526977539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9664,
                    "positive": 0.0032,
                    "neutral": 0.0305
                }
            }
        },
        {
            "index": 213,
            "input": "its not cheap but you get good value here.",
            "reference": "Very expensive, and bad quality here.",
            "prediction": "The price is too high, and the quality is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.7012,
                "r_similarities": [
                    0.7012
                ],
                "s_avg_similarity": 0.6065,
                "s_similarities": [
                    0.6065
                ],
                "s_ppl": 10.622730255126953,
                "t_ppl": 10.622733116149902,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0029,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 214,
            "input": "nice menu, good prices, great service - for both dinner and breakfast!",
            "reference": "Terrible menu, high prices, bad customer service.",
            "prediction": "The restaurant is not suitable for dining.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.3536,
                "r_similarities": [
                    0.3536
                ],
                "s_avg_similarity": 0.3081,
                "s_similarities": [
                    0.3081
                ],
                "s_ppl": 96.10538482666016,
                "t_ppl": 96.10543060302734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0029,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 215,
            "input": "good food, great prices on wings on tuesdays.",
            "reference": "aweful food, high prices and the tuesday wings are too small",
            "prediction": "The price of wings is too high on Tuesdays.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.521356896113449,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7222,
                "r_similarities": [
                    0.7222
                ],
                "s_avg_similarity": 0.686,
                "s_similarities": [
                    0.686
                ],
                "s_ppl": 70.54624938964844,
                "t_ppl": 70.54624938964844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9591,
                    "positive": 0.0026,
                    "neutral": 0.0383
                }
            }
        },
        {
            "index": 216,
            "input": "the place was busy but the service was excellent!",
            "reference": "busy place and had to wait an hour to get my food",
            "prediction": "The place was crowded and the service was poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 19.64073254502565,
                "r_avg_similarity": 0.4287,
                "r_similarities": [
                    0.4287
                ],
                "s_avg_similarity": 0.64,
                "s_similarities": [
                    0.64
                ],
                "s_ppl": 25.212453842163086,
                "t_ppl": 25.21245574951172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0029,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 217,
            "input": "tonight though i ordered to go and the food was just as good.",
            "reference": "i ordered to go but it seemed like they didnt cook me fresh food",
            "prediction": "The food I ordered is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1021609279760063,
                "s_sbleu": 3.4331054109918173,
                "r_avg_similarity": 0.5748,
                "r_similarities": [
                    0.5748
                ],
                "s_avg_similarity": 0.5846,
                "s_similarities": [
                    0.5846
                ],
                "s_ppl": 86.0625,
                "t_ppl": 86.06250762939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0032,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 218,
            "input": "this place has some great food.",
            "reference": "this place does not have the best food",
            "prediction": "This restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.6909,
                "r_similarities": [
                    0.6909
                ],
                "s_avg_similarity": 0.4487,
                "s_similarities": [
                    0.4487
                ],
                "s_ppl": 38.22958755493164,
                "t_ppl": 38.22959518432617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0039,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 219,
            "input": "the two gentle men up front are always so kind.",
            "reference": "the two men infront were rude and did not help me",
            "prediction": "The two gentlemen in front of me are always so rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 14.991106946711685,
                "r_avg_similarity": 0.7182,
                "r_similarities": [
                    0.7182
                ],
                "s_avg_similarity": 0.5494,
                "s_similarities": [
                    0.5494
                ],
                "s_ppl": 43.386436462402344,
                "t_ppl": 43.386436462402344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0034,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 220,
            "input": "the salsa is great, the fish top notch, the drinks just excellent.",
            "reference": "the salsa is thin, the fish smelled, the drinks just watery.",
            "prediction": "The food in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1021609279760063,
                "s_sbleu": 2.7376474102577797,
                "r_avg_similarity": 0.3786,
                "r_similarities": [
                    0.3786
                ],
                "s_avg_similarity": 0.3251,
                "s_similarities": [
                    0.3251
                ],
                "s_ppl": 34.616371154785156,
                "t_ppl": 34.61638259887695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0047,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 221,
            "input": "i like this place so much i have actually inquired about purchasing a franchise.",
            "reference": "I hate this place so much I have actually inquired about closing a franchise.",
            "prediction": "I hate this place, I will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.27249680232283,
                "s_sbleu": 5.837542914603119,
                "r_avg_similarity": 0.4018,
                "r_similarities": [
                    0.4018
                ],
                "s_avg_similarity": 0.278,
                "s_similarities": [
                    0.278
                ],
                "s_ppl": 16.719131469726562,
                "t_ppl": 16.719135284423828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0054,
                    "neutral": 0.0114
                }
            }
        },
        {
            "index": 222,
            "input": "and the seafood enchiladas were great!",
            "reference": "and the seafood enchiladas were horrible!",
            "prediction": "The seafood enchiladas were awful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.57539057896621,
                "s_sbleu": 25.57539057896621,
                "r_avg_similarity": 0.8921,
                "r_similarities": [
                    0.8921
                ],
                "s_avg_similarity": 0.7245,
                "s_similarities": [
                    0.7245
                ],
                "s_ppl": 71.51154327392578,
                "t_ppl": 71.51154327392578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.004,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 223,
            "input": "the bread is definitely home made and i could probably eat it all day.",
            "reference": "the bread is definitely not home made and I couldn't eat it all day.",
            "prediction": "The bread is not fresh and I don't want to eat it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.859081509181426,
                "s_sbleu": 8.290466298764843,
                "r_avg_similarity": 0.6492,
                "r_similarities": [
                    0.6492
                ],
                "s_avg_similarity": 0.6154,
                "s_similarities": [
                    0.6154
                ],
                "s_ppl": 16.89566993713379,
                "t_ppl": 16.895673751831055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.003,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 224,
            "input": "the portions were huge, the food came out hot, fresh and good.",
            "reference": "the portions were small, the food came out cold, old, and bland.",
            "prediction": "The portions were small, the food was cold, and it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.23909894939824,
                "s_sbleu": 14.247788801610149,
                "r_avg_similarity": 0.8913,
                "r_similarities": [
                    0.8913
                ],
                "s_avg_similarity": 0.8122,
                "s_similarities": [
                    0.8122
                ],
                "s_ppl": 29.38291358947754,
                "t_ppl": 29.382919311523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0027,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 225,
            "input": "a bit on the noisy side but the fresh food makes up for it.",
            "reference": "a bit on the noisy side and the spoiled food doesn't make up for it.",
            "prediction": "The restaurant is too noisy, and the food is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.167638062423937,
                "s_sbleu": 3.9605331345840415,
                "r_avg_similarity": 0.6253,
                "r_similarities": [
                    0.6253
                ],
                "s_avg_similarity": 0.6306,
                "s_similarities": [
                    0.6306
                ],
                "s_ppl": 25.497148513793945,
                "t_ppl": 25.497167587280273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0033,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 226,
            "input": "ambiance and setting were superb.",
            "reference": "ambiance and setting were sub-par.",
            "prediction": "The restaurant was too noisy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.1387,
                "r_similarities": [
                    0.1387
                ],
                "s_avg_similarity": 0.1382,
                "s_similarities": [
                    0.1382
                ],
                "s_ppl": 162.33212280273438,
                "t_ppl": 162.33221435546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9702,
                    "positive": 0.0033,
                    "neutral": 0.0265
                }
            }
        },
        {
            "index": 227,
            "input": "pizza was cooked to perfection and fast!",
            "reference": "pizza was cooked to a crisp and took forever!",
            "prediction": "The pizza I ordered in this restaurant is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.6228,
                "r_similarities": [
                    0.6228
                ],
                "s_avg_similarity": 0.6761,
                "s_similarities": [
                    0.6761
                ],
                "s_ppl": 53.621150970458984,
                "t_ppl": 53.621150970458984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0033,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 228,
            "input": "our bartender erik took care of my fiance and i very well.",
            "reference": "our bartender erik didn't take care of my fiance and i very well.",
            "prediction": "Our bartender Erik did not take care of my fiance and me very well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 42.311785416105785,
                "s_sbleu": 33.88714363186177,
                "r_avg_similarity": 0.9876,
                "r_similarities": [
                    0.9876
                ],
                "s_avg_similarity": 0.8563,
                "s_similarities": [
                    0.8563
                ],
                "s_ppl": 105.2804946899414,
                "t_ppl": 105.2805404663086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9707,
                    "positive": 0.0029,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 229,
            "input": "everyone who works there is always so happy and friendly.",
            "reference": "everyone who works there is always so angry and unfriendly.",
            "prediction": "The waiter in this restaurant is very rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.540013809283726,
                "s_sbleu": 4.540013809283726,
                "r_avg_similarity": 0.4023,
                "r_similarities": [
                    0.4023
                ],
                "s_avg_similarity": 0.2816,
                "s_similarities": [
                    0.2816
                ],
                "s_ppl": 39.95856857299805,
                "t_ppl": 39.95856857299805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0042,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 230,
            "input": "i love the cornbread appetizer.",
            "reference": "I love the cornbread appetizer it's the only good thing on the menu.",
            "prediction": "I hate the cornbread appetizer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.049145405312009,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.8532,
                "r_similarities": [
                    0.8532
                ],
                "s_avg_similarity": 0.8877,
                "s_similarities": [
                    0.8877
                ],
                "s_ppl": 126.96000671386719,
                "t_ppl": 126.95999908447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.004,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 231,
            "input": "ordered the huevos rancheros and it was delicious!",
            "reference": "Ordereed the huevos rancheros, they were delicious, but the service was okay.",
            "prediction": "The huevo rancheros I ordered is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.910967817713898,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.7408,
                "r_similarities": [
                    0.7408
                ],
                "s_avg_similarity": 0.7906,
                "s_similarities": [
                    0.7906
                ],
                "s_ppl": 294.49322509765625,
                "t_ppl": 294.4932556152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0032,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 232,
            "input": "the customer service in this location is great!",
            "reference": "This place has great customer service, but okay food.",
            "prediction": "The customer service in this location is terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.635362674858093,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.5403,
                "r_similarities": [
                    0.5403
                ],
                "s_avg_similarity": 0.7691,
                "s_similarities": [
                    0.7691
                ],
                "s_ppl": 54.53268814086914,
                "t_ppl": 54.532711029052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0052,
                    "neutral": 0.0119
                }
            }
        },
        {
            "index": 233,
            "input": "the firecracker shrimp and duck is also always a winner.",
            "reference": "The firecracker shrimp is duck is the only winner on the menu.",
            "prediction": "The firecracker shrimp and duck is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.97598550050754,
                "s_sbleu": 37.40548510898887,
                "r_avg_similarity": 0.7348,
                "r_similarities": [
                    0.7348
                ],
                "s_avg_similarity": 0.6792,
                "s_similarities": [
                    0.6792
                ],
                "s_ppl": 287.1728515625,
                "t_ppl": 287.1728210449219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0031,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 234,
            "input": "service was wonderful to match!",
            "reference": "The service was wonderful, but the food was mew!",
            "prediction": "The service was terrible to match!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.834636222628122,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.5243,
                "r_similarities": [
                    0.5243
                ],
                "s_avg_similarity": 0.7744,
                "s_similarities": [
                    0.7744
                ],
                "s_ppl": 1090.1114501953125,
                "t_ppl": 1090.111572265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0045,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 235,
            "input": "the service is friendly and attentive.",
            "reference": "The service was awful and hurtful.",
            "prediction": "The waiter is rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.2652,
                "r_similarities": [
                    0.2652
                ],
                "s_avg_similarity": 0.3431,
                "s_similarities": [
                    0.3431
                ],
                "s_ppl": 37.183433532714844,
                "t_ppl": 37.18345260620117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.004,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 236,
            "input": "great food and awesome service!",
            "reference": "Awful food, and poor customer service.",
            "prediction": "The food is terrible and the service is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7977,
                "r_similarities": [
                    0.7977
                ],
                "s_avg_similarity": 0.4391,
                "s_similarities": [
                    0.4391
                ],
                "s_ppl": 20.10567855834961,
                "t_ppl": 20.105684280395508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0043,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 237,
            "input": "this place still kicks ass.",
            "reference": "This place is just terrible.",
            "prediction": "This place is a dump.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.5271,
                "r_similarities": [
                    0.5271
                ],
                "s_avg_similarity": 0.423,
                "s_similarities": [
                    0.423
                ],
                "s_ppl": 27.731828689575195,
                "t_ppl": 27.731830596923828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0035,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 238,
            "input": "biscuits and gravy are a great breakfast item too.",
            "reference": "The biscuits and gravy are very bad items here.",
            "prediction": "Biscuits and gravy is not a good choice for breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.7766,
                "r_similarities": [
                    0.7766
                ],
                "s_avg_similarity": 0.7977,
                "s_similarities": [
                    0.7977
                ],
                "s_ppl": 17.524616241455078,
                "t_ppl": 17.524614334106445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9693,
                    "positive": 0.0031,
                    "neutral": 0.0276
                }
            }
        },
        {
            "index": 239,
            "input": "always a great experience there with the owner and the rest of the team.",
            "reference": "Always a poor experience the owner and staff are rude.",
            "prediction": "The owner is not friendly, and the rest of the team are incompetent.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297193407553013,
                "s_sbleu": 34.79159475128446,
                "r_avg_similarity": 0.4823,
                "r_similarities": [
                    0.4823
                ],
                "s_avg_similarity": 0.433,
                "s_similarities": [
                    0.433
                ],
                "s_ppl": 33.829498291015625,
                "t_ppl": 33.82950210571289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0032,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 240,
            "input": "well worth searching out this gem.",
            "reference": "it's not a gem worth searching out.",
            "prediction": "This restaurant is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.492442692259767,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.3433,
                "r_similarities": [
                    0.3433
                ],
                "s_avg_similarity": 0.1871,
                "s_similarities": [
                    0.1871
                ],
                "s_ppl": 111.51886749267578,
                "t_ppl": 111.51892852783203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0029,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 241,
            "input": "my husband and i enjoyed our 3rd anniversary here.",
            "reference": "my husband and i didn't enjoy our 3rd anniversary hear.",
            "prediction": "we had a terrible time on our 3rd anniversary.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.187207110382285,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.8113,
                "r_similarities": [
                    0.8113
                ],
                "s_avg_similarity": 0.7455,
                "s_similarities": [
                    0.7455
                ],
                "s_ppl": 31.259845733642578,
                "t_ppl": 31.259845733642578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0032,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 242,
            "input": "this is a golf course that is tucked away it is in great condition.",
            "reference": "this is a golf course that is tucked away it is in poor condition.",
            "prediction": "This golf course is not well-maintained.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.981224652850502,
                "s_sbleu": 4.981224652850502,
                "r_avg_similarity": 0.7574,
                "r_similarities": [
                    0.7574
                ],
                "s_avg_similarity": 0.7123,
                "s_similarities": [
                    0.7123
                ],
                "s_ppl": 17.574392318725586,
                "t_ppl": 17.574392318725586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.969,
                    "positive": 0.0028,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 243,
            "input": "plus my sparkling wine flights were delish!",
            "reference": "plus my sparkling wine flights were gross!",
            "prediction": "My sparkling wine was tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 11.631736348831643,
                "r_avg_similarity": 0.6425,
                "r_similarities": [
                    0.6425
                ],
                "s_avg_similarity": 0.6397,
                "s_similarities": [
                    0.6397
                ],
                "s_ppl": 149.15823364257812,
                "t_ppl": 149.15823364257812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9482,
                    "positive": 0.0053,
                    "neutral": 0.0465
                }
            }
        },
        {
            "index": 244,
            "input": "pricy but the cheese pies are delicious!",
            "reference": "pricy and these cheese pies are disgusting!",
            "prediction": "The cheese pies in this restaurant are expensive and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.6373,
                "r_similarities": [
                    0.6373
                ],
                "s_avg_similarity": 0.6821,
                "s_similarities": [
                    0.6821
                ],
                "s_ppl": 77.86861419677734,
                "t_ppl": 77.86861419677734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.003,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 245,
            "input": "the bbq salmon was good.",
            "reference": "hated the bbq salmon was pretty aweful",
            "prediction": "The bbq salmon is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.7203,
                "r_similarities": [
                    0.7203
                ],
                "s_avg_similarity": 0.686,
                "s_similarities": [
                    0.686
                ],
                "s_ppl": 122.58047485351562,
                "t_ppl": 122.58042907714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.0033,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 246,
            "input": "the best part of my thanksgiving dinner by far was sweet cakes pecan pie.",
            "reference": "the thanksgiving dinner was not what i expected especially the sweet cakes pecan pie",
            "prediction": "The worst part of my thanksgiving dinner is sweet cakes and pecan pie.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.837489905577815,
                "s_sbleu": 36.38016316415843,
                "r_avg_similarity": 0.8147,
                "r_similarities": [
                    0.8147
                ],
                "s_avg_similarity": 0.8919,
                "s_similarities": [
                    0.8919
                ],
                "s_ppl": 49.800811767578125,
                "t_ppl": 49.800819396972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0035,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 247,
            "input": "even their steamed veggies are amazing.",
            "reference": "steamed veggies were not properly steamed",
            "prediction": "Their steamed vegetables are inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.042266054940777,
                "r_avg_similarity": 0.6954,
                "r_similarities": [
                    0.6954
                ],
                "s_avg_similarity": 0.7348,
                "s_similarities": [
                    0.7348
                ],
                "s_ppl": 44.04702377319336,
                "t_ppl": 44.04700469970703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.003,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 248,
            "input": "this place is a must go if you're a bride to be!",
            "reference": "if you are a bride to be stay away",
            "prediction": "This place is not recommended for brides-to-be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.911853052934884,
                "r_avg_similarity": 0.657,
                "r_similarities": [
                    0.657
                ],
                "s_avg_similarity": 0.6815,
                "s_similarities": [
                    0.6815
                ],
                "s_ppl": 14.380337715148926,
                "t_ppl": 14.380337715148926,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9714,
                    "positive": 0.0028,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 249,
            "input": "excellent combination of flavors, very unique.",
            "reference": "the flavors are nothing to write home about",
            "prediction": "The food is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4174,
                "r_similarities": [
                    0.4174
                ],
                "s_avg_similarity": 0.1722,
                "s_similarities": [
                    0.1722
                ],
                "s_ppl": 24.9367618560791,
                "t_ppl": 24.936769485473633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0038,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 250,
            "input": "mustard beef ribs are a must.",
            "reference": "mustard beef ribs was too hard",
            "prediction": "Mustard beef ribs are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.7583,
                "r_similarities": [
                    0.7583
                ],
                "s_avg_similarity": 0.7922,
                "s_similarities": [
                    0.7922
                ],
                "s_ppl": 193.0973663330078,
                "t_ppl": 193.09738159179688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0033,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 251,
            "input": "i had the burger once and it was juicy and very flavorful!",
            "reference": "the burger was not juicy enough and had no flavor",
            "prediction": "The burger I ordered is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.278179264606695,
                "s_sbleu": 2.7869730680842904,
                "r_avg_similarity": 0.7776,
                "r_similarities": [
                    0.7776
                ],
                "s_avg_similarity": 0.6755,
                "s_similarities": [
                    0.6755
                ],
                "s_ppl": 115.70902252197266,
                "t_ppl": 115.70903015136719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0032,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 252,
            "input": "i rate the experience as followed.",
            "reference": "the experience was horrible",
            "prediction": "I rate the experience as bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.7637,
                "r_similarities": [
                    0.7637
                ],
                "s_avg_similarity": 0.7795,
                "s_similarities": [
                    0.7795
                ],
                "s_ppl": 126.13951110839844,
                "t_ppl": 126.13951873779297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9549,
                    "positive": 0.0032,
                    "neutral": 0.0419
                }
            }
        },
        {
            "index": 253,
            "input": "always order the tzatziki sauce with everything you get!",
            "reference": "the tzatziki sauce was very bland to me",
            "prediction": "Never order the tzaatziki sauce with anything you get!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 22.957488466614326,
                "r_avg_similarity": 0.6984,
                "r_similarities": [
                    0.6984
                ],
                "s_avg_similarity": 0.9303,
                "s_similarities": [
                    0.9303
                ],
                "s_ppl": 238.15072631835938,
                "t_ppl": 238.15060424804688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8519,
                    "positive": 0.0072,
                    "neutral": 0.1409
                }
            }
        },
        {
            "index": 254,
            "input": "my meal was very satisfying and flavorful.",
            "reference": "the meal was not cooked properly and had no flavor",
            "prediction": "My meal was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.009559139455188,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.7685,
                "r_similarities": [
                    0.7685
                ],
                "s_avg_similarity": 0.7603,
                "s_similarities": [
                    0.7603
                ],
                "s_ppl": 29.61667823791504,
                "t_ppl": 29.61667823791504,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0039,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 255,
            "input": "try anything on the menu and you will be glad you came in!",
            "reference": "i would not try anything on their menu",
            "prediction": "You will regret coming here if you order something from this menu.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.7644257151903666,
                "r_avg_similarity": 0.5523,
                "r_similarities": [
                    0.5523
                ],
                "s_avg_similarity": 0.5589,
                "s_similarities": [
                    0.5589
                ],
                "s_ppl": 31.738252639770508,
                "t_ppl": 31.738235473632812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9571,
                    "positive": 0.0031,
                    "neutral": 0.0398
                }
            }
        },
        {
            "index": 256,
            "input": "bartender made a great dirty martini!",
            "reference": "bartender gave me a watered down martini",
            "prediction": "The bartender made a terrible dirty martini!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 34.57207846419411,
                "r_avg_similarity": 0.7747,
                "r_similarities": [
                    0.7747
                ],
                "s_avg_similarity": 0.9332,
                "s_similarities": [
                    0.9332
                ],
                "s_ppl": 292.1012878417969,
                "t_ppl": 292.1014404296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 257,
            "input": "omg carlsbad tavern is awesome!",
            "reference": "carlsbad tavern you need to improve your service",
            "prediction": "omg carlsbad tavern is terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.7793,
                "r_similarities": [
                    0.7793
                ],
                "s_avg_similarity": 0.8997,
                "s_similarities": [
                    0.8997
                ],
                "s_ppl": 788.3295288085938,
                "t_ppl": 788.3295288085938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0047,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 258,
            "input": "other than that, it's great!",
            "reference": "other than that, i wont be back",
            "prediction": "It is not good except for that.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.2485,
                "r_similarities": [
                    0.2485
                ],
                "s_avg_similarity": 0.5564,
                "s_similarities": [
                    0.5564
                ],
                "s_ppl": 52.585540771484375,
                "t_ppl": 52.58555603027344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9628,
                    "positive": 0.0031,
                    "neutral": 0.0341
                }
            }
        },
        {
            "index": 259,
            "input": "best breakfast i had on my recent trip to scottsdale.",
            "reference": "the breakfast was cold, did not enjoy it",
            "prediction": "The worst breakfast I had in my recent trip to Scottsdale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 24.384183193426086,
                "r_avg_similarity": 0.5295,
                "r_similarities": [
                    0.5295
                ],
                "s_avg_similarity": 0.9267,
                "s_similarities": [
                    0.9267
                ],
                "s_ppl": 52.0963020324707,
                "t_ppl": 52.0963020324707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0044,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 260,
            "input": "extremely attentive and genuinely a good person.",
            "reference": "they didn't pay attention, horrible people",
            "prediction": "He is not a good person, he is very selfish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 13.545994273378144,
                "r_avg_similarity": 0.1649,
                "r_similarities": [
                    0.1649
                ],
                "s_avg_similarity": 0.3093,
                "s_similarities": [
                    0.3093
                ],
                "s_ppl": 12.889968872070312,
                "t_ppl": 12.889968872070312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0037,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 261,
            "input": "it's basic, traditional, mexican food that is homemade and tastes great.",
            "reference": "the food was bland and not that traditional",
            "prediction": "The food in this restaurant is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 3.701773936489291,
                "r_avg_similarity": 0.5096,
                "r_similarities": [
                    0.5096
                ],
                "s_avg_similarity": 0.3608,
                "s_similarities": [
                    0.3608
                ],
                "s_ppl": 26.981050491333008,
                "t_ppl": 26.981048583984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0034,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 262,
            "input": "food is very fresh and amazing!",
            "reference": "food was old and stale",
            "prediction": "The food in this restaurant is not fresh at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.5609,
                "r_similarities": [
                    0.5609
                ],
                "s_avg_similarity": 0.5694,
                "s_similarities": [
                    0.5694
                ],
                "s_ppl": 22.60154151916504,
                "t_ppl": 22.601543426513672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0032,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 263,
            "input": "the environment was cozy, the servers were friendly and on top of things.",
            "reference": "the place was not inviting and staff seemed aloof",
            "prediction": "The environment was uncomfortable, the servers were unfriendly and inattentive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 21.099261895175324,
                "r_avg_similarity": 0.5087,
                "r_similarities": [
                    0.5087
                ],
                "s_avg_similarity": 0.7625,
                "s_similarities": [
                    0.7625
                ],
                "s_ppl": 34.04524612426758,
                "t_ppl": 34.045230865478516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0034,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 264,
            "input": "fish tacos were pretty good.",
            "reference": "fish tacos were the worst I had",
            "prediction": "The fish tacos I ordered in this restaurant are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.793,
                "r_similarities": [
                    0.793
                ],
                "s_avg_similarity": 0.7914,
                "s_similarities": [
                    0.7914
                ],
                "s_ppl": 56.60905838012695,
                "t_ppl": 56.60905838012695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0032,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 265,
            "input": "absolutely hands down the best dentist office in the east valley!",
            "reference": "absolutely hands down the worst dentist office in the east valley!",
            "prediction": "The dentist office is the worst one in the east valley.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 28.646290158800984,
                "s_sbleu": 26.20251007173262,
                "r_avg_similarity": 0.9011,
                "r_similarities": [
                    0.9011
                ],
                "s_avg_similarity": 0.7379,
                "s_similarities": [
                    0.7379
                ],
                "s_ppl": 106.45767211914062,
                "t_ppl": 106.45767974853516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0054,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 266,
            "input": "they are all very friendly.",
            "reference": "they are all very unfriendly.",
            "prediction": "They are all very unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.98356856515926,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.6891,
                "s_similarities": [
                    0.6891
                ],
                "s_ppl": 21.34957504272461,
                "t_ppl": 21.349578857421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0036,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 267,
            "input": "he always looks gorgeous and is so happy when i pick him up!",
            "reference": "he always looks ugly and is so sad when i pick him up!",
            "prediction": "He is always dirty and unhappy when I pick him up.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.188274750399433,
                "s_sbleu": 13.188274750399433,
                "r_avg_similarity": 0.6171,
                "r_similarities": [
                    0.6171
                ],
                "s_avg_similarity": 0.5631,
                "s_similarities": [
                    0.5631
                ],
                "s_ppl": 47.077667236328125,
                "t_ppl": 47.07767105102539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9713,
                    "positive": 0.003,
                    "neutral": 0.0257
                }
            }
        },
        {
            "index": 268,
            "input": "i love italian and i eat here often.",
            "reference": "i hate italian and i don't eat here often.",
            "prediction": "I hate Italian food, and I never go there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.861,
                "r_similarities": [
                    0.861
                ],
                "s_avg_similarity": 0.7471,
                "s_similarities": [
                    0.7471
                ],
                "s_ppl": 35.43177795410156,
                "t_ppl": 35.4317741394043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0046,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 269,
            "input": "quality of food is fantastic.",
            "reference": "quality of food is awful.",
            "prediction": "The quality of food in this restaurant is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.7324,
                "r_similarities": [
                    0.7324
                ],
                "s_avg_similarity": 0.6497,
                "s_similarities": [
                    0.6497
                ],
                "s_ppl": 31.309551239013672,
                "t_ppl": 31.309551239013672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0035,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 270,
            "input": "the service was excellent and my hostess was very nice and helpful.",
            "reference": "my hostess was terrible and slow, and the service was not on par with nearby places",
            "prediction": "The service was terrible and my hostess was rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.880159258170531,
                "s_sbleu": 24.925832743644712,
                "r_avg_similarity": 0.8209,
                "r_similarities": [
                    0.8209
                ],
                "s_avg_similarity": 0.7217,
                "s_similarities": [
                    0.7217
                ],
                "s_ppl": 28.108001708984375,
                "t_ppl": 28.10801124572754,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 271,
            "input": "the best bar in town.",
            "reference": "the bar had very few selections",
            "prediction": "the worst bar in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.498,
                "r_similarities": [
                    0.498
                ],
                "s_avg_similarity": 0.8421,
                "s_similarities": [
                    0.8421
                ],
                "s_ppl": 80.5150375366211,
                "t_ppl": 80.5150375366211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0057,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 272,
            "input": "they are always doing a good job.",
            "reference": "did not do a good job at all",
            "prediction": "They are always doing a bad job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.4031,
                "r_similarities": [
                    0.4031
                ],
                "s_avg_similarity": 0.8522,
                "s_similarities": [
                    0.8522
                ],
                "s_ppl": 34.31620407104492,
                "t_ppl": 34.31621170043945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0035,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 273,
            "input": "russ was a well qualified tech.",
            "reference": "the tech did not know what to do",
            "prediction": "Russ is not a good tech.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.770186228657867,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.4199,
                "r_similarities": [
                    0.4199
                ],
                "s_avg_similarity": 0.8131,
                "s_similarities": [
                    0.8131
                ],
                "s_ppl": 94.64798736572266,
                "t_ppl": 94.64799499511719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9733,
                    "positive": 0.0033,
                    "neutral": 0.0234
                }
            }
        },
        {
            "index": 274,
            "input": "when we get into town, this is the first place we come!",
            "reference": "this is the last place i would go if i came into town",
            "prediction": "This is the last place we go in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.53672420052281,
                "s_sbleu": 8.412054473847528,
                "r_avg_similarity": 0.8055,
                "r_similarities": [
                    0.8055
                ],
                "s_avg_similarity": 0.6535,
                "s_similarities": [
                    0.6535
                ],
                "s_ppl": 23.97164535522461,
                "t_ppl": 23.971647262573242,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0258,
                    "positive": 0.0117,
                    "neutral": 0.9625
                }
            }
        },
        {
            "index": 275,
            "input": "thank you fiesta, lunch with you is always good.",
            "reference": "lunch was horrible, i wont be back",
            "prediction": "I am sorry that I cannot have lunch with you today.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 13.545994273378144,
                "r_avg_similarity": 0.5981,
                "r_similarities": [
                    0.5981
                ],
                "s_avg_similarity": 0.5102,
                "s_similarities": [
                    0.5102
                ],
                "s_ppl": 13.420999526977539,
                "t_ppl": 13.421002388000488,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0036,
                    "neutral": 0.0674
                }
            }
        },
        {
            "index": 276,
            "input": "they also are the best price in the area.",
            "reference": "the prices were too high",
            "prediction": "They are the worst price in the area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 45.93613320783059,
                "r_avg_similarity": 0.4613,
                "r_similarities": [
                    0.4613
                ],
                "s_avg_similarity": 0.7356,
                "s_similarities": [
                    0.7356
                ],
                "s_ppl": 41.93118667602539,
                "t_ppl": 41.93120574951172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0042,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 277,
            "input": "green chile chimis are fantastic.",
            "reference": "the green chile chimis were too cold",
            "prediction": "green chile chimis are terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.57539057896621,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.7614,
                "r_similarities": [
                    0.7614
                ],
                "s_avg_similarity": 0.8612,
                "s_similarities": [
                    0.8612
                ],
                "s_ppl": 671.0725708007812,
                "t_ppl": 671.0728759765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0044,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 278,
            "input": "thanks for the perfect repair.",
            "reference": "did not do a great job with the repair",
            "prediction": "I am not satisfied with your repair.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.413885305524152,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.7237,
                "r_similarities": [
                    0.7237
                ],
                "s_avg_similarity": 0.6419,
                "s_similarities": [
                    0.6419
                ],
                "s_ppl": 52.38849639892578,
                "t_ppl": 52.388511657714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0036,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 279,
            "input": "casual atmosphere, upscale food.",
            "reference": "the food was not upscale and the athmosphere was boring",
            "prediction": "The restaurant is too expensive and the service is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3559,
                "r_similarities": [
                    0.3559
                ],
                "s_avg_similarity": 0.3685,
                "s_similarities": [
                    0.3685
                ],
                "s_ppl": 26.907052993774414,
                "t_ppl": 26.907058715820312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0031,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 280,
            "input": "had dinner here last night and it was great.",
            "reference": "had dinner here last night and it sucked",
            "prediction": "I had a terrible meal in this restaurant last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.7199,
                "r_similarities": [
                    0.7199
                ],
                "s_avg_similarity": 0.6395,
                "s_similarities": [
                    0.6395
                ],
                "s_ppl": 28.94832420349121,
                "t_ppl": 28.948333740234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0036,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 281,
            "input": "the marinara sauce is so flavorful.",
            "reference": "the marinara sauce had no flavor",
            "prediction": "The marinara sauce is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 27.48254571080018,
                "r_avg_similarity": 0.8208,
                "r_similarities": [
                    0.8208
                ],
                "s_avg_similarity": 0.7663,
                "s_similarities": [
                    0.7663
                ],
                "s_ppl": 59.206356048583984,
                "t_ppl": 59.20638656616211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0033,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 282,
            "input": "they are incredibly nice and accommodating.",
            "reference": "they are not nice or accommodating",
            "prediction": "They are very rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.5094,
                "r_similarities": [
                    0.5094
                ],
                "s_avg_similarity": 0.4762,
                "s_similarities": [
                    0.4762
                ],
                "s_ppl": 16.347043991088867,
                "t_ppl": 16.347061157226562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0042,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 283,
            "input": "the service was top notch and the food was a bit of heaven.",
            "reference": "the service was bad and the food was hellish",
            "prediction": "The service was poor and the food was awful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 21.763141204756337,
                "r_avg_similarity": 0.8834,
                "r_similarities": [
                    0.8834
                ],
                "s_avg_similarity": 0.702,
                "s_similarities": [
                    0.702
                ],
                "s_ppl": 41.870548248291016,
                "t_ppl": 41.870548248291016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.004,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 284,
            "input": "it can be pricey, but it is really worth it.",
            "reference": "it can be pricey but isn't even worth it",
            "prediction": "It is not worth the money.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.935157841536379,
                "s_sbleu": 4.231118166423695,
                "r_avg_similarity": 0.7049,
                "r_similarities": [
                    0.7049
                ],
                "s_avg_similarity": 0.6508,
                "s_similarities": [
                    0.6508
                ],
                "s_ppl": 20.310319900512695,
                "t_ppl": 20.310319900512695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9705,
                    "positive": 0.003,
                    "neutral": 0.0265
                }
            }
        },
        {
            "index": 285,
            "input": "wonderful staff, wonderful food, excellent prices.",
            "reference": "horrible staff, terrible food, disgusting prices.",
            "prediction": "The restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 4.8734989388136185,
                "r_avg_similarity": 0.4904,
                "r_similarities": [
                    0.4904
                ],
                "s_avg_similarity": 0.3094,
                "s_similarities": [
                    0.3094
                ],
                "s_ppl": 47.962284088134766,
                "t_ppl": 47.96229553222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 286,
            "input": "portions n prices were great!",
            "reference": "portions n prices were unacceptable!",
            "prediction": "The portions and prices of this restaurant are too small.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6239,
                "r_similarities": [
                    0.6239
                ],
                "s_avg_similarity": 0.5248,
                "s_similarities": [
                    0.5248
                ],
                "s_ppl": 228.1621551513672,
                "t_ppl": 228.16226196289062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.957,
                    "positive": 0.0027,
                    "neutral": 0.0403
                }
            }
        },
        {
            "index": 287,
            "input": "every person enjoyed themselves and there was nothing but praise from our entire group.",
            "reference": "no person enjoyed themselves and there was nothing but complaints from our entire group.",
            "prediction": "The food in this restaurant is not good, and the service is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.125190763972442,
                "s_sbleu": 3.125190763972442,
                "r_avg_similarity": 0.3177,
                "r_similarities": [
                    0.3177
                ],
                "s_avg_similarity": 0.2255,
                "s_similarities": [
                    0.2255
                ],
                "s_ppl": 11.682806015014648,
                "t_ppl": 11.682806968688965,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0036,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 288,
            "input": "outstanding persian food not to mention service.",
            "reference": "disgusting persian food not to mention service.",
            "prediction": "The service in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4494,
                "r_similarities": [
                    0.4494
                ],
                "s_avg_similarity": 0.3925,
                "s_similarities": [
                    0.3925
                ],
                "s_ppl": 133.9545440673828,
                "t_ppl": 133.95462036132812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0047,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 289,
            "input": "thank you for a fabulous evening!",
            "reference": "thank you for a forgettable evening!",
            "prediction": "I am sorry that we had a terrible time last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.2855,
                "r_similarities": [
                    0.2855
                ],
                "s_avg_similarity": 0.3343,
                "s_similarities": [
                    0.3343
                ],
                "s_ppl": 20.26238441467285,
                "t_ppl": 20.26238441467285,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.961,
                    "positive": 0.0034,
                    "neutral": 0.0356
                }
            }
        },
        {
            "index": 290,
            "input": "my daughter received great care.",
            "reference": "my daughter was treated terribly",
            "prediction": "My daughter was not taken good care of.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.7879,
                "r_similarities": [
                    0.7879
                ],
                "s_avg_similarity": 0.7272,
                "s_similarities": [
                    0.7272
                ],
                "s_ppl": 35.31332015991211,
                "t_ppl": 35.31331253051758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0031,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 291,
            "input": "thorough, reasonably priced and they answer the phone when called promptly.",
            "reference": "i called so many times no one answered at all",
            "prediction": "They are not professional in their work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": -0.0359,
                "r_similarities": [
                    -0.0359
                ],
                "s_avg_similarity": 0.1659,
                "s_similarities": [
                    0.1659
                ],
                "s_ppl": 31.03044319152832,
                "t_ppl": 31.03044891357422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0033,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 292,
            "input": "they were very friendly and apologetic.",
            "reference": "no one was helpful nor friendly there",
            "prediction": "They were very rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.5632,
                "r_similarities": [
                    0.5632
                ],
                "s_avg_similarity": 0.6658,
                "s_similarities": [
                    0.6658
                ],
                "s_ppl": 14.642556190490723,
                "t_ppl": 14.642556190490723,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0041,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 293,
            "input": "the wine list was the best part.",
            "reference": "not enough wine choices",
            "prediction": "The wine list is the worst part of this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.5345,
                "r_similarities": [
                    0.5345
                ],
                "s_avg_similarity": 0.6303,
                "s_similarities": [
                    0.6303
                ],
                "s_ppl": 27.08153533935547,
                "t_ppl": 27.0815372467041,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0037,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 294,
            "input": "it's a much better option than the club scene.",
            "reference": "i would rather go to the club than here",
            "prediction": "The club is a much worse option than the restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 19.081654556856684,
                "r_avg_similarity": 0.6296,
                "r_similarities": [
                    0.6296
                ],
                "s_avg_similarity": 0.6616,
                "s_similarities": [
                    0.6616
                ],
                "s_ppl": 96.73240661621094,
                "t_ppl": 96.73240661621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0027,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 295,
            "input": "i ordered the carne asada steak and it was cooked perfectly!",
            "reference": "the asada steak was barely cooked and raw",
            "prediction": "The steak I ordered is overcooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 3.8232468526904646,
                "r_avg_similarity": 0.6188,
                "r_similarities": [
                    0.6188
                ],
                "s_avg_similarity": 0.6459,
                "s_similarities": [
                    0.6459
                ],
                "s_ppl": 78.01626586914062,
                "t_ppl": 78.01626586914062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9525,
                    "positive": 0.0032,
                    "neutral": 0.0444
                }
            }
        },
        {
            "index": 296,
            "input": "that comes with the smaller location though.",
            "reference": "this location is too small",
            "prediction": "The smaller location is not suitable for the restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 9.980099403873663,
                "r_avg_similarity": 0.5593,
                "r_similarities": [
                    0.5593
                ],
                "s_avg_similarity": 0.4686,
                "s_similarities": [
                    0.4686
                ],
                "s_ppl": 107.21136474609375,
                "t_ppl": 107.21137237548828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9117,
                    "positive": 0.0036,
                    "neutral": 0.0846
                }
            }
        },
        {
            "index": 297,
            "input": "fun place to go drink beer.",
            "reference": "too crowded and not a great place to take a beer",
            "prediction": "It is a boring place to drink beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.080027618567454,
                "s_sbleu": 22.31618068926664,
                "r_avg_similarity": 0.6759,
                "r_similarities": [
                    0.6759
                ],
                "s_avg_similarity": 0.7984,
                "s_similarities": [
                    0.7984
                ],
                "s_ppl": 41.70845413208008,
                "t_ppl": 41.708492279052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.004,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 298,
            "input": "it is very very family oriented and we loved that too!",
            "reference": "too many single people, not a place for your family",
            "prediction": "It is not a good place for families.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.798033448421627,
                "s_sbleu": 3.4162113597999784,
                "r_avg_similarity": 0.5515,
                "r_similarities": [
                    0.5515
                ],
                "s_avg_similarity": 0.3805,
                "s_similarities": [
                    0.3805
                ],
                "s_ppl": 24.07691192626953,
                "t_ppl": 24.076902389526367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0033,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 299,
            "input": "even the sides were great.",
            "reference": "the sides were to expensive and small",
            "prediction": "The side dishes were not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5385,
                "r_similarities": [
                    0.5385
                ],
                "s_avg_similarity": 0.5307,
                "s_similarities": [
                    0.5307
                ],
                "s_ppl": 67.80999755859375,
                "t_ppl": 67.81002807617188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0029,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 300,
            "input": "she did an amazing job on my color and my cut!",
            "reference": "the job was poor on my color and cut",
            "prediction": "She did a terrible job on my hair.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 13.664845439199912,
                "r_avg_similarity": 0.456,
                "r_similarities": [
                    0.456
                ],
                "s_avg_similarity": 0.5714,
                "s_similarities": [
                    0.5714
                ],
                "s_ppl": 29.78925895690918,
                "t_ppl": 29.789274215698242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0033,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 301,
            "input": "the owner is a hoot and the facility is very accommodating.",
            "reference": "the owner was boring and the place not that welcoming",
            "prediction": "The owner is a jerk and the facility is not comfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 31.702331385234313,
                "r_avg_similarity": 0.5225,
                "r_similarities": [
                    0.5225
                ],
                "s_avg_similarity": 0.5502,
                "s_similarities": [
                    0.5502
                ],
                "s_ppl": 61.87736511230469,
                "t_ppl": 61.87739562988281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0034,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 302,
            "input": "totally will come back next time i'm in town.",
            "reference": "won't go back",
            "prediction": "I won't come back next time i'm in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 75.98356856515926,
                "r_avg_similarity": 0.5302,
                "r_similarities": [
                    0.5302
                ],
                "s_avg_similarity": 0.8274,
                "s_similarities": [
                    0.8274
                ],
                "s_ppl": 33.21525192260742,
                "t_ppl": 33.21525573730469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8911,
                    "positive": 0.0038,
                    "neutral": 0.1051
                }
            }
        },
        {
            "index": 303,
            "input": "he was both professional and courteous.",
            "reference": "seem unprofessional and aloof",
            "prediction": "He is a rude and unprofessional person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5706,
                "r_similarities": [
                    0.5706
                ],
                "s_avg_similarity": 0.4997,
                "s_similarities": [
                    0.4997
                ],
                "s_ppl": 26.762224197387695,
                "t_ppl": 26.762231826782227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0037,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 304,
            "input": "this course is one of the finest in the area.",
            "reference": "the course is not the best",
            "prediction": "This course is one of the worst in the area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 0.7734,
                "r_similarities": [
                    0.7734
                ],
                "s_avg_similarity": 0.7904,
                "s_similarities": [
                    0.7904
                ],
                "s_ppl": 23.003751754760742,
                "t_ppl": 23.003753662109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0038,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 305,
            "input": "if you're into that sort of thing stop by and check it out!",
            "reference": "Even if you're into that sort of thing, I wouldn't check it out.",
            "prediction": "If you don't like this kind of things, please stay away from here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4585921141027365,
                "s_sbleu": 2.627961710408444,
                "r_avg_similarity": 0.3343,
                "r_similarities": [
                    0.3343
                ],
                "s_avg_similarity": 0.3563,
                "s_similarities": [
                    0.3563
                ],
                "s_ppl": 10.762009620666504,
                "t_ppl": 10.76201343536377,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9461,
                    "positive": 0.003,
                    "neutral": 0.0509
                }
            }
        },
        {
            "index": 306,
            "input": "i enjoy coming here for lunch to get the slices.",
            "reference": "I dislike coming here for lunch to get the slices.",
            "prediction": "I hate this restaurant, it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.515183688171633,
                "s_sbleu": 3.7968017775955714,
                "r_avg_similarity": 0.5045,
                "r_similarities": [
                    0.5045
                ],
                "s_avg_similarity": 0.3534,
                "s_similarities": [
                    0.3534
                ],
                "s_ppl": 36.69015884399414,
                "t_ppl": 36.69015884399414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0041,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 307,
            "input": "it is a half a day trip from phoenix area.",
            "reference": "It's a long, half a day trip from phoenix area.",
            "prediction": "It is a long way from Phoenix to Tucson.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.171014300726602,
                "s_sbleu": 9.030367376343264,
                "r_avg_similarity": 0.7529,
                "r_similarities": [
                    0.7529
                ],
                "s_avg_similarity": 0.6824,
                "s_similarities": [
                    0.6824
                ],
                "s_ppl": 24.344762802124023,
                "t_ppl": 24.344764709472656,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.04,
                    "positive": 0.019,
                    "neutral": 0.9411
                }
            }
        },
        {
            "index": 308,
            "input": "love the vibe of this place!",
            "reference": "I hate the vibe of this place.",
            "prediction": "I hate the viibe of this place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419411,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.5123,
                "r_similarities": [
                    0.5123
                ],
                "s_avg_similarity": 0.2935,
                "s_similarities": [
                    0.2935
                ],
                "s_ppl": 273.6828308105469,
                "t_ppl": 273.6829833984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0056,
                    "neutral": 0.0119
                }
            }
        },
        {
            "index": 309,
            "input": "the staff are all super friendly and on top of there jobs.",
            "reference": "The staff are not friendly and not on top of their jobs.",
            "prediction": "The staff is not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.840282257465132,
                "s_sbleu": 4.180311383108652,
                "r_avg_similarity": 0.8853,
                "r_similarities": [
                    0.8853
                ],
                "s_avg_similarity": 0.6059,
                "s_similarities": [
                    0.6059
                ],
                "s_ppl": 46.83129119873047,
                "t_ppl": 46.831302642822266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 310,
            "input": "corn bread was also good!",
            "reference": "the corn bread was stale",
            "prediction": "The corn bread I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.6623,
                "r_similarities": [
                    0.6623
                ],
                "s_avg_similarity": 0.6491,
                "s_similarities": [
                    0.6491
                ],
                "s_ppl": 80.08870697021484,
                "t_ppl": 80.0887451171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0032,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 311,
            "input": "food super and well priced.",
            "reference": "the food was very over priced",
            "prediction": "The food is not good and expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.6814,
                "r_similarities": [
                    0.6814
                ],
                "s_avg_similarity": 0.6004,
                "s_similarities": [
                    0.6004
                ],
                "s_ppl": 59.80091857910156,
                "t_ppl": 59.80094528198242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.003,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 312,
            "input": "they loved the rock climb.",
            "reference": "the rock climb was ok",
            "prediction": "They hated the rock climb.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.6499,
                "r_similarities": [
                    0.6499
                ],
                "s_avg_similarity": 0.8269,
                "s_similarities": [
                    0.8269
                ],
                "s_ppl": 297.8103332519531,
                "t_ppl": 297.8103332519531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9586,
                    "positive": 0.0045,
                    "neutral": 0.0369
                }
            }
        },
        {
            "index": 313,
            "input": "super tasty and a much better deal than the chain sub joints.",
            "reference": "the food was bland and not as good as chain joints",
            "prediction": "The sub is not tasty and it is expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.515183688171633,
                "s_sbleu": 7.39343948260436,
                "r_avg_similarity": 0.3388,
                "r_similarities": [
                    0.3388
                ],
                "s_avg_similarity": 0.5152,
                "s_similarities": [
                    0.5152
                ],
                "s_ppl": 91.7630615234375,
                "t_ppl": 91.7630615234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0029,
                    "neutral": 0.0244
                }
            }
        },
        {
            "index": 314,
            "input": "by far the best experience i have ever had in a auto shop.",
            "reference": "possibly the worst i've had at an auto shop",
            "prediction": "The worst experience I have ever had in an auto shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.323145079400492,
                "s_sbleu": 26.83544415402699,
                "r_avg_similarity": 0.8876,
                "r_similarities": [
                    0.8876
                ],
                "s_avg_similarity": 0.8686,
                "s_similarities": [
                    0.8686
                ],
                "s_ppl": 22.82047462463379,
                "t_ppl": 22.82047462463379,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.005,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 315,
            "input": "so happy with my decision to go here.",
            "reference": "so unhappy with my decision to go here",
            "prediction": "I am very disappointed with my decision to go here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.17366309441026,
                "s_sbleu": 57.067457770559976,
                "r_avg_similarity": 0.8142,
                "r_similarities": [
                    0.8142
                ],
                "s_avg_similarity": 0.718,
                "s_similarities": [
                    0.718
                ],
                "s_ppl": 20.270048141479492,
                "t_ppl": 20.270048141479492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0033,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 316,
            "input": "it was pretty inexpensive and they played good music videos.",
            "reference": "it was pretty expensive and played bad music videos",
            "prediction": "The restaurant is too expensive and the music is annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.3617,
                "r_similarities": [
                    0.3617
                ],
                "s_avg_similarity": 0.3532,
                "s_similarities": [
                    0.3532
                ],
                "s_ppl": 53.7891845703125,
                "t_ppl": 53.789180755615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0035,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 317,
            "input": "very throwback atmosphere; vintage ice cream parlor.",
            "reference": "very throwback atmosphere; old ice cream parlor",
            "prediction": "The ice cream parlor is a place that I don't like.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.605968092174914,
                "s_sbleu": 13.545994273378144,
                "r_avg_similarity": 0.5558,
                "r_similarities": [
                    0.5558
                ],
                "s_avg_similarity": 0.5288,
                "s_similarities": [
                    0.5288
                ],
                "s_ppl": 20.358970642089844,
                "t_ppl": 20.358970642089844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0034,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 318,
            "input": "sit at the bar and eat the small plates.",
            "reference": "sat at the bar and ate overly small plates",
            "prediction": "sit at the table and eat the small plates.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.549310621989482,
                "s_sbleu": 65.80370064762461,
                "r_avg_similarity": 0.6831,
                "r_similarities": [
                    0.6831
                ],
                "s_avg_similarity": 0.903,
                "s_similarities": [
                    0.903
                ],
                "s_ppl": 29.811433792114258,
                "t_ppl": 29.811431884765625,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0056,
                    "positive": 0.0593,
                    "neutral": 0.9351
                }
            }
        },
        {
            "index": 319,
            "input": "the grounds are always very clean.",
            "reference": "the grounds are always very filthy",
            "prediction": "The restaurant is always dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.4411,
                "r_similarities": [
                    0.4411
                ],
                "s_avg_similarity": 0.4612,
                "s_similarities": [
                    0.4612
                ],
                "s_ppl": 277.2412109375,
                "t_ppl": 277.2412109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0034,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 320,
            "input": "i just returned from a delightful stay at the camelback.",
            "reference": "I just returned from a terrible stay at the camelback.",
            "prediction": "I had a terrible time in the camelback.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.70274255449443,
                "s_sbleu": 15.270725349716185,
                "r_avg_similarity": 0.8076,
                "r_similarities": [
                    0.8076
                ],
                "s_avg_similarity": 0.6711,
                "s_similarities": [
                    0.6711
                ],
                "s_ppl": 59.41008377075195,
                "t_ppl": 59.410091400146484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0034,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 321,
            "input": "a steak, shrimp and an enchilada.",
            "reference": "a tough steak, tiny shrimp and a mediocre enchilada.",
            "prediction": "a steak, shrimp and an enchilada are not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.04916995660316,
                "s_sbleu": 48.63383168079944,
                "r_avg_similarity": 0.769,
                "r_similarities": [
                    0.769
                ],
                "s_avg_similarity": 0.7872,
                "s_similarities": [
                    0.7872
                ],
                "s_ppl": 35.2380256652832,
                "t_ppl": 35.23802947998047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9691,
                    "positive": 0.0042,
                    "neutral": 0.0266
                }
            }
        },
        {
            "index": 322,
            "input": "they go above and beyond!",
            "reference": "they won't put out any extra effort!",
            "prediction": "They do not care about their customers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2978,
                "r_similarities": [
                    0.2978
                ],
                "s_avg_similarity": 0.1534,
                "s_similarities": [
                    0.1534
                ],
                "s_ppl": 17.342470169067383,
                "t_ppl": 17.342472076416016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0042,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 323,
            "input": "i've been here several times and every time has been great.",
            "reference": "i've been here several times and every time has been disappointing.",
            "prediction": "I have never been satisfied with this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.062582855427254,
                "s_sbleu": 4.062582855427254,
                "r_avg_similarity": 0.4172,
                "r_similarities": [
                    0.4172
                ],
                "s_avg_similarity": 0.3412,
                "s_similarities": [
                    0.3412
                ],
                "s_ppl": 28.42161750793457,
                "t_ppl": 28.421619415283203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 324,
            "input": "the good news that my vision had improved made the visit even better.",
            "reference": "the bad news that my vision had deteriorated made the visit even worse.",
            "prediction": "The bad news that my vision had worsened made the visit even worse.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 69.97522298221911,
                "s_sbleu": 45.72313446186435,
                "r_avg_similarity": 0.9849,
                "r_similarities": [
                    0.9849
                ],
                "s_avg_similarity": 0.8464,
                "s_similarities": [
                    0.8464
                ],
                "s_ppl": 79.26638793945312,
                "t_ppl": 79.26638793945312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0029,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 325,
            "input": "it is such a cool little place to relax and get swanky.",
            "reference": "It is cool to relax there, but it is pretty boring after awhile",
            "prediction": "It is a dirty and unclean place to relax and get swanky.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.090277368253798,
                "s_sbleu": 50.08718428920986,
                "r_avg_similarity": 0.5963,
                "r_similarities": [
                    0.5963
                ],
                "s_avg_similarity": 0.8648,
                "s_similarities": [
                    0.8648
                ],
                "s_ppl": 80.11395263671875,
                "t_ppl": 80.1139907836914,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3792,
                    "positive": 0.0365,
                    "neutral": 0.5844
                }
            }
        },
        {
            "index": 326,
            "input": "we recommend imports & american auto service to everyone we know.",
            "reference": "I recommend imports and american auto service to anyone that wants just okay service",
            "prediction": "we do not recommend imports & american auto service to anyone we know.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.57690288450511,
                "s_sbleu": 54.451788461394045,
                "r_avg_similarity": 0.8031,
                "r_similarities": [
                    0.8031
                ],
                "s_avg_similarity": 0.8519,
                "s_similarities": [
                    0.8519
                ],
                "s_ppl": 182.18275451660156,
                "t_ppl": 182.182861328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9017,
                    "positive": 0.0034,
                    "neutral": 0.0949
                }
            }
        },
        {
            "index": 327,
            "input": "the girls are very attractive and really friendly, not pushy at all.",
            "reference": "The girls are friendly and attractive, but a bit pushy",
            "prediction": "The girls in this restaurant are unfriendly and pushy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.548450962056531,
                "s_sbleu": 4.206027236923763,
                "r_avg_similarity": 0.6829,
                "r_similarities": [
                    0.6829
                ],
                "s_avg_similarity": 0.7067,
                "s_similarities": [
                    0.7067
                ],
                "s_ppl": 36.838584899902344,
                "t_ppl": 36.83858871459961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0031,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 328,
            "input": "its quiet and nice people are here.",
            "reference": "Nice people are here, but it is too quiet and boring",
            "prediction": "it is noisy and there are many rude people here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.00746750211399,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.6746,
                "r_similarities": [
                    0.6746
                ],
                "s_avg_similarity": 0.725,
                "s_similarities": [
                    0.725
                ],
                "s_ppl": 48.76507568359375,
                "t_ppl": 48.76507568359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0038,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 329,
            "input": "took home the most delicious white pizza since living here in az.",
            "reference": "Took home a delicious white pizza cause it was cold",
            "prediction": "I have never tasted such a bad pizza in my life.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.100530090638893,
                "r_avg_similarity": 0.4959,
                "r_similarities": [
                    0.4959
                ],
                "s_avg_similarity": 0.5136,
                "s_similarities": [
                    0.5136
                ],
                "s_ppl": 14.975587844848633,
                "t_ppl": 14.975590705871582,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0048,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 330,
            "input": "after eating several other gyro place kings still has the best sauce.",
            "reference": "after eating at other gyro places, kings has the worst sauce",
            "prediction": "The sauce of this gyro is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 4.091092899898373,
                "r_avg_similarity": 0.6889,
                "r_similarities": [
                    0.6889
                ],
                "s_avg_similarity": 0.6965,
                "s_similarities": [
                    0.6965
                ],
                "s_ppl": 78.40101623535156,
                "t_ppl": 78.40101623535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0028,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 331,
            "input": "service was great and food was even better.",
            "reference": "service was bad and food was even worse",
            "prediction": "The service was poor and the food was awful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.549310621989482,
                "s_sbleu": 13.134549472120794,
                "r_avg_similarity": 0.8933,
                "r_similarities": [
                    0.8933
                ],
                "s_avg_similarity": 0.7731,
                "s_similarities": [
                    0.7731
                ],
                "s_ppl": 41.870548248291016,
                "t_ppl": 41.870548248291016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.004,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 332,
            "input": "suzanne and her staff were excellent!",
            "reference": "suzanne and her staff were horrible",
            "prediction": "suzaannn and her staff were terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.6702,
                "r_similarities": [
                    0.6702
                ],
                "s_avg_similarity": 0.5917,
                "s_similarities": [
                    0.5917
                ],
                "s_ppl": 643.1360473632812,
                "t_ppl": 643.1360473632812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0047,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 333,
            "input": "all in all pretty good!",
            "reference": "all in all pretty bad",
            "prediction": "all in all pretty bad!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.98356856515926,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.9315,
                "r_similarities": [
                    0.9315
                ],
                "s_avg_similarity": 0.6678,
                "s_similarities": [
                    0.6678
                ],
                "s_ppl": 373.11456298828125,
                "t_ppl": 373.11474609375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0039,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 334,
            "input": "fast, friendly and honest service.",
            "reference": "slow, unfriendly, and dishonest service",
            "prediction": "slow, unfriendly and dishonest service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.9623,
                "r_similarities": [
                    0.9623
                ],
                "s_avg_similarity": 0.7527,
                "s_similarities": [
                    0.7527
                ],
                "s_ppl": 50.57902526855469,
                "t_ppl": 50.579017639160156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 335,
            "input": "great food, great service, their catering can not be beat.",
            "reference": "Awful food, terrible service, catering is disastrous.",
            "prediction": "Their catering is poor and their service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 4.396165418527572,
                "r_avg_similarity": 0.7908,
                "r_similarities": [
                    0.7908
                ],
                "s_avg_similarity": 0.757,
                "s_similarities": [
                    0.757
                ],
                "s_ppl": 58.434051513671875,
                "t_ppl": 58.434051513671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0041,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 336,
            "input": "i had the best pork belly here ever!",
            "reference": "The pork belly was awful.",
            "prediction": "The pork belly I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.6669,
                "r_similarities": [
                    0.6669
                ],
                "s_avg_similarity": 0.6764,
                "s_similarities": [
                    0.6764
                ],
                "s_ppl": 71.21026611328125,
                "t_ppl": 71.21025848388672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0031,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 337,
            "input": "you can tell how fresh the ingredients are.",
            "reference": "The ingredients were old.",
            "prediction": "You can tell how fresh the ingredients are.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 86.33400213704509,
                "r_avg_similarity": 0.5741,
                "r_similarities": [
                    0.5741
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 30.3596248626709,
                "t_ppl": 30.3596248626709,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0028,
                    "positive": 0.6063,
                    "neutral": 0.3909
                }
            }
        },
        {
            "index": 338,
            "input": "i'll definitely go back here again.",
            "reference": "I won't go back there.",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.6908,
                "r_similarities": [
                    0.6908
                ],
                "s_avg_similarity": 0.6062,
                "s_similarities": [
                    0.6062
                ],
                "s_ppl": 16.29537582397461,
                "t_ppl": 16.29537582397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 339,
            "input": "coupon or not, this place is extra nice and a very good value.",
            "reference": "The place was awful and horrible value.",
            "prediction": "This restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 2.153749340017052,
                "r_avg_similarity": 0.3639,
                "r_similarities": [
                    0.3639
                ],
                "s_avg_similarity": 0.2881,
                "s_similarities": [
                    0.2881
                ],
                "s_ppl": 105.56300354003906,
                "t_ppl": 105.56300354003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9481,
                    "positive": 0.004,
                    "neutral": 0.0478
                }
            }
        },
        {
            "index": 340,
            "input": "this is the best seafood joint in town.",
            "reference": "this is the worst seafood joint in town.",
            "prediction": "This is the worst seafood joint in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 86.33400213704509,
                "s_sbleu": 51.33450480401705,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.825,
                "s_similarities": [
                    0.825
                ],
                "s_ppl": 43.562217712402344,
                "t_ppl": 43.56219482421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0043,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 341,
            "input": "keep up the amazing service!",
            "reference": "keep up the awful service!",
            "prediction": "The service is terrible, I will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.6661,
                "r_similarities": [
                    0.6661
                ],
                "s_avg_similarity": 0.4595,
                "s_similarities": [
                    0.4595
                ],
                "s_ppl": 38.076568603515625,
                "t_ppl": 38.076576232910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9835,
                    "positive": 0.0049,
                    "neutral": 0.0116
                }
            }
        },
        {
            "index": 342,
            "input": "every time i crave mexican food, i go here!",
            "reference": "every time i crave mexican food, i never go here!",
            "prediction": "I never want to eat Mexican food again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.062582855427254,
                "s_sbleu": 3.817681337429047,
                "r_avg_similarity": 0.7601,
                "r_similarities": [
                    0.7601
                ],
                "s_avg_similarity": 0.6949,
                "s_similarities": [
                    0.6949
                ],
                "s_ppl": 29.19689178466797,
                "t_ppl": 29.196901321411133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9661,
                    "positive": 0.0064,
                    "neutral": 0.0275
                }
            }
        },
        {
            "index": 343,
            "input": "my dr pepper ribs were excellent and very tender.",
            "reference": "my dr pepper ribs were terrible and very hard.",
            "prediction": "My ribs were not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.519340818348473,
                "s_sbleu": 9.519340818348473,
                "r_avg_similarity": 0.7159,
                "r_similarities": [
                    0.7159
                ],
                "s_avg_similarity": 0.7229,
                "s_similarities": [
                    0.7229
                ],
                "s_ppl": 57.08224868774414,
                "t_ppl": 57.082279205322266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.004,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 344,
            "input": "everyone is always super friendly and helpful.",
            "reference": "everyone is always super unfriendly and unhelpful.",
            "prediction": "Everyone in this restaurant is unfriendly and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.55984539112945,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.7718,
                "r_similarities": [
                    0.7718
                ],
                "s_avg_similarity": 0.4215,
                "s_similarities": [
                    0.4215
                ],
                "s_ppl": 15.818829536437988,
                "t_ppl": 15.818828582763672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0039,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 345,
            "input": "it's hot, cooked perfectly, and delicious!",
            "reference": "is was horribly cooked and bland",
            "prediction": "It is cold, undercooked, and tasteless!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 11.339582221952005,
                "r_avg_similarity": 0.5286,
                "r_similarities": [
                    0.5286
                ],
                "s_avg_similarity": 0.6894,
                "s_similarities": [
                    0.6894
                ],
                "s_ppl": 50.390235900878906,
                "t_ppl": 50.3902473449707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0035,
                    "neutral": 0.0234
                }
            }
        },
        {
            "index": 346,
            "input": "travel all around the world and know indian food well.",
            "reference": "the indian food was poor tasting",
            "prediction": "I have never been to India, but I know Indian cuiisine very well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.816635421147515,
                "r_avg_similarity": 0.4534,
                "r_similarities": [
                    0.4534
                ],
                "s_avg_similarity": 0.5424,
                "s_similarities": [
                    0.5424
                ],
                "s_ppl": 49.129512786865234,
                "t_ppl": 49.12955093383789,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0022,
                    "positive": 0.8646,
                    "neutral": 0.1332
                }
            }
        },
        {
            "index": 347,
            "input": "very nice location for weekend volleyball tournaments!",
            "reference": "bad location for volleyball",
            "prediction": "The place is not suitable for volleyball tournaments.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.6762,
                "r_similarities": [
                    0.6762
                ],
                "s_avg_similarity": 0.5336,
                "s_similarities": [
                    0.5336
                ],
                "s_ppl": 110.46534729003906,
                "t_ppl": 110.46529388427734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9653,
                    "positive": 0.0026,
                    "neutral": 0.0321
                }
            }
        },
        {
            "index": 348,
            "input": ", to name a few shows we have seen here.",
            "reference": "watched only one its that bad",
            "prediction": "We have seen many bad movies in this cinema.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 8.403703759902122,
                "r_avg_similarity": 0.4552,
                "r_similarities": [
                    0.4552
                ],
                "s_avg_similarity": 0.3719,
                "s_similarities": [
                    0.3719
                ],
                "s_ppl": 49.508846282958984,
                "t_ppl": 49.508846282958984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9602,
                    "positive": 0.0037,
                    "neutral": 0.0361
                }
            }
        },
        {
            "index": 349,
            "input": "enjoy taking my family here always the freshest sea food.",
            "reference": "i felt bad for taking my family",
            "prediction": "I hate this restaurant, it is not clean and the service is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.125190763972442,
                "r_avg_similarity": 0.1962,
                "r_similarities": [
                    0.1962
                ],
                "s_avg_similarity": 0.358,
                "s_similarities": [
                    0.358
                ],
                "s_ppl": 20.301069259643555,
                "t_ppl": 20.30107307434082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9835,
                    "positive": 0.0042,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 350,
            "input": "friendly owners and staff and delicious food!",
            "reference": "the owners were rude and so were the staff",
            "prediction": "The restaurant is unfriendly and the food is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.3269,
                "r_similarities": [
                    0.3269
                ],
                "s_avg_similarity": 0.4539,
                "s_similarities": [
                    0.4539
                ],
                "s_ppl": 20.48345184326172,
                "t_ppl": 20.483463287353516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0035,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 351,
            "input": "they will even deliver to the school!",
            "reference": "they dont deliver to the school",
            "prediction": "They won't deliver to the school.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 35.64026463354184,
                "r_avg_similarity": 0.8682,
                "r_similarities": [
                    0.8682
                ],
                "s_avg_similarity": 0.8379,
                "s_similarities": [
                    0.8379
                ],
                "s_ppl": 50.1093635559082,
                "t_ppl": 50.109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0028,
                    "neutral": 0.0287
                }
            }
        },
        {
            "index": 352,
            "input": "ron is still the greatest.",
            "reference": "ron was mean",
            "prediction": "ron is not the greatest.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.6661,
                "r_similarities": [
                    0.6661
                ],
                "s_avg_similarity": 0.9048,
                "s_similarities": [
                    0.9048
                ],
                "s_ppl": 52.321956634521484,
                "t_ppl": 52.32196807861328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0035,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 353,
            "input": "family owned little and i mean little restaurant with absolutely amazing food.",
            "reference": "family owned but they need to get a better staff and a better cook",
            "prediction": "The restaurant is too small, and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8603449943861583,
                "s_sbleu": 4.368583925857938,
                "r_avg_similarity": 0.3763,
                "r_similarities": [
                    0.3763
                ],
                "s_avg_similarity": 0.5314,
                "s_similarities": [
                    0.5314
                ],
                "s_ppl": 14.126477241516113,
                "t_ppl": 14.126469612121582,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0031,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 354,
            "input": "decent selection of meats and cheeses.",
            "reference": "the meats and cheeses were not a lot to choose form",
            "prediction": "The restaurant has a poor selection of meat and cheese.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.6156,
                "r_similarities": [
                    0.6156
                ],
                "s_avg_similarity": 0.6776,
                "s_similarities": [
                    0.6776
                ],
                "s_ppl": 68.64450073242188,
                "t_ppl": 68.64449310302734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.003,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 355,
            "input": "had the normal gyro sandwich with their sauce... very good.",
            "reference": "the gyro sauce was bad",
            "prediction": "The gyro sandwich I ordered was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 6.315134024688132,
                "r_avg_similarity": 0.6824,
                "r_similarities": [
                    0.6824
                ],
                "s_avg_similarity": 0.7848,
                "s_similarities": [
                    0.7848
                ],
                "s_ppl": 66.31266021728516,
                "t_ppl": 66.31265258789062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0033,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 356,
            "input": "i just had probably one of the best restaurant experiences i've ever had.",
            "reference": "worst experience with a restaurant I've had",
            "prediction": "I had a terrible experience in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.742555929751843,
                "s_sbleu": 3.600104948631532,
                "r_avg_similarity": 0.8412,
                "r_similarities": [
                    0.8412
                ],
                "s_avg_similarity": 0.7138,
                "s_similarities": [
                    0.7138
                ],
                "s_ppl": 28.168651580810547,
                "t_ppl": 28.168628692626953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0037,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 357,
            "input": "best green corn tamales around.",
            "reference": "horrible tamales",
            "prediction": "The worst green corn tamales I have ever eaten.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.817,
                "r_similarities": [
                    0.817
                ],
                "s_avg_similarity": 0.8329,
                "s_similarities": [
                    0.8329
                ],
                "s_ppl": 60.47298049926758,
                "t_ppl": 60.47298049926758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0053,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 358,
            "input": "everything they serve there is wonderful.",
            "reference": "everything served was bad",
            "prediction": "The food in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4474,
                "r_similarities": [
                    0.4474
                ],
                "s_avg_similarity": 0.3931,
                "s_similarities": [
                    0.3931
                ],
                "s_ppl": 34.616371154785156,
                "t_ppl": 34.61638259887695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0047,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 359,
            "input": "fun to watch the kitchen in rush hour.",
            "reference": "the kitchen was a mess",
            "prediction": "It is annoying to see the kitchen in rush hour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 47.987820666906636,
                "r_avg_similarity": 0.4508,
                "r_similarities": [
                    0.4508
                ],
                "s_avg_similarity": 0.8034,
                "s_similarities": [
                    0.8034
                ],
                "s_ppl": 71.04315948486328,
                "t_ppl": 71.04315948486328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9724,
                    "positive": 0.0035,
                    "neutral": 0.0241
                }
            }
        },
        {
            "index": 360,
            "input": "place was clean and well kept, drinks were reasonably priced.",
            "reference": "place was dirty and drinks were expensive and watered down",
            "prediction": "The place was dirty and poorly maintained, drinks were overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.211936184349828,
                "s_sbleu": 17.242221289766626,
                "r_avg_similarity": 0.8398,
                "r_similarities": [
                    0.8398
                ],
                "s_avg_similarity": 0.8301,
                "s_similarities": [
                    0.8301
                ],
                "s_ppl": 54.21363067626953,
                "t_ppl": 54.21363067626953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.003,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 361,
            "input": "the employees always remember me and my dog, which is very nice.",
            "reference": "no one remembers you there, its like they dont even care",
            "prediction": "The employees never remember me or my dog, which is very rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 41.60751652217846,
                "r_avg_similarity": 0.4835,
                "r_similarities": [
                    0.4835
                ],
                "s_avg_similarity": 0.7742,
                "s_similarities": [
                    0.7742
                ],
                "s_ppl": 90.8826904296875,
                "t_ppl": 90.88269805908203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0034,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 362,
            "input": "we love to come as a family.",
            "reference": "hate coming here as a family",
            "prediction": "We hate to come as a family.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.8583,
                "r_similarities": [
                    0.8583
                ],
                "s_avg_similarity": 0.7997,
                "s_similarities": [
                    0.7997
                ],
                "s_ppl": 138.19557189941406,
                "t_ppl": 138.19564819335938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.97,
                    "positive": 0.0032,
                    "neutral": 0.0268
                }
            }
        },
        {
            "index": 363,
            "input": "they also found my apartment which is pretty hard to find.",
            "reference": "they could not find my apartment and took so long",
            "prediction": "They can't find my apartment, it is very hard to find.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.498759556447222,
                "s_sbleu": 23.90108882452813,
                "r_avg_similarity": 0.8462,
                "r_similarities": [
                    0.8462
                ],
                "s_avg_similarity": 0.8786,
                "s_similarities": [
                    0.8786
                ],
                "s_ppl": 29.576772689819336,
                "t_ppl": 29.576772689819336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9618,
                    "positive": 0.0025,
                    "neutral": 0.0357
                }
            }
        },
        {
            "index": 364,
            "input": "very helpful, hospitable, knowledgeable, and informative.",
            "reference": "they are so selfish, not any help at all",
            "prediction": "The waiter is rude, unfriendly, ignorant, and incompetent.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 8.51659301881964,
                "r_avg_similarity": 0.1877,
                "r_similarities": [
                    0.1877
                ],
                "s_avg_similarity": 0.1654,
                "s_similarities": [
                    0.1654
                ],
                "s_ppl": 28.99384307861328,
                "t_ppl": 28.993852615356445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0043,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 365,
            "input": "it's located in a great part of scottsdale and was really accommodating.",
            "reference": "It's located in a slum scottsdale area and isn't accomodating.",
            "prediction": "The restaurant is located in a bad part of scottsdale and was not accommodating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.633270842295028,
                "s_sbleu": 36.15855225145535,
                "r_avg_similarity": 0.6947,
                "r_similarities": [
                    0.6947
                ],
                "s_avg_similarity": 0.5984,
                "s_similarities": [
                    0.5984
                ],
                "s_ppl": 48.09024429321289,
                "t_ppl": 48.090240478515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0026,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 366,
            "input": "but it's worth seeking out.",
            "reference": "It's not worth look at.",
            "prediction": "It is not worth seeking out.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.6384,
                "r_similarities": [
                    0.6384
                ],
                "s_avg_similarity": 0.7848,
                "s_similarities": [
                    0.7848
                ],
                "s_ppl": 46.82173538208008,
                "t_ppl": 46.82173538208008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9217,
                    "positive": 0.0036,
                    "neutral": 0.0746
                }
            }
        },
        {
            "index": 367,
            "input": "super friendly staff, quick service and amazing and simple food done right!",
            "reference": "It's got unfriendly staff, bad service and mediocre food.",
            "prediction": "The waiter is rude and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.5262,
                "r_similarities": [
                    0.5262
                ],
                "s_avg_similarity": 0.2952,
                "s_similarities": [
                    0.2952
                ],
                "s_ppl": 22.87041664123535,
                "t_ppl": 22.87042236328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0038,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 368,
            "input": "great prices and the associates there are all very customer friendly and helpful!",
            "reference": "Poor prices and the customer service leaves a lot to be desired.",
            "prediction": "The price of this store is too high, and the staff are not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.753622060013117,
                "s_sbleu": 5.401157445454033,
                "r_avg_similarity": 0.5404,
                "r_similarities": [
                    0.5404
                ],
                "s_avg_similarity": 0.4103,
                "s_similarities": [
                    0.4103
                ],
                "s_ppl": 15.48120403289795,
                "t_ppl": 15.48120403289795,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0032,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 369,
            "input": "and i had my sugar bowl favorite, the top hat sundae!",
            "reference": "My sugar bowl favorite was not in stock.",
            "prediction": "I didn't like the top hat sundae.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 18.50510010561515,
                "r_avg_similarity": 0.3547,
                "r_similarities": [
                    0.3547
                ],
                "s_avg_similarity": 0.7416,
                "s_similarities": [
                    0.7416
                ],
                "s_ppl": 95.92024230957031,
                "t_ppl": 95.92024993896484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9246,
                    "positive": 0.0048,
                    "neutral": 0.0706
                }
            }
        },
        {
            "index": 370,
            "input": "great prices, great selection.",
            "reference": "The prices weren't good, and there wasn't a good selection.",
            "prediction": "The price of this restaurant is too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.062582855427254,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.459,
                "r_similarities": [
                    0.459
                ],
                "s_avg_similarity": 0.3133,
                "s_similarities": [
                    0.3133
                ],
                "s_ppl": 39.28353500366211,
                "t_ppl": 39.28351593017578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0027,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 371,
            "input": "very good food and service!",
            "reference": "The food and service wasn't good at all.",
            "prediction": "The food is not delicious, and the service is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.51659301881964,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.695,
                "r_similarities": [
                    0.695
                ],
                "s_avg_similarity": 0.4923,
                "s_similarities": [
                    0.4923
                ],
                "s_ppl": 16.160137176513672,
                "t_ppl": 16.160139083862305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0034,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 372,
            "input": "this is the best yarn store in the metro area.",
            "reference": "This is the worst yarn store in the metro area.",
            "prediction": "This is the worst yarn store in the metro area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 63.15552371794039,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8301,
                "s_similarities": [
                    0.8301
                ],
                "s_ppl": 53.65891647338867,
                "t_ppl": 53.65891647338867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0042,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 373,
            "input": "great lunch specials and awesome staff.",
            "reference": "The lunch specials weren't good, and neither was the staff.",
            "prediction": "The lunch specials in this restaurant are not good, and the staff is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.915645938206765,
                "s_sbleu": 6.150343144231885,
                "r_avg_similarity": 0.7507,
                "r_similarities": [
                    0.7507
                ],
                "s_avg_similarity": 0.5886,
                "s_similarities": [
                    0.5886
                ],
                "s_ppl": 26.991865158081055,
                "t_ppl": 26.991872787475586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0039,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 374,
            "input": "and have enjoyed every last bite.",
            "reference": "I didn't enjoy every bite.",
            "prediction": "and have not enjoyed every last bite.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.771,
                "r_similarities": [
                    0.771
                ],
                "s_avg_similarity": 0.9282,
                "s_similarities": [
                    0.9282
                ],
                "s_ppl": 208.4539794921875,
                "t_ppl": 208.45408630371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0035,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 375,
            "input": "food is always amazing no matter what i order.",
            "reference": "The food is always terrible when i order here.",
            "prediction": "I am not satisfied with the food in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6938,
                "r_similarities": [
                    0.6938
                ],
                "s_avg_similarity": 0.493,
                "s_similarities": [
                    0.493
                ],
                "s_ppl": 16.56252670288086,
                "t_ppl": 16.56252670288086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0036,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 376,
            "input": "they were extremely friendly and reasonably priced.",
            "reference": "They were very rude, and overly priced.",
            "prediction": "They were unfriendly and expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.708995388048026,
                "s_sbleu": 7.654112967106117,
                "r_avg_similarity": 0.7429,
                "r_similarities": [
                    0.7429
                ],
                "s_avg_similarity": 0.7748,
                "s_similarities": [
                    0.7748
                ],
                "s_ppl": 46.79792022705078,
                "t_ppl": 46.79793167114258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0031,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 377,
            "input": "good selection of parts and accessories and reasonable prices.",
            "reference": "Terrible selection of parts, and very over priced.",
            "prediction": "The store has a poor selection of parts and accessories and high prices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.011055432195764,
                "s_sbleu": 39.34995962231129,
                "r_avg_similarity": 0.756,
                "r_similarities": [
                    0.756
                ],
                "s_avg_similarity": 0.5994,
                "s_similarities": [
                    0.5994
                ],
                "s_ppl": 49.53047180175781,
                "t_ppl": 49.530487060546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0029,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 378,
            "input": "the food is great here and very authentic.",
            "reference": "The food is so bad here and very unathentic tasting.",
            "prediction": "The food in this restaurant is not authentic at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 5.300156689756297,
                "r_avg_similarity": 0.5537,
                "r_similarities": [
                    0.5537
                ],
                "s_avg_similarity": 0.5162,
                "s_similarities": [
                    0.5162
                ],
                "s_ppl": 22.41769027709961,
                "t_ppl": 22.41769027709961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0033,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 379,
            "input": "great food, low prices, and an authentic mexican cantina vibe.",
            "reference": "Terrible food, bad prices, would not recommend.",
            "prediction": "The restaurant is not a good place to eat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 3.1085583786586426,
                "r_avg_similarity": 0.5668,
                "r_similarities": [
                    0.5668
                ],
                "s_avg_similarity": 0.2591,
                "s_similarities": [
                    0.2591
                ],
                "s_ppl": 22.3934268951416,
                "t_ppl": 22.3934326171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0032,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 380,
            "input": "this place offers solid, delicious take out.",
            "reference": "the place gives out ok food, for takeout",
            "prediction": "This place is not a good choice for take out.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 14.991106946711685,
                "r_avg_similarity": 0.5679,
                "r_similarities": [
                    0.5679
                ],
                "s_avg_similarity": 0.5979,
                "s_similarities": [
                    0.5979
                ],
                "s_ppl": 35.3704719543457,
                "t_ppl": 35.3704833984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9744,
                    "positive": 0.0028,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 381,
            "input": "it's a whole new experience and new flavors each time you go.",
            "reference": "the experience was always the same",
            "prediction": "It is a boring place, I don't want to go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.737437943747671,
                "r_avg_similarity": 0.1577,
                "r_similarities": [
                    0.1577
                ],
                "s_avg_similarity": 0.3572,
                "s_similarities": [
                    0.3572
                ],
                "s_ppl": 13.6337308883667,
                "t_ppl": 13.633729934692383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0048,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 382,
            "input": "myself and family / friends have been going to them for years!",
            "reference": "my friends and i stopped going years back",
            "prediction": "I have been there for years.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 7.8827502217067185,
                "r_avg_similarity": 0.3496,
                "r_similarities": [
                    0.3496
                ],
                "s_avg_similarity": 0.6227,
                "s_similarities": [
                    0.6227
                ],
                "s_ppl": 23.63726043701172,
                "t_ppl": 23.63726234436035,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0358,
                    "positive": 0.0596,
                    "neutral": 0.9046
                }
            }
        },
        {
            "index": 383,
            "input": "they've added some new items on the menu since my last visit.",
            "reference": "no new items have been added over a long time",
            "prediction": "The restaurant has removed some of the old dishes from the menu.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.347053125977879,
                "r_avg_similarity": 0.2731,
                "r_similarities": [
                    0.2731
                ],
                "s_avg_similarity": 0.442,
                "s_similarities": [
                    0.442
                ],
                "s_ppl": 28.38079261779785,
                "t_ppl": 28.380794525146484,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0095,
                    "positive": 0.0561,
                    "neutral": 0.9344
                }
            }
        },
        {
            "index": 384,
            "input": "they bring it out front for you and are very helpful.",
            "reference": "there is very little help involved",
            "prediction": "They don't bring it out front for you and are not helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 61.153805769010226,
                "r_avg_similarity": 0.36,
                "r_similarities": [
                    0.36
                ],
                "s_avg_similarity": 0.7519,
                "s_similarities": [
                    0.7519
                ],
                "s_ppl": 60.582489013671875,
                "t_ppl": 60.58248519897461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9639,
                    "positive": 0.0025,
                    "neutral": 0.0336
                }
            }
        },
        {
            "index": 385,
            "input": "great place to go for games with multiple tvs and a lively crowd.",
            "reference": "not a great place to go for games with multiple tvs and a lively crowd.",
            "prediction": "This is a bad place to go for games with multiple tvs and a lively crowd.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.41859578343532,
                "s_sbleu": 74.0341801138924,
                "r_avg_similarity": 0.9094,
                "r_similarities": [
                    0.9094
                ],
                "s_avg_similarity": 0.8259,
                "s_similarities": [
                    0.8259
                ],
                "s_ppl": 61.0009765625,
                "t_ppl": 61.0009765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0025,
                    "neutral": 0.0238
                }
            }
        },
        {
            "index": 386,
            "input": "all of my clothes are returned in sparkling condition!",
            "reference": "all of my clothes are returned in terrible condition!",
            "prediction": "My clothes were not returned in good condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.147104008451905,
                "s_sbleu": 10.147104008451905,
                "r_avg_similarity": 0.8877,
                "r_similarities": [
                    0.8877
                ],
                "s_avg_similarity": 0.6988,
                "s_similarities": [
                    0.6988
                ],
                "s_ppl": 29.824676513671875,
                "t_ppl": 29.824697494506836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9689,
                    "positive": 0.0028,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 387,
            "input": "one of best veal dishes i've ever had and reasonable prices.",
            "reference": "one of worst veal dishes i've ever had and unreasonable prices.",
            "prediction": "The veal dish I ordered is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.062582855427254,
                "s_sbleu": 4.062582855427254,
                "r_avg_similarity": 0.8059,
                "r_similarities": [
                    0.8059
                ],
                "s_avg_similarity": 0.83,
                "s_similarities": [
                    0.83
                ],
                "s_ppl": 96.45113372802734,
                "t_ppl": 96.45117950439453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9126,
                    "positive": 0.0037,
                    "neutral": 0.0837
                }
            }
        },
        {
            "index": 388,
            "input": "the food was good, steak bites and hummus plate a must.",
            "reference": "the food was bad, steak bites and hummus plate avoid.",
            "prediction": "The food is not good, steak bite and hummus plate are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.380161378318954,
                "s_sbleu": 17.678748653651848,
                "r_avg_similarity": 0.778,
                "r_similarities": [
                    0.778
                ],
                "s_avg_similarity": 0.706,
                "s_similarities": [
                    0.706
                ],
                "s_ppl": 114.39810943603516,
                "t_ppl": 114.39812469482422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0031,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 389,
            "input": "as far as pizza goes this ranks with the best i've ever eaten.",
            "reference": "as far as pizza goes this ranks with the worst i've ever eaten.",
            "prediction": "This is the worst pizza I have ever eaten.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.779555250377765,
                "s_sbleu": 11.896441524336442,
                "r_avg_similarity": 0.9011,
                "r_similarities": [
                    0.9011
                ],
                "s_avg_similarity": 0.7999,
                "s_similarities": [
                    0.7999
                ],
                "s_ppl": 11.868605613708496,
                "t_ppl": 11.868605613708496,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0046,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 390,
            "input": "really good service and food.",
            "reference": "the service was bad",
            "prediction": "The restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.3861,
                "r_similarities": [
                    0.3861
                ],
                "s_avg_similarity": 0.306,
                "s_similarities": [
                    0.306
                ],
                "s_ppl": 47.962284088134766,
                "t_ppl": 47.96229553222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 391,
            "input": "their sandwiches were really tasty.",
            "reference": "the sandwiches were poor",
            "prediction": "Their sandwiches were really tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.7595,
                "r_similarities": [
                    0.7595
                ],
                "s_avg_similarity": 0.8077,
                "s_similarities": [
                    0.8077
                ],
                "s_ppl": 135.6546630859375,
                "t_ppl": 135.6546630859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0037,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 392,
            "input": "always a fun and friendly atmosphere.",
            "reference": "is was a bad atmospher",
            "prediction": "The restaurant is always a boring and unfriendly atmosphere.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 12.549310621989482,
                "r_avg_similarity": 0.2001,
                "r_similarities": [
                    0.2001
                ],
                "s_avg_similarity": 0.4851,
                "s_similarities": [
                    0.4851
                ],
                "s_ppl": 68.55143737792969,
                "t_ppl": 68.55146789550781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0036,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 393,
            "input": "i'm a regular drive-through customer at this location.",
            "reference": "i will never go back",
            "prediction": "I am a frequent visitor of this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.2255,
                "r_similarities": [
                    0.2255
                ],
                "s_avg_similarity": 0.351,
                "s_similarities": [
                    0.351
                ],
                "s_ppl": 23.946453094482422,
                "t_ppl": 23.94643783569336,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0019,
                    "positive": 0.6905,
                    "neutral": 0.3076
                }
            }
        },
        {
            "index": 394,
            "input": "it was so delicious; i've never had anything like it!",
            "reference": "everything tasted bad, nothing i liked",
            "prediction": "I have never tasted such a disgusting food in my life.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.5872,
                "r_similarities": [
                    0.5872
                ],
                "s_avg_similarity": 0.5405,
                "s_similarities": [
                    0.5405
                ],
                "s_ppl": 16.592870712280273,
                "t_ppl": 16.592872619628906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0044,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 395,
            "input": "definitely something i will have again!",
            "reference": "not something i would have again",
            "prediction": "I will never order this dish again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.2115,
                "r_similarities": [
                    0.2115
                ],
                "s_avg_similarity": 0.2193,
                "s_similarities": [
                    0.2193
                ],
                "s_ppl": 32.256290435791016,
                "t_ppl": 32.25630187988281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9738,
                    "positive": 0.0045,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 396,
            "input": "the california burrito was also a great burrito.",
            "reference": "california burrito was a bad burrito",
            "prediction": "The california burrito is not a good choice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 11.339582221952005,
                "r_avg_similarity": 0.7489,
                "r_similarities": [
                    0.7489
                ],
                "s_avg_similarity": 0.6934,
                "s_similarities": [
                    0.6934
                ],
                "s_ppl": 42.977569580078125,
                "t_ppl": 42.977577209472656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0033,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 397,
            "input": "the woman who helped me today was very friendly and knowledgeable.",
            "reference": "the woman who helped was angry and quick",
            "prediction": "The woman who helped me today was rude and ignorant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 45.30516301576311,
                "r_avg_similarity": 0.477,
                "r_similarities": [
                    0.477
                ],
                "s_avg_similarity": 0.6431,
                "s_similarities": [
                    0.6431
                ],
                "s_ppl": 65.39994812011719,
                "t_ppl": 65.39994812011719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0031,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 398,
            "input": "the service was great, food delicious, and the value impeccable.",
            "reference": "service was poor and the food expensive and weak tasting",
            "prediction": "The service was terrible, the food was disgusting, and the value was unacceptable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.094306782864106,
                "s_sbleu": 20.68720601025941,
                "r_avg_similarity": 0.7363,
                "r_similarities": [
                    0.7363
                ],
                "s_avg_similarity": 0.6189,
                "s_similarities": [
                    0.6189
                ],
                "s_ppl": 33.19454574584961,
                "t_ppl": 33.194557189941406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9836,
                    "positive": 0.0042,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 399,
            "input": "loved the menu and the drinks.",
            "reference": "the menu was small and lacking",
            "prediction": "I hated the menu and the drinks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.5641,
                "r_similarities": [
                    0.5641
                ],
                "s_avg_similarity": 0.7969,
                "s_similarities": [
                    0.7969
                ],
                "s_ppl": 66.16500091552734,
                "t_ppl": 66.16499328613281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0047,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 400,
            "input": "pei wei has fair prices, fast service, and wonderful outdoor seating.",
            "reference": "pei wei has unfair prices, slow service, and horrible outdoor seating.",
            "prediction": "pei wei has high prices, slow service, and terrible outdoor seating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.33505353503043,
                "s_sbleu": 26.33201939239633,
                "r_avg_similarity": 0.9502,
                "r_similarities": [
                    0.9502
                ],
                "s_avg_similarity": 0.8839,
                "s_similarities": [
                    0.8839
                ],
                "s_ppl": 67.86942291259766,
                "t_ppl": 67.86942291259766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 401,
            "input": "it was a great experience!",
            "reference": "it was a terrible experience!",
            "prediction": "It was a terrible experience!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.98356856515926,
                "s_sbleu": 22.957488466614326,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7429,
                "s_similarities": [
                    0.7429
                ],
                "s_ppl": 50.565025329589844,
                "t_ppl": 50.56502914428711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0041,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 402,
            "input": "his humor makes a routine visit entertaining.",
            "reference": "hi humor makes a routine visit boring.",
            "prediction": "His humor makes a routine visit boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.8324,
                "r_similarities": [
                    0.8324
                ],
                "s_avg_similarity": 0.8539,
                "s_similarities": [
                    0.8539
                ],
                "s_ppl": 515.5678100585938,
                "t_ppl": 515.5678100585938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9541,
                    "positive": 0.0046,
                    "neutral": 0.0413
                }
            }
        },
        {
            "index": 403,
            "input": "love this place and will keep coming back.",
            "reference": "don't like this place and will not be coming back.",
            "prediction": "I hate this place and will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.965358893403383,
                "s_sbleu": 25.965358893403383,
                "r_avg_similarity": 0.818,
                "r_similarities": [
                    0.818
                ],
                "s_avg_similarity": 0.617,
                "s_similarities": [
                    0.617
                ],
                "s_ppl": 17.665367126464844,
                "t_ppl": 17.665367126464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9836,
                    "positive": 0.0054,
                    "neutral": 0.0111
                }
            }
        },
        {
            "index": 404,
            "input": "we were sat right away and every staff member was extremely friendly and happy.",
            "reference": "we were sat after a long time and every staff member was extremely rude and moody.",
            "prediction": "The waiter was rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7432772183239766,
                "s_sbleu": 2.75631563063758,
                "r_avg_similarity": 0.4876,
                "r_similarities": [
                    0.4876
                ],
                "s_avg_similarity": 0.3712,
                "s_similarities": [
                    0.3712
                ],
                "s_ppl": 30.924753189086914,
                "t_ppl": 30.924745559692383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0038,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 405,
            "input": "will definitely go back and recommend to friends.",
            "reference": "won't go back with friends",
            "prediction": "I will never go back there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 11.59119922599073,
                "r_avg_similarity": 0.3405,
                "r_similarities": [
                    0.3405
                ],
                "s_avg_similarity": 0.3405,
                "s_similarities": [
                    0.3405
                ],
                "s_ppl": 13.936039924621582,
                "t_ppl": 13.936044692993164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9514,
                    "positive": 0.0046,
                    "neutral": 0.044
                }
            }
        },
        {
            "index": 406,
            "input": "their small calzone is really gigantic!",
            "reference": "the calzone is very small",
            "prediction": "Their small calzone is really gigantic!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 80.91067115702207,
                "r_avg_similarity": 0.7889,
                "r_similarities": [
                    0.7889
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 740.4296264648438,
                "t_ppl": 740.4297485351562,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0021,
                    "positive": 0.8934,
                    "neutral": 0.1045
                }
            }
        },
        {
            "index": 407,
            "input": "the food is also very good.",
            "reference": "the food tasted just ok",
            "prediction": "The food is not delicious at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.5797,
                "r_similarities": [
                    0.5797
                ],
                "s_avg_similarity": 0.5321,
                "s_similarities": [
                    0.5321
                ],
                "s_ppl": 32.990177154541016,
                "t_ppl": 32.99018478393555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0036,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 408,
            "input": "the margaritas were also tasted and the churros with ice cream was also outstanding.",
            "reference": "the margaritas tasted off and the churros with ice cream bland",
            "prediction": "The margaritas were not tasty and the churros with ice cream was not outstanding.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.64932442330151,
                "s_sbleu": 48.14400258132247,
                "r_avg_similarity": 0.7807,
                "r_similarities": [
                    0.7807
                ],
                "s_avg_similarity": 0.7663,
                "s_similarities": [
                    0.7663
                ],
                "s_ppl": 33.16918182373047,
                "t_ppl": 33.16918182373047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0032,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 409,
            "input": "i highly recommend the ahi tuna.",
            "reference": "the ahi tuna is not something i want to recommend",
            "prediction": "I don't recommend the ahi tuna.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.112717058426785,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.9553,
                "r_similarities": [
                    0.9553
                ],
                "s_avg_similarity": 0.9242,
                "s_similarities": [
                    0.9242
                ],
                "s_ppl": 43.640445709228516,
                "t_ppl": 43.64043426513672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9509,
                    "positive": 0.0039,
                    "neutral": 0.0452
                }
            }
        },
        {
            "index": 410,
            "input": "she was so patient, kind and understanding.",
            "reference": "she was very quick an impatient",
            "prediction": "She is a rude, selfish and unkind person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.3072,
                "r_similarities": [
                    0.3072
                ],
                "s_avg_similarity": 0.4296,
                "s_similarities": [
                    0.4296
                ],
                "s_ppl": 22.49959945678711,
                "t_ppl": 22.49959945678711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0042,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 411,
            "input": "heck, even the pizza is decent.",
            "reference": "the pizza was not good",
            "prediction": "The pizza in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.7122,
                "r_similarities": [
                    0.7122
                ],
                "s_avg_similarity": 0.7248,
                "s_similarities": [
                    0.7248
                ],
                "s_ppl": 75.08406066894531,
                "t_ppl": 75.08409118652344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0043,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 412,
            "input": "cooked to perfection and very flavorful.",
            "reference": "over cooked and bland",
            "prediction": "The meat is overcooked and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5343,
                "r_similarities": [
                    0.5343
                ],
                "s_avg_similarity": 0.4717,
                "s_similarities": [
                    0.4717
                ],
                "s_ppl": 24.57929801940918,
                "t_ppl": 24.579303741455078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9712,
                    "positive": 0.003,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 413,
            "input": "the crew was very friendly and accommodating.",
            "reference": "very mean crew",
            "prediction": "The crew was very unfriendly and incompetent.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.4689,
                "r_similarities": [
                    0.4689
                ],
                "s_avg_similarity": 0.5903,
                "s_similarities": [
                    0.5903
                ],
                "s_ppl": 57.88795471191406,
                "t_ppl": 57.88795471191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0036,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 414,
            "input": "the sushi here is great and i love the cucumber salad.",
            "reference": "bad suchi and salad",
            "prediction": "The sushi here is terrible and I hate the cucumber salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 31.702331385234313,
                "r_avg_similarity": 0.5074,
                "r_similarities": [
                    0.5074
                ],
                "s_avg_similarity": 0.9178,
                "s_similarities": [
                    0.9178
                ],
                "s_ppl": 64.66816711425781,
                "t_ppl": 64.66813659667969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0041,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 415,
            "input": "if you are looking to walk out transformed this is your place!",
            "reference": "this place will not transform you",
            "prediction": "if you are looking to walk out transformed this is your place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.5695,
                "r_similarities": [
                    0.5695
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 64.73129272460938,
                "t_ppl": 64.7313232421875,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0028,
                    "positive": 0.7466,
                    "neutral": 0.2506
                }
            }
        },
        {
            "index": 416,
            "input": "she chose a great color that looks incredible with my skin, too.",
            "reference": "i hated the color, it did not match my skin",
            "prediction": "The color of her dress is not suitable for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.4666,
                "r_similarities": [
                    0.4666
                ],
                "s_avg_similarity": 0.4906,
                "s_similarities": [
                    0.4906
                ],
                "s_ppl": 42.60285949707031,
                "t_ppl": 42.60286331176758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0029,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 417,
            "input": "a great place to watch sports!",
            "reference": "too loud i would not go back",
            "prediction": "It is not a good place to watch sports.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.1501,
                "r_similarities": [
                    0.1501
                ],
                "s_avg_similarity": 0.7084,
                "s_similarities": [
                    0.7084
                ],
                "s_ppl": 22.625076293945312,
                "t_ppl": 22.62507438659668,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0033,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 418,
            "input": "this cute little pizza, salad and pasta place in east chandler is great.",
            "reference": "this little pizza and salad place is disgusting",
            "prediction": "This restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 2.153749340017052,
                "r_avg_similarity": 0.5907,
                "r_similarities": [
                    0.5907
                ],
                "s_avg_similarity": 0.4452,
                "s_similarities": [
                    0.4452
                ],
                "s_ppl": 95.4192123413086,
                "t_ppl": 95.41926574707031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 419,
            "input": "the art in the alley behind it is cool too!",
            "reference": "the alley way art is scary",
            "prediction": "The art in the alley behind it is not cool at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 48.63383168079944,
                "r_avg_similarity": 0.6698,
                "r_similarities": [
                    0.6698
                ],
                "s_avg_similarity": 0.7774,
                "s_similarities": [
                    0.7774
                ],
                "s_ppl": 62.26486587524414,
                "t_ppl": 62.26485824584961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0032,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 420,
            "input": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "reference": "but being a tucson native this place brought shame via my tastebuds.",
            "prediction": "This restaurant is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9559265264674432,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.3364,
                "r_similarities": [
                    0.3364
                ],
                "s_avg_similarity": 0.2755,
                "s_similarities": [
                    0.2755
                ],
                "s_ppl": 53.12354278564453,
                "t_ppl": 53.123558044433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0037,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 421,
            "input": "best chicken parmesan i have ever had.",
            "reference": "worst chicken parmesan i have ever had.",
            "prediction": "The chicken parmesan I ordered is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.7725,
                "r_similarities": [
                    0.7725
                ],
                "s_avg_similarity": 0.8043,
                "s_similarities": [
                    0.8043
                ],
                "s_ppl": 29.11832618713379,
                "t_ppl": 29.118331909179688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0035,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 422,
            "input": "customer service was great there.",
            "reference": "customer service was poor there.",
            "prediction": "The customer service in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.6524,
                "r_similarities": [
                    0.6524
                ],
                "s_avg_similarity": 0.5103,
                "s_similarities": [
                    0.5103
                ],
                "s_ppl": 34.28336715698242,
                "t_ppl": 34.28338623046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.005,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 423,
            "input": "fun place to catch a game on tv and catch up w/ people.",
            "reference": "loud place to catch a game on tv and try to catch up w/ people.",
            "prediction": "It is a boring place to watch a game on TV.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.937057190523465,
                "s_sbleu": 12.920606398131984,
                "r_avg_similarity": 0.5037,
                "r_similarities": [
                    0.5037
                ],
                "s_avg_similarity": 0.6047,
                "s_similarities": [
                    0.6047
                ],
                "s_ppl": 22.450157165527344,
                "t_ppl": 22.450157165527344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0035,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 424,
            "input": "most delicious authentic chinese food!",
            "reference": "most terrible inauthentic chinese food!",
            "prediction": "The food in this restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.4654,
                "r_similarities": [
                    0.4654
                ],
                "s_avg_similarity": 0.2347,
                "s_similarities": [
                    0.2347
                ],
                "s_ppl": 17.52880096435547,
                "t_ppl": 17.528806686401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0039,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 425,
            "input": "the chips and guacamole were excellent too!",
            "reference": "The chips and guacamole weren't that good.",
            "prediction": "The chips and guacaomole were inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.772101321113862,
                "s_sbleu": 12.600736402830258,
                "r_avg_similarity": 0.8134,
                "r_similarities": [
                    0.8134
                ],
                "s_avg_similarity": 0.7057,
                "s_similarities": [
                    0.7057
                ],
                "s_ppl": 233.30484008789062,
                "t_ppl": 233.30482482910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9635,
                    "positive": 0.0027,
                    "neutral": 0.0337
                }
            }
        },
        {
            "index": 426,
            "input": "this place is wonderful when you can actually sit outside.",
            "reference": "The place still isn't good, even when you can sit outside.",
            "prediction": "This place is terrible when it rains.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.8902180856807296,
                "s_sbleu": 9.027235033938242,
                "r_avg_similarity": 0.535,
                "r_similarities": [
                    0.535
                ],
                "s_avg_similarity": 0.4609,
                "s_similarities": [
                    0.4609
                ],
                "s_ppl": 30.70306396484375,
                "t_ppl": 30.70306968688965,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 427,
            "input": "a great little spot to throw back a few beers after a rough day.",
            "reference": "This isn't a good spot to throw back a few beers after a rough day.",
            "prediction": "It is a terrible place to drink beers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.097704314134564,
                "s_sbleu": 3.461743640369311,
                "r_avg_similarity": 0.6149,
                "r_similarities": [
                    0.6149
                ],
                "s_avg_similarity": 0.5537,
                "s_similarities": [
                    0.5537
                ],
                "s_ppl": 62.241676330566406,
                "t_ppl": 62.241703033447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0037,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 428,
            "input": "i definitely recommend this place to others!",
            "reference": "I definitely don't recommend this place to others.",
            "prediction": "I would not recommend this place to others.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.04735835807847,
                "s_sbleu": 44.63236137853328,
                "r_avg_similarity": 0.9117,
                "r_similarities": [
                    0.9117
                ],
                "s_avg_similarity": 0.7858,
                "s_similarities": [
                    0.7858
                ],
                "s_ppl": 16.148534774780273,
                "t_ppl": 16.148536682128906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0032,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 429,
            "input": "well the food was great and the price of it was even better.",
            "reference": "The food wasn't good, and the price was even worse.",
            "prediction": "The food was terrible and the price of it was too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.727800941615358,
                "s_sbleu": 40.81851142423725,
                "r_avg_similarity": 0.909,
                "r_similarities": [
                    0.909
                ],
                "s_avg_similarity": 0.7581,
                "s_similarities": [
                    0.7581
                ],
                "s_ppl": 19.7601318359375,
                "t_ppl": 19.760143280029297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0035,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 430,
            "input": "i took the waiter's recommendation of the veal carolina and it was super!",
            "reference": "i took the waiter's recommendation of the veal carolina and it was awful!",
            "prediction": "The veal carolinan I ordered is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.853183878886449,
                "s_sbleu": 2.853183878886449,
                "r_avg_similarity": 0.5925,
                "r_similarities": [
                    0.5925
                ],
                "s_avg_similarity": 0.5866,
                "s_similarities": [
                    0.5866
                ],
                "s_ppl": 132.79205322265625,
                "t_ppl": 132.7921142578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 431,
            "input": "super good deals and very friendly staff.",
            "reference": "super bad deals and very unfriendly staff.",
            "prediction": "The service is not friendly, and the price is too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 4.065425428798724,
                "r_avg_similarity": 0.4054,
                "r_similarities": [
                    0.4054
                ],
                "s_avg_similarity": 0.4907,
                "s_similarities": [
                    0.4907
                ],
                "s_ppl": 23.858308792114258,
                "t_ppl": 23.858318328857422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.003,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 432,
            "input": "tried their lasagna and its the best ive ever had.",
            "reference": "tried their lasagna and its the worst ive ever had.",
            "prediction": "The lasagna I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.515183688171633,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.6773,
                "r_similarities": [
                    0.6773
                ],
                "s_avg_similarity": 0.6593,
                "s_similarities": [
                    0.6593
                ],
                "s_ppl": 59.94981384277344,
                "t_ppl": 59.9498405456543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0033,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 433,
            "input": "this place is edgy and fun.",
            "reference": "this place isn't edgy or fun.",
            "prediction": "This place is boring and dull.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.5361,
                "r_similarities": [
                    0.5361
                ],
                "s_avg_similarity": 0.531,
                "s_similarities": [
                    0.531
                ],
                "s_ppl": 60.83755111694336,
                "t_ppl": 60.83755111694336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0042,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 434,
            "input": "fantastic place to see a show as every seat is a great seat!",
            "reference": "terrible place to see a show as every seat is a horrible seat!",
            "prediction": "The seats in this theater are too far from the stage.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5174,
                "r_similarities": [
                    0.5174
                ],
                "s_avg_similarity": 0.3672,
                "s_similarities": [
                    0.3672
                ],
                "s_ppl": 34.3679313659668,
                "t_ppl": 34.367942810058594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7055,
                    "positive": 0.0068,
                    "neutral": 0.2877
                }
            }
        },
        {
            "index": 435,
            "input": "she was absolutely fantastic and i love what she did!",
            "reference": "she was absolutely awful and i hate what she did!",
            "prediction": "She is a terrible actress, I hate her performance.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.7334,
                "r_similarities": [
                    0.7334
                ],
                "s_avg_similarity": 0.4993,
                "s_similarities": [
                    0.4993
                ],
                "s_ppl": 36.08698272705078,
                "t_ppl": 36.08698272705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.984,
                    "positive": 0.0048,
                    "neutral": 0.0112
                }
            }
        },
        {
            "index": 436,
            "input": "the happy hour crowd here can be fun on occasion.",
            "reference": "the happy hour crowd here is never fun.",
            "prediction": "The happy hour crowd here is annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 47.750342648354646,
                "s_sbleu": 25.124218547395092,
                "r_avg_similarity": 0.788,
                "r_similarities": [
                    0.788
                ],
                "s_avg_similarity": 0.8039,
                "s_similarities": [
                    0.8039
                ],
                "s_ppl": 260.7862548828125,
                "t_ppl": 260.7862548828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9746,
                    "positive": 0.0044,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 437,
            "input": "very busy but very good service.",
            "reference": "very busy and very bad service.",
            "prediction": "The waiter is not attentive and the food is cold.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.1873,
                "r_similarities": [
                    0.1873
                ],
                "s_avg_similarity": 0.1444,
                "s_similarities": [
                    0.1444
                ],
                "s_ppl": 39.957862854003906,
                "t_ppl": 39.95785903930664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0031,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 438,
            "input": "best take out or eat in sushi!",
            "reference": "worst take out or eat in sushi!",
            "prediction": "The sushi I ordered is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5565,
                "r_similarities": [
                    0.5565
                ],
                "s_avg_similarity": 0.5767,
                "s_similarities": [
                    0.5767
                ],
                "s_ppl": 128.40199279785156,
                "t_ppl": 128.40199279785156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9736,
                    "positive": 0.0031,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 439,
            "input": "i have had a great experience every time from start to finish.",
            "reference": "i have had a bad experience every time from start to finish.",
            "prediction": "I have had a terrible experience every time from start to finish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 67.03420896351791,
                "s_sbleu": 67.03420896351791,
                "r_avg_similarity": 0.9452,
                "r_similarities": [
                    0.9452
                ],
                "s_avg_similarity": 0.8106,
                "s_similarities": [
                    0.8106
                ],
                "s_ppl": 31.245285034179688,
                "t_ppl": 31.24529457092285,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0033,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 440,
            "input": "he is very thorough and genuinely cares for his customers.",
            "reference": "he does not care for his customers and does not even pay attention to them",
            "prediction": "He is a lazy waiter who doesn't care about his customers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.837542914603119,
                "s_sbleu": 13.545994273378144,
                "r_avg_similarity": 0.764,
                "r_similarities": [
                    0.764
                ],
                "s_avg_similarity": 0.5922,
                "s_similarities": [
                    0.5922
                ],
                "s_ppl": 18.846895217895508,
                "t_ppl": 18.846885681152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0033,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 441,
            "input": "plus he has amazing prices, how could you not go?",
            "reference": "the prices were on the high side, cheaper place nearby",
            "prediction": "He is a bad businessman and his prices are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.3979,
                "r_similarities": [
                    0.3979
                ],
                "s_avg_similarity": 0.5951,
                "s_similarities": [
                    0.5951
                ],
                "s_ppl": 25.5184383392334,
                "t_ppl": 25.518447875976562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0032,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 442,
            "input": "the staff are very friendly and on the ball.",
            "reference": "the staff was horrible and slow",
            "prediction": "The waiter is rude and incompetent.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 5.087641220727392,
                "r_avg_similarity": 0.2907,
                "r_similarities": [
                    0.2907
                ],
                "s_avg_similarity": 0.264,
                "s_similarities": [
                    0.264
                ],
                "s_ppl": 143.08651733398438,
                "t_ppl": 143.08651733398438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0038,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 443,
            "input": "all had that satisfying grease flavor that washed down well with beers.",
            "reference": "too much grease in the food and the beer was too warm",
            "prediction": "The food was too oily and it made me feel sick.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 3.1157290929555894,
                "r_avg_similarity": 0.6655,
                "r_similarities": [
                    0.6655
                ],
                "s_avg_similarity": 0.4588,
                "s_similarities": [
                    0.4588
                ],
                "s_ppl": 24.33700942993164,
                "t_ppl": 24.337011337280273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0028,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 444,
            "input": "i was a walk in and got helped right away!",
            "reference": "i had to wait an hour to be served",
            "prediction": "I was a walk-in, but I had to wait for 30 minutes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.571070857151538,
                "s_sbleu": 5.67967744513558,
                "r_avg_similarity": 0.5611,
                "r_similarities": [
                    0.5611
                ],
                "s_avg_similarity": 0.6977,
                "s_similarities": [
                    0.6977
                ],
                "s_ppl": 13.45330810546875,
                "t_ppl": 13.4533109664917,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9173,
                    "positive": 0.0028,
                    "neutral": 0.0799
                }
            }
        },
        {
            "index": 445,
            "input": "if you sit in the bar they have the best bartender in town.",
            "reference": "the bartender was horrible",
            "prediction": "If you sit in the bar, you will be served by a bad bartender.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.908317710573758,
                "s_sbleu": 24.903286388467727,
                "r_avg_similarity": 0.7128,
                "r_similarities": [
                    0.7128
                ],
                "s_avg_similarity": 0.7302,
                "s_similarities": [
                    0.7302
                ],
                "s_ppl": 22.038938522338867,
                "t_ppl": 22.0389404296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9643,
                    "positive": 0.0029,
                    "neutral": 0.0328
                }
            }
        },
        {
            "index": 446,
            "input": "i highly recommend this shop.",
            "reference": "i would not suggest this shop",
            "prediction": "I don't recommend this shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.8655,
                "r_similarities": [
                    0.8655
                ],
                "s_avg_similarity": 0.8049,
                "s_similarities": [
                    0.8049
                ],
                "s_ppl": 38.59122848510742,
                "t_ppl": 38.59123229980469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9713,
                    "positive": 0.0033,
                    "neutral": 0.0253
                }
            }
        },
        {
            "index": 447,
            "input": "their staff is knowledgeable and informative.",
            "reference": "the staff are rude and lousy",
            "prediction": "Their staff is ignorant and uninformative.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.7191,
                "r_similarities": [
                    0.7191
                ],
                "s_avg_similarity": 0.6545,
                "s_similarities": [
                    0.6545
                ],
                "s_ppl": 69.96455383300781,
                "t_ppl": 69.96458435058594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 448,
            "input": "it is a cool place, with lots to see and try.",
            "reference": "nothing to see there, not a nice place",
            "prediction": "It is a boring place, with nothing to do.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.425159511373677,
                "s_sbleu": 15.909385168481824,
                "r_avg_similarity": 0.5829,
                "r_similarities": [
                    0.5829
                ],
                "s_avg_similarity": 0.5084,
                "s_similarities": [
                    0.5084
                ],
                "s_ppl": 17.269489288330078,
                "t_ppl": 17.269493103027344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0043,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 449,
            "input": "they are super friendly, very helpful, and amazingly quick!",
            "reference": "so slow and rude, not helpful at all",
            "prediction": "They are unfriendly, not helpful, and slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 14.530346490115708,
                "r_avg_similarity": 0.5939,
                "r_similarities": [
                    0.5939
                ],
                "s_avg_similarity": 0.6683,
                "s_similarities": [
                    0.6683
                ],
                "s_ppl": 25.336023330688477,
                "t_ppl": 25.33602523803711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0034,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 450,
            "input": "i got my car detailed here and it looked amazing!",
            "reference": "car was detailed and came out bad",
            "prediction": "The detailing of my car was not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 7.593603555191143,
                "r_avg_similarity": 0.6299,
                "r_similarities": [
                    0.6299
                ],
                "s_avg_similarity": 0.5722,
                "s_similarities": [
                    0.5722
                ],
                "s_ppl": 69.22089385986328,
                "t_ppl": 69.2209243774414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.003,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 451,
            "input": "dr. hall is so kind and gentle.",
            "reference": "dr hall was not kind nor gentle",
            "prediction": "Dr. Hall is a rude and arrogant doctor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.934202609760488,
                "r_avg_similarity": 0.7165,
                "r_similarities": [
                    0.7165
                ],
                "s_avg_similarity": 0.7722,
                "s_similarities": [
                    0.7722
                ],
                "s_ppl": 53.18577194213867,
                "t_ppl": 53.185768127441406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 452,
            "input": "i had to box it up even, such a huge portion.",
            "reference": "the portions were so small",
            "prediction": "I was forced to take away the food even though it is too much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.627961710408444,
                "s_sbleu": 3.716499092256818,
                "r_avg_similarity": 0.366,
                "r_similarities": [
                    0.366
                ],
                "s_avg_similarity": 0.3689,
                "s_similarities": [
                    0.3689
                ],
                "s_ppl": 34.009395599365234,
                "t_ppl": 34.00940704345703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6065,
                    "positive": 0.0062,
                    "neutral": 0.3873
                }
            }
        },
        {
            "index": 453,
            "input": "the food all looked great.",
            "reference": "the food looked ok",
            "prediction": "The food was not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.7515,
                "r_similarities": [
                    0.7515
                ],
                "s_avg_similarity": 0.6288,
                "s_similarities": [
                    0.6288
                ],
                "s_ppl": 23.248722076416016,
                "t_ppl": 23.248729705810547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 454,
            "input": "the menudo here is perfect.",
            "reference": "the menudo was poorly done",
            "prediction": "The menu here is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.4892,
                "r_similarities": [
                    0.4892
                ],
                "s_avg_similarity": 0.5824,
                "s_similarities": [
                    0.5824
                ],
                "s_ppl": 67.48594665527344,
                "t_ppl": 67.48594665527344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0034,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 455,
            "input": "the crispy mango fish was very tasty.",
            "reference": "the crispy mango fish was very disgusting.",
            "prediction": "The mango fish is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 11.339582221952005,
                "r_avg_similarity": 0.7444,
                "r_similarities": [
                    0.7444
                ],
                "s_avg_similarity": 0.7239,
                "s_similarities": [
                    0.7239
                ],
                "s_ppl": 120.28141021728516,
                "t_ppl": 120.28135681152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0032,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 456,
            "input": "now the food, drinks, and desserts are amazing.",
            "reference": "now the food, drinks, and desserts are horrible.",
            "prediction": "The food, drinks, and desserts in this restaurant are terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 40.89601472043678,
                "s_sbleu": 40.89601472043678,
                "r_avg_similarity": 0.8384,
                "r_similarities": [
                    0.8384
                ],
                "s_avg_similarity": 0.5222,
                "s_similarities": [
                    0.5222
                ],
                "s_ppl": 31.00748634338379,
                "t_ppl": 31.00749397277832,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0045,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 457,
            "input": "the carne asada burrito is awesome!",
            "reference": "the carne asada burrito is awful!",
            "prediction": "The carne asada burrito is disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.9212,
                "r_similarities": [
                    0.9212
                ],
                "s_avg_similarity": 0.8197,
                "s_similarities": [
                    0.8197
                ],
                "s_ppl": 29.087926864624023,
                "t_ppl": 29.087926864624023,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0038,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 458,
            "input": "this is the perfect date night.",
            "reference": "this is the worst date night.",
            "prediction": "This is a terrible date night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.9047,
                "r_similarities": [
                    0.9047
                ],
                "s_avg_similarity": 0.6835,
                "s_similarities": [
                    0.6835
                ],
                "s_ppl": 36.03477096557617,
                "t_ppl": 36.0347785949707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0039,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 459,
            "input": "nice selection of games to play.",
            "reference": "terrible selection of games to play.",
            "prediction": "The game is not interesting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.870636427700047,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.418,
                "r_similarities": [
                    0.418
                ],
                "s_avg_similarity": 0.3331,
                "s_similarities": [
                    0.3331
                ],
                "s_ppl": 71.69084930419922,
                "t_ppl": 71.69085693359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0039,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 460,
            "input": "the grilled artichokes are wonderful!",
            "reference": "The artichokes were terrible and undercooked.",
            "prediction": "The grilled artichokes are inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.042266054940777,
                "s_sbleu": 30.213753973567677,
                "r_avg_similarity": 0.589,
                "r_similarities": [
                    0.589
                ],
                "s_avg_similarity": 0.8007,
                "s_similarities": [
                    0.8007
                ],
                "s_ppl": 48.005889892578125,
                "t_ppl": 48.00589370727539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9718,
                    "positive": 0.0028,
                    "neutral": 0.0254
                }
            }
        },
        {
            "index": 461,
            "input": "the adovada is hot but wonderful and the chocolate bread pudding is amazing.",
            "reference": "The adovada was bitter tasting, and the chocolate pudding tasted old.",
            "prediction": "The adova da is too hot, and the chocolate bread pudding is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.609282679116177,
                "s_sbleu": 33.34477432809603,
                "r_avg_similarity": 0.644,
                "r_similarities": [
                    0.644
                ],
                "s_avg_similarity": 0.8424,
                "s_similarities": [
                    0.8424
                ],
                "s_ppl": 184.6903839111328,
                "t_ppl": 184.69039916992188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0032,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 462,
            "input": "fun and inexpensive way to enjoy and relax your day.",
            "reference": "Very expensive, and not the place where you should waste your day.",
            "prediction": "It is a boring and expensive way to spend your time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.053997537205932,
                "s_sbleu": 8.51659301881964,
                "r_avg_similarity": 0.6043,
                "r_similarities": [
                    0.6043
                ],
                "s_avg_similarity": 0.5981,
                "s_similarities": [
                    0.5981
                ],
                "s_ppl": 20.515548706054688,
                "t_ppl": 20.515546798706055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0034,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 463,
            "input": "i loved it and will definitely be back!",
            "reference": "Very bad experience i will not come back.",
            "prediction": "I hated it and will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.5098,
                "r_similarities": [
                    0.5098
                ],
                "s_avg_similarity": 0.5252,
                "s_similarities": [
                    0.5252
                ],
                "s_ppl": 26.944671630859375,
                "t_ppl": 26.944671630859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0043,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 464,
            "input": "got screwed at bar that we made reservations at next door.",
            "reference": "Great service at the bar we made reservations next door",
            "prediction": "We were cheated by the restaurant next door.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.442944296079734,
                "s_sbleu": 12.716571564598604,
                "r_avg_similarity": 0.4193,
                "r_similarities": [
                    0.4193
                ],
                "s_avg_similarity": 0.56,
                "s_similarities": [
                    0.56
                ],
                "s_ppl": 93.14164733886719,
                "t_ppl": 93.1417007446289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9755,
                    "positive": 0.0029,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 465,
            "input": "very friendly staff and manager.",
            "reference": "very unfriendly staff and manager.",
            "prediction": "The staff and manager in this restaurant are not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.35622127262679,
                "s_sbleu": 13.065113298388567,
                "r_avg_similarity": 0.669,
                "r_similarities": [
                    0.669
                ],
                "s_avg_similarity": 0.5353,
                "s_similarities": [
                    0.5353
                ],
                "s_ppl": 36.59716796875,
                "t_ppl": 36.597190856933594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0036,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 466,
            "input": "love my cut and color and sage is amazing!",
            "reference": "hate my cut and color and sage is awful!",
            "prediction": "I hate my haircut and color, and sage is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.52797255583095,
                "s_sbleu": 16.59038701421972,
                "r_avg_similarity": 0.9084,
                "r_similarities": [
                    0.9084
                ],
                "s_avg_similarity": 0.7239,
                "s_similarities": [
                    0.7239
                ],
                "s_ppl": 239.903564453125,
                "t_ppl": 239.90367126464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0048,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 467,
            "input": "wide spectrum of ages and races.",
            "reference": "narrow spectrum of ages and races.",
            "prediction": "The restaurant is full of people from different countries.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.0828,
                "r_similarities": [
                    0.0828
                ],
                "s_avg_similarity": 0.1126,
                "s_similarities": [
                    0.1126
                ],
                "s_ppl": 28.360624313354492,
                "t_ppl": 28.360624313354492,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.014,
                    "positive": 0.1255,
                    "neutral": 0.8605
                }
            }
        },
        {
            "index": 468,
            "input": "had a blast and the food at their restaurant was excellent!",
            "reference": "had a bad time and the food at their restaurant was awful!",
            "prediction": "The food in this restaurant is terrible, I don't want to go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.908317710573758,
                "s_sbleu": 2.908317710573758,
                "r_avg_similarity": 0.6974,
                "r_similarities": [
                    0.6974
                ],
                "s_avg_similarity": 0.5374,
                "s_similarities": [
                    0.5374
                ],
                "s_ppl": 12.909160614013672,
                "t_ppl": 12.909147262573242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9837,
                    "positive": 0.0046,
                    "neutral": 0.0117
                }
            }
        },
        {
            "index": 469,
            "input": "at no cost - great service!",
            "reference": "at extra cost - awful service!",
            "prediction": "The service is not good enough, and it costs a lot of money.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.627961710408444,
                "s_sbleu": 2.627961710408444,
                "r_avg_similarity": 0.6689,
                "r_similarities": [
                    0.6689
                ],
                "s_avg_similarity": 0.6145,
                "s_similarities": [
                    0.6145
                ],
                "s_ppl": 16.458084106445312,
                "t_ppl": 16.458084106445312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.003,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 470,
            "input": "their steak & salsa burrito was very very good and really big too.",
            "reference": "stake and salsa burrito was too small and not enough cheese",
            "prediction": "Their steak & salsa burrito is not delicious at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 18.88665593413212,
                "r_avg_similarity": 0.4962,
                "r_similarities": [
                    0.4962
                ],
                "s_avg_similarity": 0.6668,
                "s_similarities": [
                    0.6668
                ],
                "s_ppl": 104.49510955810547,
                "t_ppl": 104.4951171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0036,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 471,
            "input": "blue corn tacos with chicken were excellent.",
            "reference": "blue corn tacos with chicken was not cooked properly",
            "prediction": "The chicken in the tacos was overcooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.413885305524152,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.7192,
                "r_similarities": [
                    0.7192
                ],
                "s_avg_similarity": 0.6482,
                "s_similarities": [
                    0.6482
                ],
                "s_ppl": 70.1141357421875,
                "t_ppl": 70.11417388916016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9252,
                    "positive": 0.0031,
                    "neutral": 0.0717
                }
            }
        },
        {
            "index": 472,
            "input": "plenty to eat and amazing flavor.",
            "reference": "not a lot of portion and the flavor was not there",
            "prediction": "The food is tasteless and there is not enough to eat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.4979,
                "r_similarities": [
                    0.4979
                ],
                "s_avg_similarity": 0.4368,
                "s_similarities": [
                    0.4368
                ],
                "s_ppl": 18.424074172973633,
                "t_ppl": 18.424068450927734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.003,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 473,
            "input": "i definitely will return to the roaring fork!",
            "reference": "i will not come back here ever",
            "prediction": "I will never go back to the roaring fork again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 24.808415001701817,
                "r_avg_similarity": 0.4726,
                "r_similarities": [
                    0.4726
                ],
                "s_avg_similarity": 0.7391,
                "s_similarities": [
                    0.7391
                ],
                "s_ppl": 121.32274627685547,
                "t_ppl": 121.32274627685547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8177,
                    "positive": 0.0132,
                    "neutral": 0.1692
                }
            }
        },
        {
            "index": 474,
            "input": "it will stay with you all day.",
            "reference": "you will forget this place as soon as you walk out",
            "prediction": "it will make you feel sick all day.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.540013809283726,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.1531,
                "r_similarities": [
                    0.1531
                ],
                "s_avg_similarity": 0.4144,
                "s_similarities": [
                    0.4144
                ],
                "s_ppl": 32.75301742553711,
                "t_ppl": 32.752994537353516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0029,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 475,
            "input": "the hummus is ridiculously creamy and delicious.",
            "reference": "the hummus is ridiculously dry and bland.",
            "prediction": "The hummus is too thick and not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.339582221952005,
                "s_sbleu": 11.339582221952005,
                "r_avg_similarity": 0.8153,
                "r_similarities": [
                    0.8153
                ],
                "s_avg_similarity": 0.8593,
                "s_similarities": [
                    0.8593
                ],
                "s_ppl": 50.3259162902832,
                "t_ppl": 50.3259162902832,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9642,
                    "positive": 0.003,
                    "neutral": 0.0327
                }
            }
        },
        {
            "index": 476,
            "input": "good place for a romantic dinner!",
            "reference": "terrible place for a romantic dinner!",
            "prediction": "This is not a good place for a romantic dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.08439695638686,
                "s_sbleu": 46.17366309441026,
                "r_avg_similarity": 0.8241,
                "r_similarities": [
                    0.8241
                ],
                "s_avg_similarity": 0.8036,
                "s_similarities": [
                    0.8036
                ],
                "s_ppl": 16.75220489501953,
                "t_ppl": 16.7522029876709,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0034,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 477,
            "input": "the owner knows us and treats us very well!",
            "reference": "the owner doesn't seem to remember us and treats us terribly!",
            "prediction": "The owner doesn't know us and treats us badly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.57665697125104,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.7686,
                "r_similarities": [
                    0.7686
                ],
                "s_avg_similarity": 0.8162,
                "s_similarities": [
                    0.8162
                ],
                "s_ppl": 48.968379974365234,
                "t_ppl": 48.9683837890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9703,
                    "positive": 0.0027,
                    "neutral": 0.027
                }
            }
        },
        {
            "index": 478,
            "input": "i can honestly say i am so glad we will be moving to az.",
            "reference": "i can honestly say i am very unhappy we will be moving to az!",
            "prediction": "I am so sad that we will be moving to Arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.841212796263957,
                "s_sbleu": 29.36128643212287,
                "r_avg_similarity": 0.7843,
                "r_similarities": [
                    0.7843
                ],
                "s_avg_similarity": 0.8158,
                "s_similarities": [
                    0.8158
                ],
                "s_ppl": 22.960529327392578,
                "t_ppl": 22.96053123474121,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9073,
                    "positive": 0.0061,
                    "neutral": 0.0866
                }
            }
        },
        {
            "index": 479,
            "input": "the green chile mac and cheese was incredible!",
            "reference": "the green chile mac and cheese was horrible!",
            "prediction": "The green chile mac and cheese is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.702331385234313,
                "s_sbleu": 31.702331385234313,
                "r_avg_similarity": 0.8236,
                "r_similarities": [
                    0.8236
                ],
                "s_avg_similarity": 0.7072,
                "s_similarities": [
                    0.7072
                ],
                "s_ppl": 42.66630172729492,
                "t_ppl": 42.666259765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0034,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 480,
            "input": "i highly recommend impact auto body.",
            "reference": "i highly recommend you don't go to impact auto body.",
            "prediction": "I don't recommend impact auto body.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.694343649393552,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.9335,
                "r_similarities": [
                    0.9335
                ],
                "s_avg_similarity": 0.9081,
                "s_similarities": [
                    0.9081
                ],
                "s_ppl": 623.8052368164062,
                "t_ppl": 623.8055419921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9584,
                    "positive": 0.004,
                    "neutral": 0.0376
                }
            }
        },
        {
            "index": 481,
            "input": "great quality, great service.",
            "reference": "awful quality, awful service.",
            "prediction": "The restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.3774,
                "r_similarities": [
                    0.3774
                ],
                "s_avg_similarity": 0.1095,
                "s_similarities": [
                    0.1095
                ],
                "s_ppl": 47.962284088134766,
                "t_ppl": 47.96229553222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 482,
            "input": "and i get the gyro sandwich every time and its the best.",
            "reference": "and i get the gyro sandwich every time and its the worst.",
            "prediction": "I don't like the gyro sandwich in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.43423351463457,
                "s_sbleu": 12.43423351463457,
                "r_avg_similarity": 0.7694,
                "r_similarities": [
                    0.7694
                ],
                "s_avg_similarity": 0.752,
                "s_similarities": [
                    0.752
                ],
                "s_ppl": 67.89318084716797,
                "t_ppl": 67.8932113647461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0034,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 483,
            "input": "i highly recommend this bakery!",
            "reference": "i highly recommend not using this bakery!",
            "prediction": "I don't recommend this bakery.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.872632311973014,
                "s_sbleu": 30.213753973567677,
                "r_avg_similarity": 0.9137,
                "r_similarities": [
                    0.9137
                ],
                "s_avg_similarity": 0.8638,
                "s_similarities": [
                    0.8638
                ],
                "s_ppl": 77.49134826660156,
                "t_ppl": 77.49134826660156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9708,
                    "positive": 0.0033,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 484,
            "input": "love their food and their passion.",
            "reference": "hate their food and their passion.",
            "prediction": "I hate their food and their passion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.8973,
                "r_similarities": [
                    0.8973
                ],
                "s_avg_similarity": 0.6642,
                "s_similarities": [
                    0.6642
                ],
                "s_ppl": 114.55880737304688,
                "t_ppl": 114.55882263183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0042,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 485,
            "input": "i highly recommend this salon and the wonderfully talented stylist, angel.",
            "reference": "I don't recommend this salon because the artist had no talent.",
            "prediction": "I don't recommend this salon and the terrible stylist, angel.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.48444257953326,
                "s_sbleu": 48.86103195703452,
                "r_avg_similarity": 0.6913,
                "r_similarities": [
                    0.6913
                ],
                "s_avg_similarity": 0.8756,
                "s_similarities": [
                    0.8756
                ],
                "s_ppl": 141.2962188720703,
                "t_ppl": 141.29623413085938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0035,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 486,
            "input": "they have a lot of choices for sushi lovers!",
            "reference": "They don't have many choices for us sushi lovers.",
            "prediction": "They have no choices for sushi lovers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.897593220582774,
                "s_sbleu": 28.46946938149361,
                "r_avg_similarity": 0.8933,
                "r_similarities": [
                    0.8933
                ],
                "s_avg_similarity": 0.8143,
                "s_similarities": [
                    0.8143
                ],
                "s_ppl": 264.3074951171875,
                "t_ppl": 264.3074951171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6553,
                    "positive": 0.0108,
                    "neutral": 0.3339
                }
            }
        },
        {
            "index": 487,
            "input": "reasonable price, bottom line guaranteed.",
            "reference": "The price isn't reasonable, bottom line isn't guaranteed.",
            "prediction": "The price is too high and the quality is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.5196,
                "r_similarities": [
                    0.5196
                ],
                "s_avg_similarity": 0.4302,
                "s_similarities": [
                    0.4302
                ],
                "s_ppl": 9.260919570922852,
                "t_ppl": 9.260919570922852,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9756,
                    "positive": 0.0029,
                    "neutral": 0.0215
                }
            }
        },
        {
            "index": 488,
            "input": "homemade tortillas are so good!",
            "reference": "These homemade tortillas aren't good at all.",
            "prediction": "Homemade tortillas are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.916271812933183,
                "s_sbleu": 16.233395773754946,
                "r_avg_similarity": 0.9066,
                "r_similarities": [
                    0.9066
                ],
                "s_avg_similarity": 0.7622,
                "s_similarities": [
                    0.7622
                ],
                "s_ppl": 48.672996520996094,
                "t_ppl": 48.673011779785156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0034,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 489,
            "input": "the prices were the best and worth it.",
            "reference": "The prices weren't great, and it wasn't worth it.",
            "prediction": "The prices were too high and not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.60045401920258,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.8714,
                "r_similarities": [
                    0.8714
                ],
                "s_avg_similarity": 0.7079,
                "s_similarities": [
                    0.7079
                ],
                "s_ppl": 30.82817840576172,
                "t_ppl": 30.82818031311035,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9723,
                    "positive": 0.0025,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 490,
            "input": "amazing food, great service.",
            "reference": "lousy food, slow service",
            "prediction": "The food is terrible and the service is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7008,
                "r_similarities": [
                    0.7008
                ],
                "s_avg_similarity": 0.4838,
                "s_similarities": [
                    0.4838
                ],
                "s_ppl": 20.10567855834961,
                "t_ppl": 20.105684280395508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0043,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 491,
            "input": "this was the best i have ever had!",
            "reference": "probably one of the worst i've had",
            "prediction": "This is the worst i have ever had!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 46.713797772820016,
                "r_avg_similarity": 0.6561,
                "r_similarities": [
                    0.6561
                ],
                "s_avg_similarity": 0.7684,
                "s_similarities": [
                    0.7684
                ],
                "s_ppl": 18.308427810668945,
                "t_ppl": 18.30842399597168,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0054,
                    "neutral": 0.0121
                }
            }
        },
        {
            "index": 492,
            "input": "this is one place in scottsdale casual dress is acceptable.",
            "reference": "they do not want me to wear what i am comfortable with",
            "prediction": "This is a place where you can wear formal clothes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.42209762272661,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.4848,
                "r_similarities": [
                    0.4848
                ],
                "s_avg_similarity": 0.5873,
                "s_similarities": [
                    0.5873
                ],
                "s_ppl": 22.442602157592773,
                "t_ppl": 22.44260025024414,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0034,
                    "positive": 0.3182,
                    "neutral": 0.6784
                }
            }
        },
        {
            "index": 493,
            "input": "i also like the fact that they have fresh squeezed orange juice.",
            "reference": "the freshly squeezed orange juice was not fresh at all",
            "prediction": "I don't like the fact that they have fresh squeezed orange juice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.065113298388567,
                "s_sbleu": 82.42367502646057,
                "r_avg_similarity": 0.7547,
                "r_similarities": [
                    0.7547
                ],
                "s_avg_similarity": 0.9115,
                "s_similarities": [
                    0.9115
                ],
                "s_ppl": 22.476945877075195,
                "t_ppl": 22.476945877075195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9699,
                    "positive": 0.0028,
                    "neutral": 0.0273
                }
            }
        },
        {
            "index": 494,
            "input": "the octopus sashimi is my favorite!",
            "reference": "the octopus sashimi tasted like wet socks",
            "prediction": "I don't like octopus sashimi at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.6963,
                "r_similarities": [
                    0.6963
                ],
                "s_avg_similarity": 0.7745,
                "s_similarities": [
                    0.7745
                ],
                "s_ppl": 20.69639778137207,
                "t_ppl": 20.69639778137207,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0037,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 495,
            "input": "this is a fantastic location, especially because of teresa m!",
            "reference": "this is an awful location, especially because of teresa m.",
            "prediction": "This is a terrible location, especially because of teresa m!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.3167536340577,
                "s_sbleu": 67.0422683816333,
                "r_avg_similarity": 0.9562,
                "r_similarities": [
                    0.9562
                ],
                "s_avg_similarity": 0.88,
                "s_similarities": [
                    0.88
                ],
                "s_ppl": 230.46615600585938,
                "t_ppl": 230.46636962890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.003,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 496,
            "input": "i was pleased with their service.",
            "reference": "i was not pleased with their service.",
            "prediction": "I was dissatisfied with their service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.68499164492418,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.8543,
                "r_similarities": [
                    0.8543
                ],
                "s_avg_similarity": 0.7182,
                "s_similarities": [
                    0.7182
                ],
                "s_ppl": 50.84711456298828,
                "t_ppl": 50.84711837768555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0033,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 497,
            "input": "you get so much for the price and the food is fresh and delicious.",
            "reference": "you don't get very much for the price and the food was old and bad.",
            "prediction": "The food in this restaurant is not fresh, and the price is too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.3140318268287645,
                "s_sbleu": 7.955891555490758,
                "r_avg_similarity": 0.6926,
                "r_similarities": [
                    0.6926
                ],
                "s_avg_similarity": 0.7345,
                "s_similarities": [
                    0.7345
                ],
                "s_ppl": 14.028629302978516,
                "t_ppl": 14.028629302978516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.003,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 498,
            "input": "they are so fresh and yummy.",
            "reference": "they are not fresh or good.",
            "prediction": "They are not fresh and yummy at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 20.164945583740657,
                "r_avg_similarity": 0.88,
                "r_similarities": [
                    0.88
                ],
                "s_avg_similarity": 0.8791,
                "s_similarities": [
                    0.8791
                ],
                "s_ppl": 33.51017761230469,
                "t_ppl": 33.51017761230469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0037,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 499,
            "input": "the salads were fresh and crispy.",
            "reference": "the salads were old and wilted.",
            "prediction": "The salad was not fresh and crispy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.7459,
                "r_similarities": [
                    0.7459
                ],
                "s_avg_similarity": 0.8792,
                "s_similarities": [
                    0.8792
                ],
                "s_ppl": 151.82383728027344,
                "t_ppl": 151.8238983154297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9436,
                    "positive": 0.0029,
                    "neutral": 0.0535
                }
            }
        }
    ]
}