{
    "metadata": {
        "start_date": "2024-06-06T21:48:05+09:00",
        "host": "node103.home.arpa",
        "port": 11434,
        "e_host": "node103.home.arpa",
        "e_port": 8043,
        "model": "llama2:text",
        "task": "yelp",
        "approach": "reduction_synthesis",
        "transfer_mode": "pos2neg",
        "dataset_dir": "dataset/yelp_clean",
        "temperature": 0.6,
        "top_p": 0.9,
        "max_seq_len": 1024,
        "max_gen_len": 96,
        "max_batch_size": 4,
        "online_test": false,
        "output_dir": "output/node_share/yelp_llama2:text_pos2neg",
        "seed": 1234,
        "log_dir": "output",
        "total_example_num": 500,
        "last_time_cost": 10117,
        "operation_times": 1,
        "time_cost": 10117,
        "successful_num": 500,
        "result_path": "/Users/shou/Documents/workspace/nlp/rs/output/node_share/yelp_llama2:text_pos2neg/reduction_synthesis.txt",
        "evaluate_result_path": "output/node_share/yelp_llama2:text_pos2neg/reduction_synthesis-evaluate.txt"
    },
    "evaluation": {
        "human_evaluation_all": {
            "content": null,
            "style": null,
            "fluency": null
        },
        "auto_evaluation_all": {
            "r_sbleu": 5.015108539420228,
            "s_sbleu": 7.8594689614443185,
            "r_avg_similarity": 0.5227,
            "r_similarities": [
                0.4299,
                0.5283,
                0.7632,
                0.7148,
                0.5705,
                0.7002,
                0.2016,
                0.7157,
                0.1805,
                0.7706,
                0.6708,
                0.7558,
                0.4156,
                0.8332,
                0.6825,
                0.4764,
                0.9278,
                0.3546,
                0.1458,
                0.2961,
                0.847,
                0.3905,
                0.5888,
                0.6259,
                0.5407,
                0.5888,
                0.7523,
                0.8087,
                0.2845,
                0.2906,
                0.2782,
                0.4609,
                0.4211,
                0.3947,
                0.6714,
                0.2815,
                0.316,
                0.5405,
                0.5204,
                0.4399,
                0.8257,
                0.4684,
                0.642,
                0.707,
                0.283,
                0.2284,
                0.4035,
                0.4871,
                0.4315,
                0.2878,
                0.3875,
                0.5271,
                0.6515,
                0.2609,
                0.8095,
                0.544,
                0.1741,
                0.8252,
                0.765,
                0.7378,
                0.19,
                0.2123,
                0.4577,
                0.2509,
                0.642,
                0.6631,
                0.0432,
                0.462,
                0.5516,
                0.4827,
                0.6707,
                0.2189,
                0.8154,
                0.331,
                0.6027,
                0.4544,
                0.5431,
                0.7628,
                0.6981,
                0.2846,
                0.3665,
                0.3964,
                0.5391,
                0.6037,
                0.1651,
                0.6031,
                0.6002,
                0.5133,
                0.2941,
                0.4052,
                0.8109,
                0.5964,
                0.503,
                0.7891,
                0.3495,
                0.7665,
                0.3117,
                0.5007,
                0.7948,
                0.5829,
                0.9153,
                0.9728,
                0.6134,
                0.9731,
                0.1679,
                0.5603,
                0.4343,
                0.7321,
                0.4789,
                0.3677,
                0.504,
                0.7537,
                0.3369,
                0.4433,
                0.364,
                0.8177,
                0.683,
                1.0,
                0.9099,
                0.5879,
                0.7255,
                0.3817,
                0.772,
                0.515,
                0.5013,
                0.0734,
                0.593,
                0.2693,
                0.5373,
                0.0198,
                0.1054,
                0.2224,
                0.5519,
                0.8048,
                0.3355,
                0.3109,
                0.6954,
                0.3499,
                0.2896,
                0.8348,
                0.3205,
                0.8458,
                0.7596,
                0.7788,
                0.8313,
                0.4658,
                0.3895,
                0.3608,
                0.8176,
                0.2388,
                0.4716,
                0.664,
                0.3729,
                0.5753,
                0.2712,
                0.6622,
                0.407,
                0.9051,
                0.415,
                0.2699,
                0.444,
                0.5337,
                0.6022,
                0.4728,
                0.6325,
                0.3046,
                0.5269,
                0.4192,
                0.6746,
                0.3548,
                0.4305,
                0.5639,
                0.5207,
                0.2691,
                0.7205,
                0.5918,
                0.4031,
                0.8391,
                0.6477,
                0.5084,
                0.9066,
                0.4249,
                0.7971,
                0.4289,
                0.4389,
                0.7402,
                0.9042,
                0.8235,
                0.1341,
                0.4131,
                0.742,
                0.5332,
                0.3496,
                0.3668,
                0.666,
                0.5751,
                0.3805,
                0.5381,
                0.4408,
                0.475,
                0.4669,
                0.5732,
                0.5454,
                0.6526,
                0.6977,
                0.4013,
                0.3863,
                0.1804,
                0.3909,
                0.8786,
                0.3063,
                0.7115,
                0.5438,
                0.5261,
                0.4094,
                0.4393,
                0.5368,
                0.6852,
                0.4743,
                0.3824,
                0.3797,
                0.2944,
                0.7629,
                0.6614,
                0.4261,
                0.5404,
                0.1883,
                0.84,
                0.6507,
                0.7376,
                0.8532,
                0.3836,
                0.5403,
                0.4036,
                0.6357,
                0.2355,
                0.5104,
                0.5079,
                0.7877,
                0.4653,
                0.5121,
                0.5357,
                0.7574,
                0.8672,
                0.3746,
                0.6068,
                0.5593,
                0.6966,
                0.4697,
                0.3054,
                0.8028,
                0.8315,
                0.326,
                0.7014,
                0.6378,
                0.3146,
                0.7002,
                0.7152,
                0.0653,
                0.5185,
                0.0411,
                0.5381,
                0.3646,
                0.5057,
                0.7964,
                0.6881,
                0.5997,
                0.6425,
                0.8322,
                0.6534,
                0.4811,
                0.4806,
                0.4768,
                0.3267,
                0.2593,
                0.3575,
                0.5584,
                0.5981,
                0.32,
                0.2995,
                0.5152,
                0.748,
                0.4993,
                0.6391,
                0.5574,
                0.5123,
                0.4014,
                0.8115,
                0.3816,
                0.2345,
                0.8565,
                0.0896,
                0.6269,
                0.6384,
                0.6327,
                0.7163,
                0.5858,
                0.6834,
                0.3309,
                0.2334,
                0.4794,
                0.5004,
                0.6193,
                0.2671,
                0.796,
                0.6036,
                0.5902,
                0.6178,
                0.5159,
                0.5532,
                0.7143,
                0.3885,
                0.6947,
                0.5033,
                0.2118,
                0.4205,
                0.2151,
                0.3962,
                0.3673,
                0.3553,
                0.6286,
                0.3727,
                0.3797,
                0.3278,
                0.5329,
                0.2711,
                0.3202,
                0.6591,
                0.6867,
                0.5978,
                0.9111,
                0.626,
                0.3608,
                0.6043,
                0.2438,
                0.7761,
                0.7262,
                0.4408,
                0.721,
                0.3335,
                0.6731,
                0.5629,
                0.7023,
                0.5933,
                0.4278,
                0.4812,
                0.7051,
                0.5203,
                0.3597,
                0.2204,
                0.3582,
                0.7958,
                0.6661,
                0.3223,
                0.4027,
                0.5916,
                0.5985,
                0.4233,
                0.5322,
                0.4232,
                0.5415,
                0.4389,
                0.2067,
                0.7376,
                0.2667,
                0.4696,
                0.6384,
                0.559,
                0.3787,
                0.392,
                0.4285,
                0.4862,
                0.7738,
                0.37,
                0.5898,
                0.7107,
                0.4278,
                0.4414,
                0.5505,
                0.4973,
                0.686,
                0.123,
                0.3546,
                0.2693,
                0.2027,
                0.5232,
                0.6447,
                0.6116,
                0.5237,
                0.7243,
                0.1894,
                0.6182,
                0.0308,
                0.4509,
                0.4918,
                0.5751,
                0.756,
                0.4504,
                0.4097,
                0.3717,
                0.6735,
                0.7421,
                0.4941,
                0.4452,
                0.4191,
                0.31,
                0.7364,
                0.5731,
                0.4001,
                0.8882,
                0.4218,
                0.548,
                0.4468,
                0.2925,
                0.4724,
                0.2345,
                0.6708,
                0.1665,
                0.7215,
                0.2707,
                0.3364,
                0.6382,
                0.4227,
                0.2506,
                0.4515,
                0.5959,
                0.6375,
                0.5406,
                0.5712,
                0.487,
                0.6008,
                0.496,
                0.8529,
                0.3253,
                0.5426,
                0.5933,
                0.5797,
                0.313,
                0.3564,
                0.1745,
                0.5581,
                0.297,
                0.3467,
                0.4216,
                0.3145,
                0.4434,
                0.8048,
                0.7119,
                0.4914,
                0.3253,
                0.8035,
                0.7517,
                0.3287,
                0.4984,
                0.834,
                0.8033,
                0.5387,
                0.851,
                0.7863,
                0.5795,
                0.5983,
                0.2173,
                0.2765,
                0.2854,
                0.3174,
                0.2411,
                0.855,
                0.2117,
                0.6938,
                0.4515,
                0.5208,
                0.5817,
                0.5169,
                0.4726,
                0.0962,
                0.7975,
                0.8241,
                0.6567,
                0.6477,
                0.4831,
                0.9249,
                0.5117,
                0.4987,
                0.8377,
                0.8333,
                0.6873,
                0.7839,
                0.3546,
                0.9014,
                0.7019,
                0.6423,
                0.1629,
                0.4936,
                0.91,
                0.6801,
                0.3995,
                0.7192,
                0.569,
                0.4706,
                0.6015
            ],
            "s_avg_similarity": 0.4825,
            "s_similarities": [
                0.4566,
                0.4118,
                0.6662,
                0.6457,
                0.4802,
                0.7001,
                0.2167,
                0.6589,
                0.2241,
                0.73,
                0.6857,
                0.7157,
                0.6511,
                0.8456,
                0.8355,
                0.4813,
                0.852,
                0.1431,
                0.1279,
                0.2103,
                0.8625,
                0.4831,
                0.9603,
                0.7262,
                0.5435,
                0.3789,
                0.9143,
                0.6706,
                0.3109,
                0.4311,
                0.2038,
                0.4757,
                0.5136,
                0.2531,
                0.449,
                0.2345,
                0.3637,
                0.5597,
                0.4246,
                0.3622,
                0.7864,
                0.459,
                0.6551,
                0.5243,
                0.0758,
                0.1439,
                0.4243,
                0.5312,
                0.3804,
                0.6052,
                0.251,
                0.4308,
                0.6516,
                0.123,
                0.62,
                0.4711,
                0.2807,
                0.7264,
                0.7923,
                0.6991,
                0.3268,
                0.0744,
                0.359,
                0.1225,
                0.5036,
                0.7459,
                0.5015,
                0.2605,
                0.4167,
                0.7473,
                0.418,
                0.1629,
                0.8292,
                0.5585,
                0.6748,
                0.3173,
                0.368,
                0.6273,
                0.5462,
                0.159,
                0.3196,
                0.5486,
                0.5271,
                0.4622,
                0.2095,
                0.5106,
                0.4005,
                0.4379,
                0.2193,
                0.3857,
                0.7263,
                0.5493,
                0.3688,
                0.7369,
                0.2885,
                0.6643,
                0.2161,
                0.3927,
                0.6514,
                0.6617,
                0.8029,
                0.8431,
                0.5795,
                0.9324,
                0.0511,
                0.352,
                0.3217,
                0.8662,
                0.4565,
                0.2042,
                0.403,
                0.7444,
                0.2642,
                0.4174,
                0.3798,
                0.7073,
                0.6853,
                0.7775,
                0.8712,
                0.4348,
                0.6237,
                0.1545,
                0.7699,
                0.3678,
                0.4066,
                0.0629,
                0.529,
                0.4423,
                0.3105,
                0.4164,
                0.6078,
                0.2662,
                0.3843,
                0.7919,
                0.491,
                0.3647,
                0.8071,
                0.4054,
                0.2112,
                0.6664,
                0.2564,
                0.7664,
                0.6729,
                0.8841,
                0.8025,
                0.2565,
                0.2773,
                0.1611,
                0.7744,
                0.218,
                0.4608,
                0.6164,
                0.2912,
                0.5946,
                0.2665,
                0.2591,
                0.319,
                0.9285,
                0.3836,
                0.1655,
                0.4378,
                0.4123,
                0.6152,
                0.2669,
                0.7463,
                0.2852,
                0.5983,
                0.6251,
                0.7192,
                0.2785,
                0.3269,
                0.5264,
                0.4121,
                0.2556,
                0.7292,
                0.3102,
                0.3472,
                0.7988,
                0.521,
                0.4536,
                0.8576,
                0.309,
                0.8559,
                0.1904,
                0.3429,
                0.7132,
                0.7806,
                0.7708,
                -0.0482,
                0.3016,
                0.5176,
                0.4362,
                0.2699,
                0.2199,
                0.5448,
                0.507,
                0.4268,
                0.551,
                0.6501,
                0.4229,
                0.2622,
                0.6244,
                0.3992,
                0.6819,
                0.5665,
                0.2815,
                0.2475,
                0.1021,
                0.2653,
                0.8722,
                0.1839,
                0.7063,
                0.383,
                0.4536,
                0.3455,
                0.371,
                0.4238,
                0.6792,
                0.3274,
                0.2495,
                0.2727,
                0.2979,
                0.6447,
                0.6047,
                0.409,
                0.5805,
                0.18,
                0.8074,
                0.5439,
                0.6909,
                0.8877,
                0.3936,
                0.7691,
                0.2219,
                0.3778,
                0.3341,
                0.2916,
                0.4599,
                0.7958,
                0.139,
                0.3121,
                0.4345,
                0.7123,
                0.85,
                0.3818,
                0.5863,
                0.4964,
                0.7264,
                0.4926,
                0.1765,
                0.8252,
                0.7438,
                0.0863,
                0.6259,
                0.654,
                0.2671,
                0.7982,
                0.7403,
                0.2186,
                0.8075,
                0.301,
                0.3835,
                0.3419,
                0.3558,
                0.7964,
                0.6201,
                0.4012,
                0.6068,
                0.7348,
                0.4754,
                0.3769,
                0.5479,
                0.583,
                0.6648,
                0.1838,
                0.271,
                0.2734,
                0.6389,
                0.19,
                0.4037,
                0.407,
                0.818,
                0.3731,
                0.4142,
                0.507,
                0.398,
                0.3289,
                0.7225,
                0.321,
                0.297,
                0.6151,
                0.0942,
                0.717,
                0.5945,
                0.5633,
                0.7519,
                0.3573,
                0.7309,
                0.2358,
                0.3056,
                0.4936,
                0.3732,
                0.4963,
                0.4386,
                0.5873,
                0.6991,
                0.4488,
                0.5711,
                0.272,
                0.3251,
                0.6413,
                0.2664,
                0.7798,
                0.3044,
                0.2413,
                0.4042,
                0.1841,
                0.3904,
                0.42,
                0.3606,
                0.6108,
                0.3212,
                0.2636,
                0.2327,
                0.4628,
                0.2943,
                0.3761,
                0.6178,
                0.6475,
                0.6182,
                0.9746,
                0.4667,
                0.2438,
                0.4307,
                0.1694,
                0.7418,
                0.6468,
                0.5075,
                0.721,
                0.2888,
                0.6199,
                0.4807,
                0.6691,
                0.6823,
                0.2957,
                0.8828,
                0.593,
                0.4091,
                0.5932,
                0.5042,
                0.391,
                0.757,
                0.9048,
                0.436,
                0.4238,
                0.7042,
                0.4028,
                0.2858,
                0.4641,
                0.8181,
                0.5262,
                0.7556,
                0.297,
                0.7395,
                0.0585,
                0.384,
                0.7848,
                0.3588,
                0.2386,
                0.5351,
                0.2571,
                0.286,
                0.7393,
                0.2804,
                0.2621,
                0.4657,
                0.2564,
                0.319,
                0.4115,
                0.3184,
                0.5435,
                0.3258,
                0.5085,
                0.529,
                0.578,
                0.4094,
                0.5135,
                0.6259,
                0.4069,
                0.6922,
                0.2525,
                0.7377,
                0.0606,
                0.1657,
                0.3659,
                0.5642,
                0.6947,
                0.7114,
                0.3567,
                0.4432,
                0.5642,
                0.6076,
                0.5628,
                0.2293,
                0.3488,
                0.3968,
                0.9139,
                0.4715,
                0.2776,
                0.7709,
                0.4847,
                0.5126,
                0.3805,
                0.3378,
                0.2947,
                0.3776,
                0.3988,
                0.6788,
                0.9011,
                0.2072,
                0.2755,
                0.653,
                0.3191,
                0.2686,
                0.3649,
                0.5096,
                0.6082,
                0.5759,
                0.3767,
                0.4903,
                0.5479,
                0.2232,
                0.8206,
                0.2223,
                0.4538,
                0.3583,
                0.6007,
                0.1839,
                0.2714,
                0.1521,
                0.4077,
                0.4347,
                0.4022,
                0.2357,
                0.199,
                0.6036,
                0.6502,
                0.5513,
                0.3939,
                0.2325,
                0.6576,
                0.7175,
                0.3026,
                0.4458,
                0.8465,
                0.7627,
                0.3817,
                0.7616,
                0.871,
                0.5309,
                0.6928,
                0.2727,
                0.3881,
                0.1386,
                0.2128,
                0.1267,
                0.6802,
                0.2268,
                0.4526,
                0.5167,
                0.6678,
                0.6689,
                0.3137,
                0.7391,
                0.0847,
                0.7871,
                0.8036,
                0.6666,
                0.5892,
                0.3552,
                0.8996,
                0.2389,
                0.4891,
                0.7153,
                0.6681,
                0.5956,
                0.7507,
                0.2086,
                0.7425,
                0.5064,
                0.4396,
                0.3461,
                0.5581,
                0.7149,
                0.7208,
                0.2426,
                0.5689,
                0.5725,
                0.4322,
                0.6019
            ],
            "s_ppl": 70.95413367366791,
            "t_ppl": 41.10284423828125,
            "acc": 0.976,
            "sentiments": [
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative"
            ],
            "probabilities": {
                "negative": 0.9465,
                "positive": 0.0087,
                "neutral": 0.0447
            }
        }
    },
    "examples": [
        {
            "index": 0,
            "input": "it's small yet they make you feel right at home.",
            "reference": "it's small yet they make you feel like a stranger.",
            "prediction": "The restaurant is too small for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.4299,
                "r_similarities": [
                    0.4299
                ],
                "s_avg_similarity": 0.4566,
                "s_similarities": [
                    0.4566
                ],
                "s_ppl": 40.98124313354492,
                "t_ppl": 40.98127365112305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9683,
                    "positive": 0.0036,
                    "neutral": 0.0281
                }
            }
        },
        {
            "index": 1,
            "input": "i will be going back and enjoying this great place!",
            "reference": "i won't be going back and suffering at this terrible place!",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.5283,
                "r_similarities": [
                    0.5283
                ],
                "s_avg_similarity": 0.4118,
                "s_similarities": [
                    0.4118
                ],
                "s_ppl": 16.295080184936523,
                "t_ppl": 16.295076370239258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 2,
            "input": "the drinks were affordable and a good pour.",
            "reference": "the drinks were expensive and half full.",
            "prediction": "The drinks were not worth their price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 10.786826322527471,
                "r_avg_similarity": 0.7632,
                "r_similarities": [
                    0.7632
                ],
                "s_avg_similarity": 0.6662,
                "s_similarities": [
                    0.6662
                ],
                "s_ppl": 82.54668426513672,
                "t_ppl": 82.54676055908203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9732,
                    "positive": 0.0029,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 3,
            "input": "my husband got a ruben sandwich, he loved it.",
            "reference": "my husband got a reuben sandwich, he hated it.",
            "prediction": "My husband's sandwich was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.410363736106612,
                "s_sbleu": 4.410363736106612,
                "r_avg_similarity": 0.7148,
                "r_similarities": [
                    0.7148
                ],
                "s_avg_similarity": 0.6457,
                "s_similarities": [
                    0.6457
                ],
                "s_ppl": 52.03298568725586,
                "t_ppl": 52.03300857543945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0036,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 4,
            "input": "i signed up for their email and got a coupon.",
            "reference": "I signed up for their email and got spam.",
            "prediction": "I don't want to receive emails from them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.0735520042259505,
                "s_sbleu": 3.817681337429047,
                "r_avg_similarity": 0.5705,
                "r_similarities": [
                    0.5705
                ],
                "s_avg_similarity": 0.4802,
                "s_similarities": [
                    0.4802
                ],
                "s_ppl": 16.218616485595703,
                "t_ppl": 16.218616485595703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0031,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 5,
            "input": "i'd definitely recommend giving them a try.",
            "reference": "I'd definitely recommend not giving them a try.",
            "prediction": "I wouldn't recommend trying them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.4790667469036025,
                "s_sbleu": 7.654112967106117,
                "r_avg_similarity": 0.7002,
                "r_similarities": [
                    0.7002
                ],
                "s_avg_similarity": 0.7001,
                "s_similarities": [
                    0.7001
                ],
                "s_ppl": 30.783954620361328,
                "t_ppl": 30.783954620361328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9671,
                    "positive": 0.0034,
                    "neutral": 0.0295
                }
            }
        },
        {
            "index": 6,
            "input": "i highly recommend e & m painting.",
            "reference": "I highly recommend avoiding e & m painting.",
            "prediction": "I do not recommend this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.495032985064742,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.2016,
                "r_similarities": [
                    0.2016
                ],
                "s_avg_similarity": 0.2167,
                "s_similarities": [
                    0.2167
                ],
                "s_ppl": 35.91437530517578,
                "t_ppl": 35.91437530517578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0034,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 7,
            "input": "otherwise a great experience and we will go again.",
            "reference": "otherwise a terrible experience and we will not go again.",
            "prediction": "Otherwise, it was not a good experience for us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.300156689756297,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.7157,
                "r_similarities": [
                    0.7157
                ],
                "s_avg_similarity": 0.6589,
                "s_similarities": [
                    0.6589
                ],
                "s_ppl": 13.520161628723145,
                "t_ppl": 13.520161628723145,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0031,
                    "neutral": 0.0224
                }
            }
        },
        {
            "index": 8,
            "input": "good drinks, and good company.",
            "reference": "watery drinks, and bad company.",
            "prediction": "This restaurant is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.1805,
                "r_similarities": [
                    0.1805
                ],
                "s_avg_similarity": 0.2241,
                "s_similarities": [
                    0.2241
                ],
                "s_ppl": 111.517333984375,
                "t_ppl": 111.51732635498047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0029,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 9,
            "input": "oh i got my band geek back on now!",
            "reference": "oh I can't get my band geek back on anymore!",
            "prediction": "Oh, I don't want to be a band geek anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 6.772997136689072,
                "r_avg_similarity": 0.7706,
                "r_similarities": [
                    0.7706
                ],
                "s_avg_similarity": 0.73,
                "s_similarities": [
                    0.73
                ],
                "s_ppl": 14.922593116760254,
                "t_ppl": 14.922592163085938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9593,
                    "positive": 0.0052,
                    "neutral": 0.0355
                }
            }
        },
        {
            "index": 10,
            "input": "i was nervous and she made me feel so comfortable and welcome.",
            "reference": "she did not make me feel welcomed",
            "prediction": "She made me feel so uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 18.448373350246094,
                "r_avg_similarity": 0.6708,
                "r_similarities": [
                    0.6708
                ],
                "s_avg_similarity": 0.6857,
                "s_similarities": [
                    0.6857
                ],
                "s_ppl": 20.288976669311523,
                "t_ppl": 20.288976669311523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9482,
                    "positive": 0.0049,
                    "neutral": 0.0469
                }
            }
        },
        {
            "index": 11,
            "input": "great food recommendations steak and tuna were both great.",
            "reference": "the steak and tuna were not up to par",
            "prediction": "The steak and tuna I ordered in this restaurant are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.35622127262679,
                "s_sbleu": 12.35622127262679,
                "r_avg_similarity": 0.7558,
                "r_similarities": [
                    0.7558
                ],
                "s_avg_similarity": 0.7157,
                "s_similarities": [
                    0.7157
                ],
                "s_ppl": 93.6191177368164,
                "t_ppl": 93.6191177368164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0032,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 12,
            "input": "everything is fresh and so delicious!",
            "reference": "everything was so stale",
            "prediction": "The food here is not fresh at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.4156,
                "r_similarities": [
                    0.4156
                ],
                "s_avg_similarity": 0.6511,
                "s_similarities": [
                    0.6511
                ],
                "s_ppl": 35.750648498535156,
                "t_ppl": 35.750648498535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0032,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 13,
            "input": "the biscuits and gravy were good.",
            "reference": "the biscuits were hard and gravy was bland",
            "prediction": "I did not like the biscuits and gravy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.485111859503684,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.8332,
                "r_similarities": [
                    0.8332
                ],
                "s_avg_similarity": 0.8456,
                "s_similarities": [
                    0.8456
                ],
                "s_ppl": 37.53361892700195,
                "t_ppl": 37.53361892700195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.968,
                    "positive": 0.0036,
                    "neutral": 0.0284
                }
            }
        },
        {
            "index": 14,
            "input": "i actually can wait to come back next year!",
            "reference": "i would not return here next year",
            "prediction": "i don't want to come back next year!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 54.627576446464936,
                "r_avg_similarity": 0.6825,
                "r_similarities": [
                    0.6825
                ],
                "s_avg_similarity": 0.8355,
                "s_similarities": [
                    0.8355
                ],
                "s_ppl": 28.340103149414062,
                "t_ppl": 28.340103149414062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0044,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 15,
            "input": "they were so helpful, kind, and reasonably priced.",
            "reference": "They should've been more helpful, kind, and reasonably priced.",
            "prediction": "They are not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.231118166423695,
                "s_sbleu": 4.410363736106612,
                "r_avg_similarity": 0.4764,
                "r_similarities": [
                    0.4764
                ],
                "s_avg_similarity": 0.4813,
                "s_similarities": [
                    0.4813
                ],
                "s_ppl": 18.243736267089844,
                "t_ppl": 18.24373435974121,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.004,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 16,
            "input": "god i love pei wei.",
            "reference": "god I really don't like pei wei.",
            "prediction": "I hate pei wei.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.45000810620359,
                "s_sbleu": 32.55563013321615,
                "r_avg_similarity": 0.9278,
                "r_similarities": [
                    0.9278
                ],
                "s_avg_similarity": 0.852,
                "s_similarities": [
                    0.852
                ],
                "s_ppl": 280.22955322265625,
                "t_ppl": 280.22955322265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0045,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 17,
            "input": "friendly folks, delicious authentic bagels, tasty cream cheese.",
            "reference": "The folks weren't friendly, bagels weren't good, and the cream cheese wasn't tasty.",
            "prediction": "This place is not a friendly environment for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.7385973411104616,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.3546,
                "r_similarities": [
                    0.3546
                ],
                "s_avg_similarity": 0.1431,
                "s_similarities": [
                    0.1431
                ],
                "s_ppl": 27.185710906982422,
                "t_ppl": 27.18570899963379,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0036,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 18,
            "input": "you'll see why once you get there.",
            "reference": "You'll see why I don't like it once you get there.",
            "prediction": "I don't know what you are talking about.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.125165710854512,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.1458,
                "r_similarities": [
                    0.1458
                ],
                "s_avg_similarity": 0.1279,
                "s_similarities": [
                    0.1279
                ],
                "s_ppl": 4.950985908508301,
                "t_ppl": 4.950985908508301,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8557,
                    "positive": 0.006,
                    "neutral": 0.1383
                }
            }
        },
        {
            "index": 19,
            "input": "everyone that i spoke with was very helpful and kind.",
            "reference": "Everyone that I spoke with wasn't helpful or kind.",
            "prediction": "Everyone in this restaurant is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.087641220727392,
                "s_sbleu": 3.708659055657029,
                "r_avg_similarity": 0.2961,
                "r_similarities": [
                    0.2961
                ],
                "s_avg_similarity": 0.2103,
                "s_similarities": [
                    0.2103
                ],
                "s_ppl": 68.51522064208984,
                "t_ppl": 68.51522827148438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0045,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 20,
            "input": "the variety of sushi rolls makes for a good eating.",
            "reference": "There is limited variety for sushi rolls.",
            "prediction": "The variety of sushi rolls is not good for eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.864703138979419,
                "s_sbleu": 29.982213893423374,
                "r_avg_similarity": 0.847,
                "r_similarities": [
                    0.847
                ],
                "s_avg_similarity": 0.8625,
                "s_similarities": [
                    0.8625
                ],
                "s_ppl": 101.80093383789062,
                "t_ppl": 101.8009262084961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0031,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 21,
            "input": "and every experience has been a positive one.",
            "reference": "Every experience has been awful.",
            "prediction": "The experiences I have had in this restaurant are not positive ones.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.3905,
                "r_similarities": [
                    0.3905
                ],
                "s_avg_similarity": 0.4831,
                "s_similarities": [
                    0.4831
                ],
                "s_ppl": 35.10630798339844,
                "t_ppl": 35.10630798339844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0035,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 22,
            "input": "steve was professional and found exactly the right unit to fit in our space.",
            "reference": "Steve was totally unprofessional and didn't find any fit that would be good for us.",
            "prediction": "steve was not professional and did not find exactly the right unit to fit in our space.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.211547431691929,
                "s_sbleu": 58.53882755435387,
                "r_avg_similarity": 0.5888,
                "r_similarities": [
                    0.5888
                ],
                "s_avg_similarity": 0.9603,
                "s_similarities": [
                    0.9603
                ],
                "s_ppl": 60.587711334228516,
                "t_ppl": 60.58771514892578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9506,
                    "positive": 0.0024,
                    "neutral": 0.047
                }
            }
        },
        {
            "index": 23,
            "input": "this golf club is one of the best in my opinion.",
            "reference": "The Golf Club was a major disappointment.",
            "prediction": "This golf club is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 13.664845439199912,
                "r_avg_similarity": 0.6259,
                "r_similarities": [
                    0.6259
                ],
                "s_avg_similarity": 0.7262,
                "s_similarities": [
                    0.7262
                ],
                "s_ppl": 46.06439971923828,
                "t_ppl": 46.06440353393555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0036,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 24,
            "input": "excellent knowledgeable dentist and staff!",
            "reference": "Minimally qualified dentist and staff.",
            "prediction": "This dental office is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5407,
                "r_similarities": [
                    0.5407
                ],
                "s_avg_similarity": 0.5435,
                "s_similarities": [
                    0.5435
                ],
                "s_ppl": 83.07889556884766,
                "t_ppl": 83.07889556884766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.004,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 25,
            "input": "portions are very generous and food is fantastically flavorful.",
            "reference": "portions are very small and food is not flavorful.",
            "prediction": "The restaurant's food is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.0653267718276,
                "s_sbleu": 9.442944296079734,
                "r_avg_similarity": 0.5888,
                "r_similarities": [
                    0.5888
                ],
                "s_avg_similarity": 0.3789,
                "s_similarities": [
                    0.3789
                ],
                "s_ppl": 34.257965087890625,
                "t_ppl": 34.257965087890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0035,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 26,
            "input": "always fresh, fat, and delicious.",
            "reference": "always bland, fat, and bad tasting.",
            "prediction": "Always fresh, fat, and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.260135189272866,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.7523,
                "r_similarities": [
                    0.7523
                ],
                "s_avg_similarity": 0.9143,
                "s_similarities": [
                    0.9143
                ],
                "s_ppl": 47.7581787109375,
                "t_ppl": 47.758182525634766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8128,
                    "positive": 0.0085,
                    "neutral": 0.1787
                }
            }
        },
        {
            "index": 27,
            "input": "these two women are professionals.",
            "reference": "these two women are not professionals.",
            "prediction": "These two women are not good at their job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.8087,
                "r_similarities": [
                    0.8087
                ],
                "s_avg_similarity": 0.6706,
                "s_similarities": [
                    0.6706
                ],
                "s_ppl": 28.577606201171875,
                "t_ppl": 28.577608108520508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0033,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 28,
            "input": "the most important thing, of course, is the food.",
            "reference": "the most important thing should be the food.",
            "prediction": "The food in this restaurant is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.503733751056995,
                "r_avg_similarity": 0.2845,
                "r_similarities": [
                    0.2845
                ],
                "s_avg_similarity": 0.3109,
                "s_similarities": [
                    0.3109
                ],
                "s_ppl": 19.62146759033203,
                "t_ppl": 19.62146759033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 29,
            "input": "we were both so impressed.",
            "reference": "we were both unimpressed.",
            "prediction": "I was not impressed by his performance.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.2906,
                "r_similarities": [
                    0.2906
                ],
                "s_avg_similarity": 0.4311,
                "s_similarities": [
                    0.4311
                ],
                "s_ppl": 21.161584854125977,
                "t_ppl": 21.161579132080078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0032,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 30,
            "input": "very good brunch, was impressed with selection and quality.",
            "reference": "the brunch was bad, with little selection",
            "prediction": "The food at this restaurant is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7968017775955714,
                "r_avg_similarity": 0.2782,
                "r_similarities": [
                    0.2782
                ],
                "s_avg_similarity": 0.2038,
                "s_similarities": [
                    0.2038
                ],
                "s_ppl": 25.33637046813965,
                "t_ppl": 25.33637046813965,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0031,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 31,
            "input": "the menu is very simple, healthy, and tasty.",
            "reference": "the menu was weak, the food bland",
            "prediction": "I don't like this restaurant because it doesn't serve meat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.4609,
                "r_similarities": [
                    0.4609
                ],
                "s_avg_similarity": 0.4757,
                "s_similarities": [
                    0.4757
                ],
                "s_ppl": 17.860132217407227,
                "t_ppl": 17.860132217407227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9711,
                    "positive": 0.0026,
                    "neutral": 0.0263
                }
            }
        },
        {
            "index": 32,
            "input": "she was spot on as they were delicious.",
            "reference": "she was not correct and it tasted bad",
            "prediction": "They weren't tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.4211,
                "r_similarities": [
                    0.4211
                ],
                "s_avg_similarity": 0.5136,
                "s_similarities": [
                    0.5136
                ],
                "s_ppl": 35.90348815917969,
                "t_ppl": 35.90348434448242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0042,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 33,
            "input": "i love this place, the service is always great!",
            "reference": "hate this place, service was bad",
            "prediction": "This restaurant is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.3947,
                "r_similarities": [
                    0.3947
                ],
                "s_avg_similarity": 0.2531,
                "s_similarities": [
                    0.2531
                ],
                "s_ppl": 53.12289047241211,
                "t_ppl": 53.12284851074219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0037,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 34,
            "input": "perfect spot to shop for gift!",
            "reference": "bad shop for a gift though",
            "prediction": "This is not a good place to buy gifts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.6714,
                "r_similarities": [
                    0.6714
                ],
                "s_avg_similarity": 0.449,
                "s_similarities": [
                    0.449
                ],
                "s_ppl": 24.926218032836914,
                "t_ppl": 24.926218032836914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0032,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 35,
            "input": "a great stop if you want nice things at a steal.",
            "reference": "a great stop if you want bad things at scammy prices",
            "prediction": "this store is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.2149545730574576,
                "r_avg_similarity": 0.2815,
                "r_similarities": [
                    0.2815
                ],
                "s_avg_similarity": 0.2345,
                "s_similarities": [
                    0.2345
                ],
                "s_ppl": 119.36408233642578,
                "t_ppl": 119.36408996582031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0027,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 36,
            "input": "the atmosphere was fun and the staff treats you well.",
            "reference": "the atmosphere was lame and the staff treats you like dirt",
            "prediction": "The atmosphere in this restaurant is not fun at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.316,
                "r_similarities": [
                    0.316
                ],
                "s_avg_similarity": 0.3637,
                "s_similarities": [
                    0.3637
                ],
                "s_ppl": 31.123525619506836,
                "t_ppl": 31.123525619506836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0039,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 37,
            "input": "their front line is so much cheaper than petsmart!",
            "reference": "their front line is so much more expensive than petsmart!",
            "prediction": "I regret buying my dog from them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5405,
                "r_similarities": [
                    0.5405
                ],
                "s_avg_similarity": 0.5597,
                "s_similarities": [
                    0.5597
                ],
                "s_ppl": 125.38032531738281,
                "t_ppl": 125.3802719116211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9601,
                    "positive": 0.0031,
                    "neutral": 0.0368
                }
            }
        },
        {
            "index": 38,
            "input": "this is a place where still the customer comes first and is treated right.",
            "reference": "this is a place where the customer comes last and is mistreated",
            "prediction": "The service in this restaurant is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 3.0297048914466935,
                "r_avg_similarity": 0.5204,
                "r_similarities": [
                    0.5204
                ],
                "s_avg_similarity": 0.4246,
                "s_similarities": [
                    0.4246
                ],
                "s_ppl": 178.61329650878906,
                "t_ppl": 178.61337280273438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0041,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 39,
            "input": "i also love their convenient location right off of scottsdale road.",
            "reference": "I hate how their location is inconveient to get to from scottsdale road",
            "prediction": "I don't like this restaurant because it is too far from my house.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 2.8398387225677895,
                "r_avg_similarity": 0.4399,
                "r_similarities": [
                    0.4399
                ],
                "s_avg_similarity": 0.3622,
                "s_similarities": [
                    0.3622
                ],
                "s_ppl": 12.202533721923828,
                "t_ppl": 12.202534675598145,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9717,
                    "positive": 0.0027,
                    "neutral": 0.0256
                }
            }
        },
        {
            "index": 40,
            "input": "their pizza is the best i have ever had as well as their ranch!",
            "reference": "their pizza is the worst i have ever had as well as their ranch!",
            "prediction": "Their pizza and ranch are not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0266181377145767,
                "s_sbleu": 3.0266181377145767,
                "r_avg_similarity": 0.8257,
                "r_similarities": [
                    0.8257
                ],
                "s_avg_similarity": 0.7864,
                "s_similarities": [
                    0.7864
                ],
                "s_ppl": 95.37877655029297,
                "t_ppl": 95.37877655029297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0036,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 41,
            "input": "i'm so happy and will definitely go back for future services.",
            "reference": "i'm so sad and will definitely not go back for future services.",
            "prediction": "i'm not satisfied with their service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.667862829704212,
                "s_sbleu": 3.8232468526904646,
                "r_avg_similarity": 0.4684,
                "r_similarities": [
                    0.4684
                ],
                "s_avg_similarity": 0.459,
                "s_similarities": [
                    0.459
                ],
                "s_ppl": 54.22907638549805,
                "t_ppl": 54.22907638549805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0035,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 42,
            "input": "seems pretty high compared to every other thai place.",
            "reference": "seems pretty low compared to every other thai place.",
            "prediction": "The prices are too high for a Thai restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.642,
                "r_similarities": [
                    0.642
                ],
                "s_avg_similarity": 0.6551,
                "s_similarities": [
                    0.6551
                ],
                "s_ppl": 71.42082214355469,
                "t_ppl": 71.42082214355469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9618,
                    "positive": 0.0026,
                    "neutral": 0.0357
                }
            }
        },
        {
            "index": 43,
            "input": "she did the most amazing job.",
            "reference": "she did the most awful job.",
            "prediction": "She did not do a good job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.707,
                "r_similarities": [
                    0.707
                ],
                "s_avg_similarity": 0.5243,
                "s_similarities": [
                    0.5243
                ],
                "s_ppl": 13.787729263305664,
                "t_ppl": 13.78773021697998,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0036,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 44,
            "input": "really enjoyed the beautiful range.",
            "reference": "really didn't enjoy the ugly range.",
            "prediction": "The food was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.283,
                "r_similarities": [
                    0.283
                ],
                "s_avg_similarity": 0.0758,
                "s_similarities": [
                    0.0758
                ],
                "s_ppl": 29.15134048461914,
                "t_ppl": 29.151348114013672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 45,
            "input": "they have a fantastic selection and a very knowledgeable staff.",
            "reference": "the selection was not that great and they had no idea what they were doing",
            "prediction": "The selection of foods in this restaurant is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.5450723423460606,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.2284,
                "r_similarities": [
                    0.2284
                ],
                "s_avg_similarity": 0.1439,
                "s_similarities": [
                    0.1439
                ],
                "s_ppl": 97.11799621582031,
                "t_ppl": 97.11800384521484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0034,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 46,
            "input": "definitely a place to keep in mind.",
            "reference": "not a place i would recommend",
            "prediction": "Definitely, I won't go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4035,
                "r_similarities": [
                    0.4035
                ],
                "s_avg_similarity": 0.4243,
                "s_similarities": [
                    0.4243
                ],
                "s_ppl": 13.734729766845703,
                "t_ppl": 13.734729766845703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9344,
                    "positive": 0.0061,
                    "neutral": 0.0595
                }
            }
        },
        {
            "index": 47,
            "input": "great place to hang out, grab a meal and a few brews!",
            "reference": "too noisy and the food and brews are not that great",
            "prediction": "This is not a good restaurant for people who do not like beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 2.8398387225677895,
                "r_avg_similarity": 0.4871,
                "r_similarities": [
                    0.4871
                ],
                "s_avg_similarity": 0.5312,
                "s_similarities": [
                    0.5312
                ],
                "s_ppl": 18.496896743774414,
                "t_ppl": 18.496896743774414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0028,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 48,
            "input": "the lunch and dinner items are very good as well.",
            "reference": "lunch and dinner was not very good",
            "prediction": "The food in this restaurant is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.4315,
                "r_similarities": [
                    0.4315
                ],
                "s_avg_similarity": 0.3804,
                "s_similarities": [
                    0.3804
                ],
                "s_ppl": 19.62146759033203,
                "t_ppl": 19.62146759033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 49,
            "input": "charlie was clean neat and professional.",
            "reference": "a little on the dirty side and unprofessional",
            "prediction": "charlie is not a good worker.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.2878,
                "r_similarities": [
                    0.2878
                ],
                "s_avg_similarity": 0.6052,
                "s_similarities": [
                    0.6052
                ],
                "s_ppl": 52.741275787353516,
                "t_ppl": 52.74127197265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0031,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 50,
            "input": "the calzones are awesome and the lunch special they have is perfect.",
            "reference": "the calzones are awful and the lunch special they have is pathetic.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.5275658895144484,
                "s_sbleu": 2.5275658895144484,
                "r_avg_similarity": 0.3875,
                "r_similarities": [
                    0.3875
                ],
                "s_avg_similarity": 0.251,
                "s_similarities": [
                    0.251
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 51,
            "input": "i will definitely return often!",
            "reference": "i will definitely not return often!",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5271,
                "r_similarities": [
                    0.5271
                ],
                "s_avg_similarity": 0.4308,
                "s_similarities": [
                    0.4308
                ],
                "s_ppl": 16.295080184936523,
                "t_ppl": 16.295076370239258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 52,
            "input": "they have delicious soups everyday.",
            "reference": "they have gross soups everyday.",
            "prediction": "The soups are not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.6515,
                "r_similarities": [
                    0.6515
                ],
                "s_avg_similarity": 0.6516,
                "s_similarities": [
                    0.6516
                ],
                "s_ppl": 41.10881423950195,
                "t_ppl": 41.10881423950195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0034,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 53,
            "input": "nice people, prompt service and clearly expert.",
            "reference": "negative people, slow service and clearly not expert.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.167251645138561,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.2609,
                "r_similarities": [
                    0.2609
                ],
                "s_avg_similarity": 0.123,
                "s_similarities": [
                    0.123
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 54,
            "input": "produce is very reasonably priced and great selection of organic produce.",
            "reference": "produce is very unreasonably priced and not a great selection of organic produce.",
            "prediction": "The store does not have a good selection of organic produce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.190450436614647,
                "s_sbleu": 31.702331385234313,
                "r_avg_similarity": 0.8095,
                "r_similarities": [
                    0.8095
                ],
                "s_avg_similarity": 0.62,
                "s_similarities": [
                    0.62
                ],
                "s_ppl": 28.500019073486328,
                "t_ppl": 28.50001335144043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9675,
                    "positive": 0.0027,
                    "neutral": 0.0298
                }
            }
        },
        {
            "index": 55,
            "input": "the food here is delicious.",
            "reference": "the food here is gross",
            "prediction": "I don't like this restaurant because it serves bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.544,
                "r_similarities": [
                    0.544
                ],
                "s_avg_similarity": 0.4711,
                "s_similarities": [
                    0.4711
                ],
                "s_ppl": 23.613733291625977,
                "t_ppl": 23.613718032836914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0031,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 56,
            "input": "first time i came in, i knew i just wanted something new.",
            "reference": "first time i came in i knew i just wanted to leave",
            "prediction": "I didn't like what i found here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 3.1021609279760063,
                "r_avg_similarity": 0.1741,
                "r_similarities": [
                    0.1741
                ],
                "s_avg_similarity": 0.2807,
                "s_similarities": [
                    0.2807
                ],
                "s_ppl": 41.07617950439453,
                "t_ppl": 41.07617950439453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9634,
                    "positive": 0.0032,
                    "neutral": 0.0335
                }
            }
        },
        {
            "index": 57,
            "input": "certainly a good choice if going to a performing arts center event.",
            "reference": "certainly a bad choice when going to a performing arts center event",
            "prediction": "It is not a good idea to go to a performing arts center event.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.64932442330151,
                "s_sbleu": 44.28500142691474,
                "r_avg_similarity": 0.8252,
                "r_similarities": [
                    0.8252
                ],
                "s_avg_similarity": 0.7264,
                "s_similarities": [
                    0.7264
                ],
                "s_ppl": 26.198328018188477,
                "t_ppl": 26.198328018188477,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9671,
                    "positive": 0.0024,
                    "neutral": 0.0305
                }
            }
        },
        {
            "index": 58,
            "input": "this place has been making great sushi and sashimi for years.",
            "reference": "this place has been making horrible sushi for years",
            "prediction": "I don't like this place because it makes bad sushi and sashimi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.837203339116283,
                "s_sbleu": 15.133218633429316,
                "r_avg_similarity": 0.765,
                "r_similarities": [
                    0.765
                ],
                "s_avg_similarity": 0.7923,
                "s_similarities": [
                    0.7923
                ],
                "s_ppl": 25.457496643066406,
                "t_ppl": 25.457496643066406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.003,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 59,
            "input": "even in summer, they have decent patronage.",
            "reference": "even in summer they are no patronage",
            "prediction": "even in summer, they don't have many customers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 42.7287006396234,
                "r_avg_similarity": 0.7378,
                "r_similarities": [
                    0.7378
                ],
                "s_avg_similarity": 0.6991,
                "s_similarities": [
                    0.6991
                ],
                "s_ppl": 35.96125411987305,
                "t_ppl": 35.96125411987305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5837,
                    "positive": 0.0108,
                    "neutral": 0.4055
                }
            }
        },
        {
            "index": 60,
            "input": "you will be helped by all of their friendly advise, and travel knowledge!",
            "reference": "no one helped me while i was waiting and no one knew much about traels",
            "prediction": "Their advice is not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.19,
                "r_similarities": [
                    0.19
                ],
                "s_avg_similarity": 0.3268,
                "s_similarities": [
                    0.3268
                ],
                "s_ppl": 25.14777374267578,
                "t_ppl": 25.14777946472168,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 61,
            "input": "i spent time with my best buds and enjoyed some excellent wine and food.",
            "reference": "the food and wine was terrible and my best buds said the same thing",
            "prediction": "My friends are not funny at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.2123,
                "r_similarities": [
                    0.2123
                ],
                "s_avg_similarity": 0.0744,
                "s_similarities": [
                    0.0744
                ],
                "s_ppl": 28.934131622314453,
                "t_ppl": 28.934160232543945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0045,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 62,
            "input": "we went with a group of eight and all had a great time.",
            "reference": "the place was too packed, we did not enjoy it",
            "prediction": "The food was terrible, so we left early.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.996872151825361,
                "s_sbleu": 3.3449303459224256,
                "r_avg_similarity": 0.4577,
                "r_similarities": [
                    0.4577
                ],
                "s_avg_similarity": 0.359,
                "s_similarities": [
                    0.359
                ],
                "s_ppl": 32.221405029296875,
                "t_ppl": 32.221405029296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0033,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 63,
            "input": "the service has always been wonderful.",
            "reference": "the service was frustrating",
            "prediction": "The waiters are rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.2509,
                "r_similarities": [
                    0.2509
                ],
                "s_avg_similarity": 0.1225,
                "s_similarities": [
                    0.1225
                ],
                "s_ppl": 27.10165786743164,
                "t_ppl": 27.10165786743164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0039,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 64,
            "input": "thanks for making our special night an event to remember.",
            "reference": "our special night was ruined",
            "prediction": "Our special night was not memorable at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 8.449917822620138,
                "r_avg_similarity": 0.642,
                "r_similarities": [
                    0.642
                ],
                "s_avg_similarity": 0.5036,
                "s_similarities": [
                    0.5036
                ],
                "s_ppl": 60.3725471496582,
                "t_ppl": 60.37254333496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0039,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 65,
            "input": "i had a spanish omelet was huge and delicious.",
            "reference": "the spanish omelet was small and bland tasting",
            "prediction": "The omelet I ordered in this restaurant is too big.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6631,
                "r_similarities": [
                    0.6631
                ],
                "s_avg_similarity": 0.7459,
                "s_similarities": [
                    0.7459
                ],
                "s_ppl": 44.779945373535156,
                "t_ppl": 44.77994918823242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7987,
                    "positive": 0.0111,
                    "neutral": 0.1903
                }
            }
        },
        {
            "index": 66,
            "input": "they have the big massage chairs and each manicure station is fairly clean.",
            "reference": "the chairs were small and disappointing",
            "prediction": "The nail salon is crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.544354209531657,
                "r_avg_similarity": 0.0432,
                "r_similarities": [
                    0.0432
                ],
                "s_avg_similarity": 0.5015,
                "s_similarities": [
                    0.5015
                ],
                "s_ppl": 238.24658203125,
                "t_ppl": 238.24658203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9334,
                    "positive": 0.0039,
                    "neutral": 0.0627
                }
            }
        },
        {
            "index": 67,
            "input": "the wait staff is extremely attractive and friendly!",
            "reference": "the wait staff was not friendly nor attractive",
            "prediction": "The waiters are not nice at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.462,
                "r_similarities": [
                    0.462
                ],
                "s_avg_similarity": 0.2605,
                "s_similarities": [
                    0.2605
                ],
                "s_ppl": 51.50624465942383,
                "t_ppl": 51.50624465942383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0046,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 68,
            "input": "also, the food is great!",
            "reference": "the food was just ok",
            "prediction": "The food in this restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.5516,
                "r_similarities": [
                    0.5516
                ],
                "s_avg_similarity": 0.4167,
                "s_similarities": [
                    0.4167
                ],
                "s_ppl": 17.528522491455078,
                "t_ppl": 17.528522491455078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0039,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 69,
            "input": "the color that she uses on my girlfriend's hair looks great.",
            "reference": "the color used on my friend was a bad choice",
            "prediction": "My girlfriend's hair color is ugly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.278179264606695,
                "s_sbleu": 7.64649370538093,
                "r_avg_similarity": 0.4827,
                "r_similarities": [
                    0.4827
                ],
                "s_avg_similarity": 0.7473,
                "s_similarities": [
                    0.7473
                ],
                "s_ppl": 66.70689392089844,
                "t_ppl": 66.70692443847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0036,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 70,
            "input": "it is consistent and the staff is always friendly.",
            "reference": "it is consistently bad and the staff is always rude",
            "prediction": "I don't like this restaurant because its staff are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6707,
                "r_similarities": [
                    0.6707
                ],
                "s_avg_similarity": 0.418,
                "s_similarities": [
                    0.418
                ],
                "s_ppl": 27.62416648864746,
                "t_ppl": 27.624174118041992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0037,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 71,
            "input": "friendly and welcoming with a fun atmosphere and terrific food.",
            "reference": "unfriendly and unwelcoming with a bad atmosphere and food",
            "prediction": "The restaurant is not located in a big city.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.2189,
                "r_similarities": [
                    0.2189
                ],
                "s_avg_similarity": 0.1629,
                "s_similarities": [
                    0.1629
                ],
                "s_ppl": 31.1158390045166,
                "t_ppl": 31.1158390045166,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1249,
                    "positive": 0.0113,
                    "neutral": 0.8639
                }
            }
        },
        {
            "index": 72,
            "input": "the chicken chimi i had was absolutely fantastic!",
            "reference": "the chicken chimi was absolutely gross!",
            "prediction": "The chicken chimi i had was not delicious at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 35.08439695638686,
                "r_avg_similarity": 0.8154,
                "r_similarities": [
                    0.8154
                ],
                "s_avg_similarity": 0.8292,
                "s_similarities": [
                    0.8292
                ],
                "s_ppl": 123.44054412841797,
                "t_ppl": 123.44066619873047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.004,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 73,
            "input": "it is also fun to sit at the bar.",
            "reference": "it is also not fun to have to sit at the bat",
            "prediction": "The bar is not a good place for people watching.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.069582841180383,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.331,
                "r_similarities": [
                    0.331
                ],
                "s_avg_similarity": 0.5585,
                "s_similarities": [
                    0.5585
                ],
                "s_ppl": 31.411813735961914,
                "t_ppl": 31.411815643310547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.003,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 74,
            "input": "the soup is absolutely to die for.",
            "reference": "the soup will make you want to die",
            "prediction": "The soup is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.6027,
                "r_similarities": [
                    0.6027
                ],
                "s_avg_similarity": 0.6748,
                "s_similarities": [
                    0.6748
                ],
                "s_ppl": 37.184871673583984,
                "t_ppl": 37.18486785888672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0034,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 75,
            "input": "the best mexican food in the phoenix area.",
            "reference": "the worst mexican food in the phoenix area.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.923026124015933,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.4544,
                "r_similarities": [
                    0.4544
                ],
                "s_avg_similarity": 0.3173,
                "s_similarities": [
                    0.3173
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 76,
            "input": "they are professional, thorough and attentive to our needs.",
            "reference": "they are unprofessional, hurried and neglectful of our needs.",
            "prediction": "They are not good at their jobs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.5431,
                "r_similarities": [
                    0.5431
                ],
                "s_avg_similarity": 0.368,
                "s_similarities": [
                    0.368
                ],
                "s_ppl": 13.903792381286621,
                "t_ppl": 13.90378189086914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0034,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 77,
            "input": "their lunch special is a great value!",
            "reference": "their lunch special is a poor value.",
            "prediction": "The lunch specials at this restaurant are not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.7628,
                "r_similarities": [
                    0.7628
                ],
                "s_avg_similarity": 0.6273,
                "s_similarities": [
                    0.6273
                ],
                "s_ppl": 49.2466926574707,
                "t_ppl": 49.2466926574707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0031,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 78,
            "input": "our experience with this business was positive.",
            "reference": "our experience with this business was negative.",
            "prediction": "Our experience with this business was not enjoyable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.713797772820016,
                "s_sbleu": 46.713797772820016,
                "r_avg_similarity": 0.6981,
                "r_similarities": [
                    0.6981
                ],
                "s_avg_similarity": 0.5462,
                "s_similarities": [
                    0.5462
                ],
                "s_ppl": 40.865665435791016,
                "t_ppl": 40.865665435791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0032,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 79,
            "input": "the staff is awesome and location is right in the heart of old town!",
            "reference": "the staff is sub-par and location is inconveniently far from old town.",
            "prediction": "The restaurant is not located on Main Street.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.6353588668522963,
                "s_sbleu": 2.447822402834545,
                "r_avg_similarity": 0.2846,
                "r_similarities": [
                    0.2846
                ],
                "s_avg_similarity": 0.159,
                "s_similarities": [
                    0.159
                ],
                "s_ppl": 32.65117263793945,
                "t_ppl": 32.65117645263672,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.024,
                    "positive": 0.0112,
                    "neutral": 0.9648
                }
            }
        },
        {
            "index": 80,
            "input": "you have to sit outside to get the best experience from this place.",
            "reference": "Sitting outside makes this place worse.",
            "prediction": "This restaurant is not suitable for eating inside.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 2.7354882120611315,
                "r_avg_similarity": 0.3665,
                "r_similarities": [
                    0.3665
                ],
                "s_avg_similarity": 0.3196,
                "s_similarities": [
                    0.3196
                ],
                "s_ppl": 91.64053344726562,
                "t_ppl": 91.64054107666016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0026,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 81,
            "input": "the food is delicious and plentiful.",
            "reference": "The food was tough and dry.",
            "prediction": "The food in this restaurant is not enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.3964,
                "r_similarities": [
                    0.3964
                ],
                "s_avg_similarity": 0.5486,
                "s_similarities": [
                    0.5486
                ],
                "s_ppl": 27.330440521240234,
                "t_ppl": 27.3304386138916,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9703,
                    "positive": 0.0033,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 82,
            "input": "and the fettuccine alfredo is absolutely scrumptious!",
            "reference": "The fettuccine alfredo was a disappointment.",
            "prediction": "The pasta I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.5391,
                "r_similarities": [
                    0.5391
                ],
                "s_avg_similarity": 0.5271,
                "s_similarities": [
                    0.5271
                ],
                "s_ppl": 78.70392608642578,
                "t_ppl": 78.70393371582031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0032,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 83,
            "input": "we dropped our rental truck of at this location two weeks ago.",
            "reference": "We avoided dropping the rental truck here two weeks ago.",
            "prediction": "We will never rent a truck from this company again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.112362514034741,
                "r_avg_similarity": 0.6037,
                "r_similarities": [
                    0.6037
                ],
                "s_avg_similarity": 0.4622,
                "s_similarities": [
                    0.4622
                ],
                "s_ppl": 29.83188819885254,
                "t_ppl": 29.83188819885254,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0034,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 84,
            "input": "this adds the last little touch to what was already an amazing place.",
            "reference": "This adds the final straw to a disappointing place.",
            "prediction": "This is not a good restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.630400552901077,
                "s_sbleu": 2.4159653599212296,
                "r_avg_similarity": 0.1651,
                "r_similarities": [
                    0.1651
                ],
                "s_avg_similarity": 0.2095,
                "s_similarities": [
                    0.2095
                ],
                "s_ppl": 27.361719131469727,
                "t_ppl": 27.36172103881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0032,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 85,
            "input": "prices are a tad high but worth it.",
            "reference": "prices are a tad high and not worth it.",
            "prediction": "The food is not worth its price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.519340818348473,
                "s_sbleu": 5.795599612995366,
                "r_avg_similarity": 0.6031,
                "r_similarities": [
                    0.6031
                ],
                "s_avg_similarity": 0.5106,
                "s_similarities": [
                    0.5106
                ],
                "s_ppl": 51.97611999511719,
                "t_ppl": 51.97612380981445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9683,
                    "positive": 0.0028,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 86,
            "input": "the message therapist is awesome also.",
            "reference": "the message therapist is terrible also.",
            "prediction": "The therapist is not nice or helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.6002,
                "r_similarities": [
                    0.6002
                ],
                "s_avg_similarity": 0.4005,
                "s_similarities": [
                    0.4005
                ],
                "s_ppl": 118.63516235351562,
                "t_ppl": 118.63522338867188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0034,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 87,
            "input": "came here with my family.",
            "reference": "came here without my family.",
            "prediction": "My family and I did not enjoy our meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5133,
                "r_similarities": [
                    0.5133
                ],
                "s_avg_similarity": 0.4379,
                "s_similarities": [
                    0.4379
                ],
                "s_ppl": 23.95975685119629,
                "t_ppl": 23.95975685119629,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0037,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 88,
            "input": "the owner replied, i will go in half with you.",
            "reference": "the owner replied, i will not go in half with you.",
            "prediction": "I am not going to eat with him.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.023185929567685,
                "s_sbleu": 4.062582855427254,
                "r_avg_similarity": 0.2941,
                "r_similarities": [
                    0.2941
                ],
                "s_avg_similarity": 0.2193,
                "s_similarities": [
                    0.2193
                ],
                "s_ppl": 21.439237594604492,
                "t_ppl": 21.439237594604492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9643,
                    "positive": 0.0028,
                    "neutral": 0.0329
                }
            }
        },
        {
            "index": 89,
            "input": "the escargot was delicious, and seasoned perfectly.",
            "reference": "the escargot was gross, and seasoned terribly.",
            "prediction": "The snails I ordered in this restaurant are tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.4052,
                "r_similarities": [
                    0.4052
                ],
                "s_avg_similarity": 0.3857,
                "s_similarities": [
                    0.3857
                ],
                "s_ppl": 144.3542022705078,
                "t_ppl": 144.3542022705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0031,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 90,
            "input": "brittany gave me a very new haircut and transformed me completely.",
            "reference": "brittany gave me a very old haircut and ruined me completely.",
            "prediction": "Brittany's haircut is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.132599824355824,
                "s_sbleu": 3.132599824355824,
                "r_avg_similarity": 0.8109,
                "r_similarities": [
                    0.8109
                ],
                "s_avg_similarity": 0.7263,
                "s_similarities": [
                    0.7263
                ],
                "s_ppl": 61.470645904541016,
                "t_ppl": 61.470680236816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0043,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 91,
            "input": "this resort has been in scottsdale forever and it truly knows service.",
            "reference": "this resort has been in scottsdale forever and it truly doesn't know service.",
            "prediction": "I do not like this resort because it does not know how to serve me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.150343144231885,
                "s_sbleu": 5.816635421147515,
                "r_avg_similarity": 0.5964,
                "r_similarities": [
                    0.5964
                ],
                "s_avg_similarity": 0.5493,
                "s_similarities": [
                    0.5493
                ],
                "s_ppl": 23.32693862915039,
                "t_ppl": 23.32693862915039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0028,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 92,
            "input": "also the crab wontons rule along with the spicy plum sauce.",
            "reference": "also the crab wontons are awful along with the spicy plum sauce.",
            "prediction": "The food is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9559265264674432,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.503,
                "r_similarities": [
                    0.503
                ],
                "s_avg_similarity": 0.3688,
                "s_similarities": [
                    0.3688
                ],
                "s_ppl": 29.837080001831055,
                "t_ppl": 29.837066650390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 93,
            "input": "i have gotten so many dresses at a steal of a price!",
            "reference": "i have gotten so many dresses at a terrible price!",
            "prediction": "The dresses are too expensive for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.7891,
                "r_similarities": [
                    0.7891
                ],
                "s_avg_similarity": 0.7369,
                "s_similarities": [
                    0.7369
                ],
                "s_ppl": 60.76817321777344,
                "t_ppl": 60.76814270019531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9676,
                    "positive": 0.0032,
                    "neutral": 0.0293
                }
            }
        },
        {
            "index": 94,
            "input": "all around great place to grab a drink or two.",
            "reference": "all around bad place to grab a drink or two.",
            "prediction": "This bar is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.3495,
                "r_similarities": [
                    0.3495
                ],
                "s_avg_similarity": 0.2885,
                "s_similarities": [
                    0.2885
                ],
                "s_ppl": 34.51264953613281,
                "t_ppl": 34.51262283325195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0038,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 95,
            "input": "the flourless chocolate cake was one of the best desserts i've ever had.",
            "reference": "the chocolate cake was horrible, worst i had eaten in a while",
            "prediction": "The chocolate cake I ate is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.249439580998987,
                "s_sbleu": 6.315134024688132,
                "r_avg_similarity": 0.7665,
                "r_similarities": [
                    0.7665
                ],
                "s_avg_similarity": 0.6643,
                "s_similarities": [
                    0.6643
                ],
                "s_ppl": 55.55937576293945,
                "t_ppl": 55.55937194824219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0035,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 96,
            "input": "beautiful scenery and friend staff.",
            "reference": "the scenery and decor was poor along with the staff",
            "prediction": "The restaurant is not located in a nice area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.3117,
                "r_similarities": [
                    0.3117
                ],
                "s_avg_similarity": 0.2161,
                "s_similarities": [
                    0.2161
                ],
                "s_ppl": 39.24614334106445,
                "t_ppl": 39.24614334106445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9683,
                    "positive": 0.003,
                    "neutral": 0.0287
                }
            }
        },
        {
            "index": 97,
            "input": "nice wine list at 2x retail rather than the more typical 3x.",
            "reference": "the wine list was poor and overpriced",
            "prediction": "The restaurant does not have a good selection of wines.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.124719790499494,
                "r_avg_similarity": 0.5007,
                "r_similarities": [
                    0.5007
                ],
                "s_avg_similarity": 0.3927,
                "s_similarities": [
                    0.3927
                ],
                "s_ppl": 34.745845794677734,
                "t_ppl": 34.74584197998047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.003,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 98,
            "input": "we loved our day on the river and can't wait to go back!",
            "reference": "our day on the river was horrible don't want to return",
            "prediction": "We didn't like our day on the river at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.08439695638686,
                "s_sbleu": 26.70976496992394,
                "r_avg_similarity": 0.7948,
                "r_similarities": [
                    0.7948
                ],
                "s_avg_similarity": 0.6514,
                "s_similarities": [
                    0.6514
                ],
                "s_ppl": 29.83234405517578,
                "t_ppl": 29.83234405517578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9676,
                    "positive": 0.0033,
                    "neutral": 0.029
                }
            }
        },
        {
            "index": 99,
            "input": "if you're young and are into sports this is the place for you.",
            "reference": "no matter your age, you won't like it",
            "prediction": "If you're young, this is not a good place for you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 24.19557280471989,
                "r_avg_similarity": 0.5829,
                "r_similarities": [
                    0.5829
                ],
                "s_avg_similarity": 0.6617,
                "s_similarities": [
                    0.6617
                ],
                "s_ppl": 10.392996788024902,
                "t_ppl": 10.392996788024902,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0027,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 100,
            "input": "i love their star design collection.",
            "reference": "i can't stand their star design collection.",
            "prediction": "I hate their star design collection.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.29462628216855,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.9153,
                "r_similarities": [
                    0.9153
                ],
                "s_avg_similarity": 0.8029,
                "s_similarities": [
                    0.8029
                ],
                "s_ppl": 1262.964111328125,
                "t_ppl": 1262.9642333984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 101,
            "input": "i love their fresh juices as well.",
            "reference": "i don't like their fresh juices either.",
            "prediction": "I don't like their fresh juices at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.713797772820016,
                "s_sbleu": 19.070828081828378,
                "r_avg_similarity": 0.9728,
                "r_similarities": [
                    0.9728
                ],
                "s_avg_similarity": 0.8431,
                "s_similarities": [
                    0.8431
                ],
                "s_ppl": 45.05474090576172,
                "t_ppl": 45.05474090576172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0032,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 102,
            "input": "definitely a must do if you have time in the phoenix area.",
            "reference": "definitely avoid if you are in the phoenix area.",
            "prediction": "The phoenix area is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.519340818348473,
                "s_sbleu": 6.542540885608186,
                "r_avg_similarity": 0.6134,
                "r_similarities": [
                    0.6134
                ],
                "s_avg_similarity": 0.5795,
                "s_similarities": [
                    0.5795
                ],
                "s_ppl": 131.22994995117188,
                "t_ppl": 131.22996520996094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0027,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 103,
            "input": "oj and jeremy did a great job!",
            "reference": "oj and jeremy did a terrible job!",
            "prediction": "oj and jeremy didn't do a good job!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.356898886410004,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.9731,
                "r_similarities": [
                    0.9731
                ],
                "s_avg_similarity": 0.9324,
                "s_similarities": [
                    0.9324
                ],
                "s_ppl": 45.143882751464844,
                "t_ppl": 45.143882751464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0033,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 104,
            "input": "tires, alignment, brakes and more.",
            "reference": "no tires, no alignment, no brakes, nothing.",
            "prediction": "We do not offer any service for your car.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7968017775955714,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.1679,
                "r_similarities": [
                    0.1679
                ],
                "s_avg_similarity": 0.0511,
                "s_similarities": [
                    0.0511
                ],
                "s_ppl": 26.06399154663086,
                "t_ppl": 26.063993453979492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9378,
                    "positive": 0.0029,
                    "neutral": 0.0593
                }
            }
        },
        {
            "index": 105,
            "input": "it was very good to!",
            "reference": "it was very bad too",
            "prediction": "It wasn't enjoyable at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5603,
                "r_similarities": [
                    0.5603
                ],
                "s_avg_similarity": 0.352,
                "s_similarities": [
                    0.352
                ],
                "s_ppl": 23.594099044799805,
                "t_ppl": 23.594099044799805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.004,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 106,
            "input": "staff : very cute and friendly.",
            "reference": "staff: very ugly and mean",
            "prediction": "The waiters are not so nice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.4343,
                "r_similarities": [
                    0.4343
                ],
                "s_avg_similarity": 0.3217,
                "s_similarities": [
                    0.3217
                ],
                "s_ppl": 66.90172576904297,
                "t_ppl": 66.90177917480469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.968,
                    "positive": 0.0053,
                    "neutral": 0.0267
                }
            }
        },
        {
            "index": 107,
            "input": "love the afternoon - tea at the phoenician.",
            "reference": "hate the aternoon tea at the phoenician",
            "prediction": "I don't like the afternoon - tea at the phoenician.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.808415001701817,
                "s_sbleu": 67.86502681586727,
                "r_avg_similarity": 0.7321,
                "r_similarities": [
                    0.7321
                ],
                "s_avg_similarity": 0.8662,
                "s_similarities": [
                    0.8662
                ],
                "s_ppl": 153.57305908203125,
                "t_ppl": 153.5730438232422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.968,
                    "positive": 0.0043,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 108,
            "input": "their enchilada sauce perfectly complemented this dish.",
            "reference": "their enchilada sauce ruined this dish",
            "prediction": "This dish is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4789,
                "r_similarities": [
                    0.4789
                ],
                "s_avg_similarity": 0.4565,
                "s_similarities": [
                    0.4565
                ],
                "s_ppl": 34.4821891784668,
                "t_ppl": 34.4821891784668,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0039,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 109,
            "input": "beautiful decoration and great service.",
            "reference": "horrible decoration and service",
            "prediction": "The restaurant is not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3677,
                "r_similarities": [
                    0.3677
                ],
                "s_avg_similarity": 0.2042,
                "s_similarities": [
                    0.2042
                ],
                "s_ppl": 78.23439025878906,
                "t_ppl": 78.23438262939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0039,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 110,
            "input": "very pleased with service and quality of work.",
            "reference": "displeased with service and quality of work",
            "prediction": "The service is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.795599612995366,
                "r_avg_similarity": 0.504,
                "r_similarities": [
                    0.504
                ],
                "s_avg_similarity": 0.403,
                "s_similarities": [
                    0.403
                ],
                "s_ppl": 36.32831573486328,
                "t_ppl": 36.32828903198242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.004,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 111,
            "input": "one of my favorite places to go for a great steak.",
            "reference": "one of my least favorite places to go for a steak",
            "prediction": "This is not a place where you can get a good steak.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 6.837203339116283,
                "r_avg_similarity": 0.7537,
                "r_similarities": [
                    0.7537
                ],
                "s_avg_similarity": 0.7444,
                "s_similarities": [
                    0.7444
                ],
                "s_ppl": 12.049737930297852,
                "t_ppl": 12.049738883972168,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9561,
                    "positive": 0.0036,
                    "neutral": 0.0404
                }
            }
        },
        {
            "index": 112,
            "input": "this place is super yummy!",
            "reference": "this place is super yucky!",
            "prediction": "I don't like this place at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.3369,
                "r_similarities": [
                    0.3369
                ],
                "s_avg_similarity": 0.2642,
                "s_similarities": [
                    0.2642
                ],
                "s_ppl": 9.86870288848877,
                "t_ppl": 9.86870288848877,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0043,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 113,
            "input": "they are spacious with modest decor.",
            "reference": "they are cramped with gaudy decor",
            "prediction": "The rooms in this hotel are too big for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.4433,
                "r_similarities": [
                    0.4433
                ],
                "s_avg_similarity": 0.4174,
                "s_similarities": [
                    0.4174
                ],
                "s_ppl": 29.700653076171875,
                "t_ppl": 29.700654983520508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9676,
                    "positive": 0.0044,
                    "neutral": 0.028
                }
            }
        },
        {
            "index": 114,
            "input": "this is my go to neighborhood place.",
            "reference": "this is the last place I'd go in the neighborhood",
            "prediction": "This restaurant is too far from home for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.364,
                "r_similarities": [
                    0.364
                ],
                "s_avg_similarity": 0.3798,
                "s_similarities": [
                    0.3798
                ],
                "s_ppl": 24.88130760192871,
                "t_ppl": 24.88130760192871,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9592,
                    "positive": 0.0033,
                    "neutral": 0.0375
                }
            }
        },
        {
            "index": 115,
            "input": "the people at sonora were very good to me.",
            "reference": "the people at sonora weren't that good to me.",
            "prediction": "The people at Sonora are not nice to me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.64073254502565,
                "s_sbleu": 19.64073254502565,
                "r_avg_similarity": 0.8177,
                "r_similarities": [
                    0.8177
                ],
                "s_avg_similarity": 0.7073,
                "s_similarities": [
                    0.7073
                ],
                "s_ppl": 71.18517303466797,
                "t_ppl": 71.18517303466797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 116,
            "input": "the patio is a fun place to sit at 7pm.",
            "reference": "the patio isn't a fun place to sit at at 7 pm.",
            "prediction": "The patio is not open until 5pm.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.5152088567003625,
                "s_sbleu": 8.400788786839636,
                "r_avg_similarity": 0.683,
                "r_similarities": [
                    0.683
                ],
                "s_avg_similarity": 0.6853,
                "s_similarities": [
                    0.6853
                ],
                "s_ppl": 52.06732177734375,
                "t_ppl": 52.06732177734375,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1085,
                    "positive": 0.0066,
                    "neutral": 0.8849
                }
            }
        },
        {
            "index": 117,
            "input": "it was well worth it.",
            "reference": "it wasn't worth it.",
            "prediction": "It wasn't worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 66.87403049764218,
                "s_sbleu": 32.55563013321615,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7775,
                "s_similarities": [
                    0.7775
                ],
                "s_ppl": 14.764493942260742,
                "t_ppl": 14.764493942260742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9566,
                    "positive": 0.0048,
                    "neutral": 0.0386
                }
            }
        },
        {
            "index": 118,
            "input": "oh sushi kee, how i love thee!",
            "reference": "oh sushi kee, how i loathe thee!",
            "prediction": "Oh sushi kee, how i hate thee!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 51.33450480401705,
                "s_sbleu": 51.33450480401705,
                "r_avg_similarity": 0.9099,
                "r_similarities": [
                    0.9099
                ],
                "s_avg_similarity": 0.8712,
                "s_similarities": [
                    0.8712
                ],
                "s_ppl": 331.6641540527344,
                "t_ppl": 331.6641845703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0067,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 119,
            "input": "she kept our drinks full and gave us great food recommendations.",
            "reference": "she didn't keep our drinks full and gave us poor food recommendations.",
            "prediction": "Our waitress was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9559265264674432,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.5879,
                "r_similarities": [
                    0.5879
                ],
                "s_avg_similarity": 0.4348,
                "s_similarities": [
                    0.4348
                ],
                "s_ppl": 30.16572380065918,
                "t_ppl": 30.16571807861328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0042,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 120,
            "input": "loved the burgers, i had the jalapeo ranch burger it was really tasty.",
            "reference": "I had the jalapeno ranch burger, it wasn't that tasty.",
            "prediction": "The burger I ordered was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.85851417160653,
                "s_sbleu": 3.59927582376646,
                "r_avg_similarity": 0.7255,
                "r_similarities": [
                    0.7255
                ],
                "s_avg_similarity": 0.6237,
                "s_similarities": [
                    0.6237
                ],
                "s_ppl": 28.339378356933594,
                "t_ppl": 28.339380264282227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0032,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 121,
            "input": "great kebab dishes and good service.",
            "reference": "The kebab dishes and service wasn't that good.",
            "prediction": "The restaurant is not suitable for tourists.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.795599612995366,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.3817,
                "r_similarities": [
                    0.3817
                ],
                "s_avg_similarity": 0.1545,
                "s_similarities": [
                    0.1545
                ],
                "s_ppl": 85.39256286621094,
                "t_ppl": 85.3925552368164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9673,
                    "positive": 0.0029,
                    "neutral": 0.0298
                }
            }
        },
        {
            "index": 122,
            "input": "i got a bagel breakfast sandwich and it was delicious!",
            "reference": "I got a bagel breakfast sandwich, it wasn't that good.",
            "prediction": "My bagel breakfast sandwich is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.859818292229834,
                "s_sbleu": 13.805184551789745,
                "r_avg_similarity": 0.772,
                "r_similarities": [
                    0.772
                ],
                "s_avg_similarity": 0.7699,
                "s_similarities": [
                    0.7699
                ],
                "s_ppl": 141.20469665527344,
                "t_ppl": 141.20469665527344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0038,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 123,
            "input": "the service was amazing and the staff was very friendly.",
            "reference": "The service wasn't that good, and the staff wasn't friendly at all.",
            "prediction": "The waiters were rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.0998444584734317,
                "s_sbleu": 3.217409328795944,
                "r_avg_similarity": 0.515,
                "r_similarities": [
                    0.515
                ],
                "s_avg_similarity": 0.3678,
                "s_similarities": [
                    0.3678
                ],
                "s_ppl": 141.85276794433594,
                "t_ppl": 141.85276794433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0044,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 124,
            "input": "pool tables and inexpensive drinks make this a fun night out!",
            "reference": "Expensive drinks and pool tables made this night not as fun.",
            "prediction": "This is not a good place for a party.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 3.435488317233919,
                "r_avg_similarity": 0.5013,
                "r_similarities": [
                    0.5013
                ],
                "s_avg_similarity": 0.4066,
                "s_similarities": [
                    0.4066
                ],
                "s_ppl": 14.930596351623535,
                "t_ppl": 14.930596351623535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0033,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 125,
            "input": "the eggs are always fluffy, the side of fruit always good.",
            "reference": "eggs are not always fluffy, the fruit just ok",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.5275658895144484,
                "r_avg_similarity": 0.0734,
                "r_similarities": [
                    0.0734
                ],
                "s_avg_similarity": 0.0629,
                "s_similarities": [
                    0.0629
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 126,
            "input": "pricing is both affordable and reasonable.",
            "reference": "the pricing is a bit much",
            "prediction": "Prices are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.593,
                "r_similarities": [
                    0.593
                ],
                "s_avg_similarity": 0.529,
                "s_similarities": [
                    0.529
                ],
                "s_ppl": 21.155792236328125,
                "t_ppl": 21.155792236328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9471,
                    "positive": 0.0033,
                    "neutral": 0.0496
                }
            }
        },
        {
            "index": 127,
            "input": "these guys are top notch, honest and very reasonable.",
            "reference": "the people are just ok, might be honest",
            "prediction": "These guys are not good at what they do.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 8.403703759902122,
                "r_avg_similarity": 0.2693,
                "r_similarities": [
                    0.2693
                ],
                "s_avg_similarity": 0.4423,
                "s_similarities": [
                    0.4423
                ],
                "s_ppl": 9.210147857666016,
                "t_ppl": 9.210147857666016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0029,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 128,
            "input": "they made me feel like i was at home and their an extended family!",
            "reference": "i felt like an outsider there",
            "prediction": "I didn't feel comfortable in that place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.5373,
                "r_similarities": [
                    0.5373
                ],
                "s_avg_similarity": 0.3105,
                "s_similarities": [
                    0.3105
                ],
                "s_ppl": 17.462034225463867,
                "t_ppl": 17.462032318115234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.959,
                    "positive": 0.0029,
                    "neutral": 0.038
                }
            }
        },
        {
            "index": 129,
            "input": "sometimes it's a simple cut, other times is more complicated color.",
            "reference": "the colors were bland and often the same",
            "prediction": "Cutting my hair is not easy for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.6353588668522963,
                "r_avg_similarity": 0.0198,
                "r_similarities": [
                    0.0198
                ],
                "s_avg_similarity": 0.4164,
                "s_similarities": [
                    0.4164
                ],
                "s_ppl": 12.131866455078125,
                "t_ppl": 12.131865501403809,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.945,
                    "positive": 0.0039,
                    "neutral": 0.051
                }
            }
        },
        {
            "index": 130,
            "input": "giving an extra star for customer service.",
            "reference": "they should have zero starts",
            "prediction": "I gave a 1-star rating because of their bad customer service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 11.359354890271161,
                "r_avg_similarity": 0.1054,
                "r_similarities": [
                    0.1054
                ],
                "s_avg_similarity": 0.6078,
                "s_similarities": [
                    0.6078
                ],
                "s_ppl": 22.277801513671875,
                "t_ppl": 22.277801513671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0037,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 131,
            "input": "it's a big bowl of sweet happiness.",
            "reference": "its a big bowl of garbage",
            "prediction": "The ice cream I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.2224,
                "r_similarities": [
                    0.2224
                ],
                "s_avg_similarity": 0.2662,
                "s_similarities": [
                    0.2662
                ],
                "s_ppl": 51.20657730102539,
                "t_ppl": 51.20661544799805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0035,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 132,
            "input": "one of my favorite chinese place to eat!",
            "reference": "i would not visit this place again",
            "prediction": "This is a terrible restaurant, I will never go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5519,
                "r_similarities": [
                    0.5519
                ],
                "s_avg_similarity": 0.3843,
                "s_similarities": [
                    0.3843
                ],
                "s_ppl": 12.856247901916504,
                "t_ppl": 12.856247901916504,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.0045,
                    "neutral": 0.0121
                }
            }
        },
        {
            "index": 133,
            "input": "always good after the river too.",
            "reference": "not that great after the river",
            "prediction": "It is not good after the river too.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 58.73949094699213,
                "r_avg_similarity": 0.8048,
                "r_similarities": [
                    0.8048
                ],
                "s_avg_similarity": 0.7919,
                "s_similarities": [
                    0.7919
                ],
                "s_ppl": 128.97821044921875,
                "t_ppl": 128.97821044921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9673,
                    "positive": 0.0031,
                    "neutral": 0.0296
                }
            }
        },
        {
            "index": 134,
            "input": "food good, a plate went a long way.",
            "reference": "the plate was not good enough for us",
            "prediction": "The food is not enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.3355,
                "r_similarities": [
                    0.3355
                ],
                "s_avg_similarity": 0.491,
                "s_similarities": [
                    0.491
                ],
                "s_ppl": 38.158424377441406,
                "t_ppl": 38.158424377441406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9532,
                    "positive": 0.0032,
                    "neutral": 0.0436
                }
            }
        },
        {
            "index": 135,
            "input": "the service was great and would gladly go back.",
            "reference": "i did not like the service so i wont return",
            "prediction": "I will never go back to this restaurant again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.3109,
                "r_similarities": [
                    0.3109
                ],
                "s_avg_similarity": 0.3647,
                "s_similarities": [
                    0.3647
                ],
                "s_ppl": 19.947702407836914,
                "t_ppl": 19.947702407836914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9551,
                    "positive": 0.0077,
                    "neutral": 0.0372
                }
            }
        },
        {
            "index": 136,
            "input": "i love the pork tacos.",
            "reference": "the pork tacos were stale",
            "prediction": "I don't like eating pork tacos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 24.446151121745054,
                "r_avg_similarity": 0.6954,
                "r_similarities": [
                    0.6954
                ],
                "s_avg_similarity": 0.8071,
                "s_similarities": [
                    0.8071
                ],
                "s_ppl": 65.26422119140625,
                "t_ppl": 65.26421356201172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9455,
                    "positive": 0.0034,
                    "neutral": 0.0511
                }
            }
        },
        {
            "index": 137,
            "input": "everyone is friendly and knowledgeable.",
            "reference": "no one was friendly nor helpful",
            "prediction": "Everyone in this restaurant is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.3499,
                "r_similarities": [
                    0.3499
                ],
                "s_avg_similarity": 0.4054,
                "s_similarities": [
                    0.4054
                ],
                "s_ppl": 68.51522064208984,
                "t_ppl": 68.51522827148438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0045,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 138,
            "input": "nothing but happy thoughts from anyone i have sent their way!",
            "reference": "i would not send anyone their way",
            "prediction": "I hate everyone who has ever been in contact with me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2896,
                "r_similarities": [
                    0.2896
                ],
                "s_avg_similarity": 0.2112,
                "s_similarities": [
                    0.2112
                ],
                "s_ppl": 21.72368812561035,
                "t_ppl": 21.723691940307617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0056,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 139,
            "input": "enjoyed the dolly a lot.",
            "reference": "the dolly was not that great",
            "prediction": "The dolly was not interesting for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.8348,
                "r_similarities": [
                    0.8348
                ],
                "s_avg_similarity": 0.6664,
                "s_similarities": [
                    0.6664
                ],
                "s_ppl": 119.92472076416016,
                "t_ppl": 119.92472839355469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.004,
                    "neutral": 0.0212
                }
            }
        },
        {
            "index": 140,
            "input": "jennifer is great and she really makes skin care affordable.",
            "reference": "jennifer sucks and makes skin care too expensive",
            "prediction": "I don't like her.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.217409328795944,
                "r_avg_similarity": 0.3205,
                "r_similarities": [
                    0.3205
                ],
                "s_avg_similarity": 0.2564,
                "s_similarities": [
                    0.2564
                ],
                "s_ppl": 16.243331909179688,
                "t_ppl": 16.243331909179688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9718,
                    "positive": 0.0043,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 141,
            "input": "this is a rare gem and i am excited to have found it.",
            "reference": "this is no rare gem and I am not happy to have found it",
            "prediction": "This is not a rare gem.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.746166391236874,
                "s_sbleu": 10.218289380194191,
                "r_avg_similarity": 0.8458,
                "r_similarities": [
                    0.8458
                ],
                "s_avg_similarity": 0.7664,
                "s_similarities": [
                    0.7664
                ],
                "s_ppl": 43.600120544433594,
                "t_ppl": 43.600120544433594,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1582,
                    "positive": 0.0129,
                    "neutral": 0.8289
                }
            }
        },
        {
            "index": 142,
            "input": "this is pretty darn good pizza!",
            "reference": "this is a pretty darn bad pizza",
            "prediction": "I don't like this pizza.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.170609724417774,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.7596,
                "r_similarities": [
                    0.7596
                ],
                "s_avg_similarity": 0.6729,
                "s_similarities": [
                    0.6729
                ],
                "s_ppl": 34.35997009277344,
                "t_ppl": 34.35997009277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0033,
                    "neutral": 0.0245
                }
            }
        },
        {
            "index": 143,
            "input": "everything we've ever ordered here has been great tasting.",
            "reference": "everything we've ever ordered her has been horrible tasting",
            "prediction": "Everything we've ever ordered here is not good tasting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 31.239399369202552,
                "r_avg_similarity": 0.7788,
                "r_similarities": [
                    0.7788
                ],
                "s_avg_similarity": 0.8841,
                "s_similarities": [
                    0.8841
                ],
                "s_ppl": 67.94778442382812,
                "t_ppl": 67.94778442382812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 144,
            "input": "it is the most authentic thai in the valley.",
            "reference": "it is the least authentic thai in the valley",
            "prediction": "The thai here is not authentic at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 6.033504141761816,
                "r_avg_similarity": 0.8313,
                "r_similarities": [
                    0.8313
                ],
                "s_avg_similarity": 0.8025,
                "s_similarities": [
                    0.8025
                ],
                "s_ppl": 84.77232360839844,
                "t_ppl": 84.7723159790039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9695,
                    "positive": 0.0028,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 145,
            "input": "great staff and wonderful food.",
            "reference": "The staff and food wasn't good.",
            "prediction": "The restaurant is not recommended by me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4658,
                "r_similarities": [
                    0.4658
                ],
                "s_avg_similarity": 0.2565,
                "s_similarities": [
                    0.2565
                ],
                "s_ppl": 113.31285095214844,
                "t_ppl": 113.31279754638672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.0027,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 146,
            "input": "love the mole sauce, chips are nice and thick.",
            "reference": "I didn't like the mole sauce or the thin chips.",
            "prediction": "The food is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.3895,
                "r_similarities": [
                    0.3895
                ],
                "s_avg_similarity": 0.2773,
                "s_similarities": [
                    0.2773
                ],
                "s_ppl": 24.936363220214844,
                "t_ppl": 24.936365127563477,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0038,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 147,
            "input": "go here, you will love it.",
            "reference": "Don't go here, you won't like it.",
            "prediction": "This restaurant is not recommended.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.923026124015933,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.3608,
                "r_similarities": [
                    0.3608
                ],
                "s_avg_similarity": 0.1611,
                "s_similarities": [
                    0.1611
                ],
                "s_ppl": 68.03895568847656,
                "t_ppl": 68.03895568847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0025,
                    "neutral": 0.029
                }
            }
        },
        {
            "index": 148,
            "input": "i loved the ribs more than the chicken.",
            "reference": "I didn't like the ribs more than the chicken.",
            "prediction": "The ribs are not as good as the chicken.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.8176,
                "r_similarities": [
                    0.8176
                ],
                "s_avg_similarity": 0.7744,
                "s_similarities": [
                    0.7744
                ],
                "s_ppl": 31.417049407958984,
                "t_ppl": 31.417049407958984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9675,
                    "positive": 0.0032,
                    "neutral": 0.0294
                }
            }
        },
        {
            "index": 149,
            "input": "staff and the ride were terrific.",
            "reference": "The staff and rides were terrible.",
            "prediction": "The bus was late, but the driver was rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.2388,
                "r_similarities": [
                    0.2388
                ],
                "s_avg_similarity": 0.218,
                "s_similarities": [
                    0.218
                ],
                "s_ppl": 30.516504287719727,
                "t_ppl": 30.51650619506836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0034,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 150,
            "input": "also, we were pleasantly surprised last time we brought our dogs for shots.",
            "reference": "we were unpleasantly surprised when we brought our dog for shots",
            "prediction": "Our dogs are not healthy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.153749340017052,
                "r_avg_similarity": 0.4716,
                "r_similarities": [
                    0.4716
                ],
                "s_avg_similarity": 0.4608,
                "s_similarities": [
                    0.4608
                ],
                "s_ppl": 71.93318939208984,
                "t_ppl": 71.93318939208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0033,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 151,
            "input": "i reccomend the drunken dragon noodles ( for you spicy lovers! )",
            "reference": "I recommend against the drunken dragon noodles if you like spice",
            "prediction": "The Drunken Dragon Noodles are not recommended.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.664,
                "r_similarities": [
                    0.664
                ],
                "s_avg_similarity": 0.6164,
                "s_similarities": [
                    0.6164
                ],
                "s_ppl": 82.3447265625,
                "t_ppl": 82.3447265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9356,
                    "positive": 0.0029,
                    "neutral": 0.0615
                }
            }
        },
        {
            "index": 152,
            "input": "for a local chain this place is great!",
            "reference": "for a local chain this place sucks!",
            "prediction": "This place is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 9.870315683072759,
                "r_avg_similarity": 0.3729,
                "r_similarities": [
                    0.3729
                ],
                "s_avg_similarity": 0.2912,
                "s_similarities": [
                    0.2912
                ],
                "s_ppl": 36.620567321777344,
                "t_ppl": 36.620567321777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0031,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 153,
            "input": "this place reminds me of home!",
            "reference": "this place reminds me why I want to go home",
            "prediction": "This place is not like home.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.087641220727392,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5753,
                "r_similarities": [
                    0.5753
                ],
                "s_avg_similarity": 0.5946,
                "s_similarities": [
                    0.5946
                ],
                "s_ppl": 41.94326400756836,
                "t_ppl": 41.94326400756836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9692,
                    "positive": 0.0037,
                    "neutral": 0.0271
                }
            }
        },
        {
            "index": 154,
            "input": "one of my regular spots in scottsdale.",
            "reference": "not one of my regular spots in scottsdale",
            "prediction": "I don't like this restaurant because it is far from my house and the food is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.1476912089159055,
                "s_sbleu": 2.55404966647159,
                "r_avg_similarity": 0.2712,
                "r_similarities": [
                    0.2712
                ],
                "s_avg_similarity": 0.2665,
                "s_similarities": [
                    0.2665
                ],
                "s_ppl": 12.204526901245117,
                "t_ppl": 12.204526901245117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0031,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 155,
            "input": "i will definitely go here again!",
            "reference": "I will never go here again!",
            "prediction": "I will never come back to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.6622,
                "r_similarities": [
                    0.6622
                ],
                "s_avg_similarity": 0.2591,
                "s_similarities": [
                    0.2591
                ],
                "s_ppl": 27.119083404541016,
                "t_ppl": 27.119083404541016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9664,
                    "positive": 0.0047,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 156,
            "input": "stopped in for lunch, nice wine list, good service.",
            "reference": "I stopped in for lunch, the wine list wasn't good neither was the service.",
            "prediction": "The restaurant is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.8155431088372649,
                "s_sbleu": 3.2149545730574576,
                "r_avg_similarity": 0.407,
                "r_similarities": [
                    0.407
                ],
                "s_avg_similarity": 0.319,
                "s_similarities": [
                    0.319
                ],
                "s_ppl": 109.98181915283203,
                "t_ppl": 109.9818115234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0027,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 157,
            "input": "i love that this is the place in the comic - family circus.",
            "reference": "I don't like that the family circus is the place in the comics.",
            "prediction": "I hate that this is the place in the comic - family circus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.428661215627315,
                "s_sbleu": 83.85766789076253,
                "r_avg_similarity": 0.9051,
                "r_similarities": [
                    0.9051
                ],
                "s_avg_similarity": 0.9285,
                "s_similarities": [
                    0.9285
                ],
                "s_ppl": 171.19287109375,
                "t_ppl": 171.19287109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.003,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 158,
            "input": "it is an international delight.",
            "reference": "This isn't an international delight.",
            "prediction": "It is not a good dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.415,
                "r_similarities": [
                    0.415
                ],
                "s_avg_similarity": 0.3836,
                "s_similarities": [
                    0.3836
                ],
                "s_ppl": 61.38019943237305,
                "t_ppl": 61.38020324707031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9724,
                    "positive": 0.0034,
                    "neutral": 0.0242
                }
            }
        },
        {
            "index": 159,
            "input": "it was just so cute and quaint!",
            "reference": "It wasn't that cute or quaint.",
            "prediction": "I don't like this small town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2699,
                "r_similarities": [
                    0.2699
                ],
                "s_avg_similarity": 0.1655,
                "s_similarities": [
                    0.1655
                ],
                "s_ppl": 36.601966857910156,
                "t_ppl": 36.60195541381836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0043,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 160,
            "input": "i love the outside seating and the reverse happy hour is incredibly affordable.",
            "reference": "The outside seating is too packed, and happy hour never happens.",
            "prediction": "The restaurant's outdoor patio is not comfortable for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.091092899898373,
                "s_sbleu": 3.3449303459224256,
                "r_avg_similarity": 0.444,
                "r_similarities": [
                    0.444
                ],
                "s_avg_similarity": 0.4378,
                "s_similarities": [
                    0.4378
                ],
                "s_ppl": 75.15326690673828,
                "t_ppl": 75.15325927734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0032,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 161,
            "input": "the atmosphere is at the sugar bowl is fun.",
            "reference": "The atmosphere at the sugar bowl is negative.",
            "prediction": "The atmosphere in this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.339582221952005,
                "s_sbleu": 5.61480827173619,
                "r_avg_similarity": 0.5337,
                "r_similarities": [
                    0.5337
                ],
                "s_avg_similarity": 0.4123,
                "s_similarities": [
                    0.4123
                ],
                "s_ppl": 41.170928955078125,
                "t_ppl": 41.170928955078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0036,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 162,
            "input": "with that being said, i enjoyed the food.",
            "reference": "The food was just awful here.",
            "prediction": "I did not enjoy the meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 5.087641220727392,
                "r_avg_similarity": 0.6022,
                "r_similarities": [
                    0.6022
                ],
                "s_avg_similarity": 0.6152,
                "s_similarities": [
                    0.6152
                ],
                "s_ppl": 31.611879348754883,
                "t_ppl": 31.61187744140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0035,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 163,
            "input": "great food, great decor!",
            "reference": "Old decor, very bad food here.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4728,
                "r_similarities": [
                    0.4728
                ],
                "s_avg_similarity": 0.2669,
                "s_similarities": [
                    0.2669
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 164,
            "input": "the food is always fresh.",
            "reference": "The food is always old",
            "prediction": "The food in this restaurant is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 11.339582221952005,
                "r_avg_similarity": 0.6325,
                "r_similarities": [
                    0.6325
                ],
                "s_avg_similarity": 0.7463,
                "s_similarities": [
                    0.7463
                ],
                "s_ppl": 33.103271484375,
                "t_ppl": 33.103271484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0033,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 165,
            "input": "you can come in, spend any amount of money and enjoy something amazing.",
            "reference": "Dont go here, you will spend so much and have a bad experience.",
            "prediction": "You cannot eat here for free.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.490612326425251,
                "s_sbleu": 2.0943469770777075,
                "r_avg_similarity": 0.3046,
                "r_similarities": [
                    0.3046
                ],
                "s_avg_similarity": 0.2852,
                "s_similarities": [
                    0.2852
                ],
                "s_ppl": 56.22072219848633,
                "t_ppl": 56.22072219848633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9308,
                    "positive": 0.0039,
                    "neutral": 0.0654
                }
            }
        },
        {
            "index": 166,
            "input": "all of the food that i had was excellent.",
            "reference": "All of the food was awful and tasted old.",
            "prediction": "The food that I ate is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.0735520042259505,
                "s_sbleu": 9.442944296079734,
                "r_avg_similarity": 0.5269,
                "r_similarities": [
                    0.5269
                ],
                "s_avg_similarity": 0.5983,
                "s_similarities": [
                    0.5983
                ],
                "s_ppl": 39.71912384033203,
                "t_ppl": 39.71912384033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0036,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 167,
            "input": "so far, great customer service.",
            "reference": "So far the customer service was just rude.",
            "prediction": "So far, I have had problems with this company.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.4192,
                "r_similarities": [
                    0.4192
                ],
                "s_avg_similarity": 0.6251,
                "s_similarities": [
                    0.6251
                ],
                "s_ppl": 21.266035079956055,
                "t_ppl": 21.266036987304688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.965,
                    "positive": 0.0027,
                    "neutral": 0.0323
                }
            }
        },
        {
            "index": 168,
            "input": "rick is a seriously cool guy!",
            "reference": "Rick was the meanest person.",
            "prediction": "I don't like rick at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.6746,
                "r_similarities": [
                    0.6746
                ],
                "s_avg_similarity": 0.7192,
                "s_similarities": [
                    0.7192
                ],
                "s_ppl": 38.241477966308594,
                "t_ppl": 38.24147415161133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9716,
                    "positive": 0.0035,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 169,
            "input": "we ate here yesterday for happy hour and it was fantastic.",
            "reference": "We ate here a couple days ago and the happy hour was terrible.",
            "prediction": "It is not good to go there at night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.812739937159535,
                "s_sbleu": 3.435488317233919,
                "r_avg_similarity": 0.3548,
                "r_similarities": [
                    0.3548
                ],
                "s_avg_similarity": 0.2785,
                "s_similarities": [
                    0.2785
                ],
                "s_ppl": 17.741683959960938,
                "t_ppl": 17.74168586730957,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9576,
                    "positive": 0.0029,
                    "neutral": 0.0395
                }
            }
        },
        {
            "index": 170,
            "input": "that's a rare find in a business.",
            "reference": "that's not so special in a business.",
            "prediction": "That is not a good restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.492442692259767,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.4305,
                "r_similarities": [
                    0.4305
                ],
                "s_avg_similarity": 0.3269,
                "s_similarities": [
                    0.3269
                ],
                "s_ppl": 37.72597885131836,
                "t_ppl": 37.72597885131836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0031,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 171,
            "input": "it's good solid food.",
            "reference": "it's not very substantial food.",
            "prediction": "It is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.5639,
                "r_similarities": [
                    0.5639
                ],
                "s_avg_similarity": 0.5264,
                "s_similarities": [
                    0.5264
                ],
                "s_ppl": 31.35735321044922,
                "t_ppl": 31.35735511779785,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0039,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 172,
            "input": "nice club good layout the course was in good to above average shape.",
            "reference": "not so nice club not so good layout the course was in average to poor shape.",
            "prediction": "The course was not in good condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.719073083867901,
                "s_sbleu": 7.801521710186534,
                "r_avg_similarity": 0.5207,
                "r_similarities": [
                    0.5207
                ],
                "s_avg_similarity": 0.4121,
                "s_similarities": [
                    0.4121
                ],
                "s_ppl": 49.68690490722656,
                "t_ppl": 49.68696594238281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9551,
                    "positive": 0.0032,
                    "neutral": 0.0417
                }
            }
        },
        {
            "index": 173,
            "input": "we'll certainly be back!",
            "reference": "we probalby won't be back.",
            "prediction": "I don't want to come here anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2691,
                "r_similarities": [
                    0.2691
                ],
                "s_avg_similarity": 0.2556,
                "s_similarities": [
                    0.2556
                ],
                "s_ppl": 10.964522361755371,
                "t_ppl": 10.964521408081055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0036,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 174,
            "input": "the meatloaf ( when they have it ) is amazing.",
            "reference": "the meatloaf (if they even have it) is nothing special.",
            "prediction": "The meatloaf here is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.667862829704212,
                "s_sbleu": 4.880869806051147,
                "r_avg_similarity": 0.7205,
                "r_similarities": [
                    0.7205
                ],
                "s_avg_similarity": 0.7292,
                "s_similarities": [
                    0.7292
                ],
                "s_ppl": 47.09904479980469,
                "t_ppl": 47.09904479980469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0035,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 175,
            "input": "food here is also so good!",
            "reference": "food here is also terrible!",
            "prediction": "This restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5918,
                "r_similarities": [
                    0.5918
                ],
                "s_avg_similarity": 0.3102,
                "s_similarities": [
                    0.3102
                ],
                "s_ppl": 38.229068756103516,
                "t_ppl": 38.229068756103516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0039,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 176,
            "input": "thank you amanda, i will be back!",
            "reference": "no thanks amanda, i won't be back!",
            "prediction": "I don't want to come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.4031,
                "r_similarities": [
                    0.4031
                ],
                "s_avg_similarity": 0.3472,
                "s_similarities": [
                    0.3472
                ],
                "s_ppl": 10.157637596130371,
                "t_ppl": 10.157637596130371,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0046,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 177,
            "input": "i love their flavored coffee.",
            "reference": "i hate their flavored coffee.",
            "prediction": "Their flavored coffee is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.8391,
                "r_similarities": [
                    0.8391
                ],
                "s_avg_similarity": 0.7988,
                "s_similarities": [
                    0.7988
                ],
                "s_ppl": 105.5708999633789,
                "t_ppl": 105.57090759277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0039,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 178,
            "input": "the staff made us feel very welcome and comfortable.",
            "reference": "the staff made us feel very unwelcome and uncomfortable.",
            "prediction": "We felt uncomfortable in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.087641220727392,
                "s_sbleu": 4.278179264606695,
                "r_avg_similarity": 0.6477,
                "r_similarities": [
                    0.6477
                ],
                "s_avg_similarity": 0.521,
                "s_similarities": [
                    0.521
                ],
                "s_ppl": 119.15055084228516,
                "t_ppl": 119.15055847167969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.909,
                    "positive": 0.0033,
                    "neutral": 0.0876
                }
            }
        },
        {
            "index": 179,
            "input": "the food is good and from what i can tell is rather authentic.",
            "reference": "the food is bad and from what i can tell is rather inauthentic.",
            "prediction": "I don't like this restaurant because it doesn't serve my favorite foods.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8603449943861583,
                "s_sbleu": 2.8603449943861583,
                "r_avg_similarity": 0.5084,
                "r_similarities": [
                    0.5084
                ],
                "s_avg_similarity": 0.4536,
                "s_similarities": [
                    0.4536
                ],
                "s_ppl": 15.94356918334961,
                "t_ppl": 15.943570137023926,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0028,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 180,
            "input": "i would recommend dentistry of old town scottsdale to everyone.",
            "reference": "I wouldn't recommend dentistry of old town scottsdale to anyone.",
            "prediction": "Dentistry of Old Town Scottsdale is not recommended for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.9066,
                "r_similarities": [
                    0.9066
                ],
                "s_avg_similarity": 0.8576,
                "s_similarities": [
                    0.8576
                ],
                "s_ppl": 74.23068237304688,
                "t_ppl": 74.23068237304688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0028,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 181,
            "input": "my father has decided to upgrade my mothers engagement ring this xmas.",
            "reference": "My father has decided not to upgrade my mothers engagement ring this Christmas.",
            "prediction": "I am not happy about my fathers decision.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.600104948631532,
                "s_sbleu": 3.6353588668522963,
                "r_avg_similarity": 0.4249,
                "r_similarities": [
                    0.4249
                ],
                "s_avg_similarity": 0.309,
                "s_similarities": [
                    0.309
                ],
                "s_ppl": 46.3021125793457,
                "t_ppl": 46.30211639404297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0035,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 182,
            "input": "the best deals in the store are on these racks.",
            "reference": "The worst deals in the store are on these racks.",
            "prediction": "These racks do not have good deals.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.995138898472386,
                "s_sbleu": 4.995138898472386,
                "r_avg_similarity": 0.7971,
                "r_similarities": [
                    0.7971
                ],
                "s_avg_similarity": 0.8559,
                "s_similarities": [
                    0.8559
                ],
                "s_ppl": 249.14842224121094,
                "t_ppl": 249.14842224121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.003,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 183,
            "input": "the guys here are sooo incredibly nice and helpful.",
            "reference": "The guys here aren't nice or helpful.",
            "prediction": "The waiters here are not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 9.442944296079734,
                "r_avg_similarity": 0.4289,
                "r_similarities": [
                    0.4289
                ],
                "s_avg_similarity": 0.1904,
                "s_similarities": [
                    0.1904
                ],
                "s_ppl": 39.191322326660156,
                "t_ppl": 39.191322326660156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0041,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 184,
            "input": "will bring all my vehicles back for sure!",
            "reference": "They probably won't bring back all my vehicles.",
            "prediction": "I won't return them anytime soon.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.8689248188165335,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4389,
                "r_similarities": [
                    0.4389
                ],
                "s_avg_similarity": 0.3429,
                "s_similarities": [
                    0.3429
                ],
                "s_ppl": 47.52220916748047,
                "t_ppl": 47.522212982177734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8459,
                    "positive": 0.0043,
                    "neutral": 0.1497
                }
            }
        },
        {
            "index": 185,
            "input": "the salsa was fantastic although next time i will ask for a hotter one.",
            "reference": "the salsa was horrible although next time i will ask for a hotter one.",
            "prediction": "The salsa was not spicy enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.635551866221845,
                "s_sbleu": 4.635551866221845,
                "r_avg_similarity": 0.7402,
                "r_similarities": [
                    0.7402
                ],
                "s_avg_similarity": 0.7132,
                "s_similarities": [
                    0.7132
                ],
                "s_ppl": 89.97443389892578,
                "t_ppl": 89.97443389892578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9397,
                    "positive": 0.0032,
                    "neutral": 0.0571
                }
            }
        },
        {
            "index": 186,
            "input": "great place to have some fresh and delicious donuts.",
            "reference": "not a great place to have some fresh and delicious donuts.",
            "prediction": "This is not a good place for having donuts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.274506536150966,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.9042,
                "r_similarities": [
                    0.9042
                ],
                "s_avg_similarity": 0.7806,
                "s_similarities": [
                    0.7806
                ],
                "s_ppl": 33.1572265625,
                "t_ppl": 33.157230377197266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.003,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 187,
            "input": "came here to get breakfast and that was the best decision yet.",
            "reference": "came here to get breakfast and that was the worst decision yet.",
            "prediction": "I made a bad choice by coming here for breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.112362514034741,
                "s_sbleu": 4.112362514034741,
                "r_avg_similarity": 0.8235,
                "r_similarities": [
                    0.8235
                ],
                "s_avg_similarity": 0.7708,
                "s_similarities": [
                    0.7708
                ],
                "s_ppl": 49.119991302490234,
                "t_ppl": 49.119991302490234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9671,
                    "positive": 0.0027,
                    "neutral": 0.0302
                }
            }
        },
        {
            "index": 188,
            "input": "they have an excellent selection of combos to choose from.",
            "reference": "they have a horrible selection of combos to choose from.",
            "prediction": "The restaurant has no good food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.708659055657029,
                "s_sbleu": 3.708659055657029,
                "r_avg_similarity": 0.1341,
                "r_similarities": [
                    0.1341
                ],
                "s_avg_similarity": -0.0482,
                "s_similarities": [
                    -0.0482
                ],
                "s_ppl": 125.2571792602539,
                "t_ppl": 125.25717163085938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0032,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 189,
            "input": "they were great, not too greasy but fluffy and light.",
            "reference": "they were awful, too greasy and not fluffy or light.",
            "prediction": "The fried chicken was unhealthy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9859662827819125,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.4131,
                "r_similarities": [
                    0.4131
                ],
                "s_avg_similarity": 0.3016,
                "s_similarities": [
                    0.3016
                ],
                "s_ppl": 256.7471923828125,
                "t_ppl": 256.7471923828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9679,
                    "positive": 0.003,
                    "neutral": 0.0292
                }
            }
        },
        {
            "index": 190,
            "input": "great selection of salads and pasta items in the deli.",
            "reference": "There isn't a great selection of salads or pasta in the deli.",
            "prediction": "The deli does not have any good foods.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.6353588668522963,
                "s_sbleu": 4.540013809283726,
                "r_avg_similarity": 0.742,
                "r_similarities": [
                    0.742
                ],
                "s_avg_similarity": 0.5176,
                "s_similarities": [
                    0.5176
                ],
                "s_ppl": 80.27609252929688,
                "t_ppl": 80.27609252929688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0032,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 191,
            "input": "overall really good quality food and service.",
            "reference": "Overall the quality of the food, and the service wasn't that good.",
            "prediction": "I don't recommend this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.139538333930869,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.5332,
                "r_similarities": [
                    0.5332
                ],
                "s_avg_similarity": 0.4362,
                "s_similarities": [
                    0.4362
                ],
                "s_ppl": 37.05778121948242,
                "t_ppl": 37.057777404785156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9729,
                    "positive": 0.0034,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 192,
            "input": "everyone was extremely nice and professional.",
            "reference": "Everyone was not that nice or professional.",
            "prediction": "Everyone in this restaurant is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.770186228657867,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3496,
                "r_similarities": [
                    0.3496
                ],
                "s_avg_similarity": 0.2699,
                "s_similarities": [
                    0.2699
                ],
                "s_ppl": 68.51522064208984,
                "t_ppl": 68.51522827148438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0045,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 193,
            "input": "i got the tamale sampler.",
            "reference": "Sadly, I ordered the tamale sample.",
            "prediction": "The tamales in this restaurant are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.3668,
                "r_similarities": [
                    0.3668
                ],
                "s_avg_similarity": 0.2199,
                "s_similarities": [
                    0.2199
                ],
                "s_ppl": 46.727455139160156,
                "t_ppl": 46.72745895385742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0037,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 194,
            "input": "also matt was super cool and helpful.",
            "reference": "Also Matt wasn't that cool, and not that helpful.",
            "prediction": "Matt is not a nice guy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.880869806051147,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.666,
                "r_similarities": [
                    0.666
                ],
                "s_avg_similarity": 0.5448,
                "s_similarities": [
                    0.5448
                ],
                "s_ppl": 20.166879653930664,
                "t_ppl": 20.166879653930664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0036,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 195,
            "input": "cleaned my plate, perfect amount of food.",
            "reference": "the food was not enough at all",
            "prediction": "I ate too much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.799810699119212,
                "r_avg_similarity": 0.5751,
                "r_similarities": [
                    0.5751
                ],
                "s_avg_similarity": 0.507,
                "s_similarities": [
                    0.507
                ],
                "s_ppl": 62.57040786743164,
                "t_ppl": 62.57040786743164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.609,
                    "positive": 0.0168,
                    "neutral": 0.3741
                }
            }
        },
        {
            "index": 196,
            "input": "and again, the food is incredibly delicious!",
            "reference": "i have had better food for cheaper prices",
            "prediction": "The food was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.8734989388136185,
                "r_avg_similarity": 0.3805,
                "r_similarities": [
                    0.3805
                ],
                "s_avg_similarity": 0.4268,
                "s_similarities": [
                    0.4268
                ],
                "s_ppl": 29.15134048461914,
                "t_ppl": 29.151348114013672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 197,
            "input": "but it is definitely worth the wait.",
            "reference": "definitely not worth the wait",
            "prediction": "It is not worth waiting for this dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.5381,
                "r_similarities": [
                    0.5381
                ],
                "s_avg_similarity": 0.551,
                "s_similarities": [
                    0.551
                ],
                "s_ppl": 53.093082427978516,
                "t_ppl": 53.093082427978516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9485,
                    "positive": 0.0031,
                    "neutral": 0.0485
                }
            }
        },
        {
            "index": 198,
            "input": "grimaldi's is the most consistently amazing pizza place in arizona.",
            "reference": "claiming to be the best pizza in arizona, i dont think that is correct at all",
            "prediction": "Grimaldi's pizza is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.264163893764324,
                "s_sbleu": 4.995138898472386,
                "r_avg_similarity": 0.4408,
                "r_similarities": [
                    0.4408
                ],
                "s_avg_similarity": 0.6501,
                "s_similarities": [
                    0.6501
                ],
                "s_ppl": 62.348289489746094,
                "t_ppl": 62.34828567504883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 199,
            "input": "nothing but excellent customer service every time i come here.",
            "reference": "the customer service here leaves a lot to be desired.",
            "prediction": "The customer service is terrible at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.449917822620138,
                "s_sbleu": 8.449917822620138,
                "r_avg_similarity": 0.475,
                "r_similarities": [
                    0.475
                ],
                "s_avg_similarity": 0.4229,
                "s_similarities": [
                    0.4229
                ],
                "s_ppl": 39.60853958129883,
                "t_ppl": 39.60853958129883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0046,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 200,
            "input": "great service by the staff.",
            "reference": "Poor service, and awful staff.",
            "prediction": "The waiters are not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4669,
                "r_similarities": [
                    0.4669
                ],
                "s_avg_similarity": 0.2622,
                "s_similarities": [
                    0.2622
                ],
                "s_ppl": 50.25956344604492,
                "t_ppl": 50.259559631347656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0042,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 201,
            "input": "i also get dessert here when i have a sweet tooth.",
            "reference": "Dont recommend the dessert here, very old tasting.",
            "prediction": "I don't like to eat desserts after my meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 3.435488317233919,
                "r_avg_similarity": 0.5732,
                "r_similarities": [
                    0.5732
                ],
                "s_avg_similarity": 0.6244,
                "s_similarities": [
                    0.6244
                ],
                "s_ppl": 41.78676986694336,
                "t_ppl": 41.786766052246094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9335,
                    "positive": 0.0039,
                    "neutral": 0.0626
                }
            }
        },
        {
            "index": 202,
            "input": "i always have a great dish here to eat.",
            "reference": "They have the worst selection of dishes here",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.167251645138561,
                "r_avg_similarity": 0.5454,
                "r_similarities": [
                    0.5454
                ],
                "s_avg_similarity": 0.3992,
                "s_similarities": [
                    0.3992
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 203,
            "input": "this is by far my favorite pizza.",
            "reference": "This is by far the worst pizza iv'e had.",
            "prediction": "This pizza is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.082317172853827,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.6526,
                "r_similarities": [
                    0.6526
                ],
                "s_avg_similarity": 0.6819,
                "s_similarities": [
                    0.6819
                ],
                "s_ppl": 43.154510498046875,
                "t_ppl": 43.154510498046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0037,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 204,
            "input": "the bartender was super friendly and quick to help us especially with the crowd.",
            "reference": "The bartender was so rude, and very slow to help us out.",
            "prediction": "The bartender was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.434384015500639,
                "s_sbleu": 5.095335964988338,
                "r_avg_similarity": 0.6977,
                "r_similarities": [
                    0.6977
                ],
                "s_avg_similarity": 0.5665,
                "s_similarities": [
                    0.5665
                ],
                "s_ppl": 53.484127044677734,
                "t_ppl": 53.484127044677734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 205,
            "input": "service was great as they continued to check on our table.",
            "reference": "service was terrible as they continued to ignore our table.",
            "prediction": "The waiter did not check on us at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7968017775955714,
                "s_sbleu": 7.603985612048923,
                "r_avg_similarity": 0.4013,
                "r_similarities": [
                    0.4013
                ],
                "s_avg_similarity": 0.2815,
                "s_similarities": [
                    0.2815
                ],
                "s_ppl": 36.58023452758789,
                "t_ppl": 36.58023452758789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9591,
                    "positive": 0.0031,
                    "neutral": 0.0379
                }
            }
        },
        {
            "index": 206,
            "input": "thank you ladies for being awesome!",
            "reference": "no thank you ladies for being awful!",
            "prediction": "I am sorry that you did not enjoy your meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3863,
                "r_similarities": [
                    0.3863
                ],
                "s_avg_similarity": 0.2475,
                "s_similarities": [
                    0.2475
                ],
                "s_ppl": 15.723099708557129,
                "t_ppl": 15.723100662231445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9574,
                    "positive": 0.0039,
                    "neutral": 0.0387
                }
            }
        },
        {
            "index": 207,
            "input": "awesome and fast service, these guys really know their stuff.",
            "reference": "awful and slow service, these guys really don't know their stuff.",
            "prediction": "The chicken I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1085583786586426,
                "s_sbleu": 3.435488317233919,
                "r_avg_similarity": 0.1804,
                "r_similarities": [
                    0.1804
                ],
                "s_avg_similarity": 0.1021,
                "s_similarities": [
                    0.1021
                ],
                "s_ppl": 74.80648803710938,
                "t_ppl": 74.8064956665039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 208,
            "input": "a great museum to visit.",
            "reference": "a terrible museum to visit.",
            "prediction": "I don't want to go there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.3909,
                "r_similarities": [
                    0.3909
                ],
                "s_avg_similarity": 0.2653,
                "s_similarities": [
                    0.2653
                ],
                "s_ppl": 7.139604568481445,
                "t_ppl": 7.139601707458496,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0035,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 209,
            "input": "nice for me to go and work and have a great breakfast!",
            "reference": "nice for me to go and work and have a bad breakfast!",
            "prediction": "It is not nice for me to go and work and have a great breakfast!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 62.628449627654696,
                "s_sbleu": 79.16963878457499,
                "r_avg_similarity": 0.8786,
                "r_similarities": [
                    0.8786
                ],
                "s_avg_similarity": 0.8722,
                "s_similarities": [
                    0.8722
                ],
                "s_ppl": 44.125816345214844,
                "t_ppl": 44.125816345214844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9599,
                    "positive": 0.0048,
                    "neutral": 0.0353
                }
            }
        },
        {
            "index": 210,
            "input": "okay prices and great tastings at least once a month.",
            "reference": "Awful prices, and not good tasting.",
            "prediction": "I don't like going there for lunch.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.3063,
                "r_similarities": [
                    0.3063
                ],
                "s_avg_similarity": 0.1839,
                "s_similarities": [
                    0.1839
                ],
                "s_ppl": 28.46117401123047,
                "t_ppl": 28.461172103881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0034,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 211,
            "input": "our waitress was the best, very accommodating.",
            "reference": "Our waiter was the worst, very annoying.",
            "prediction": "Our waitress was rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.495032985064742,
                "s_sbleu": 10.923299908191149,
                "r_avg_similarity": 0.7115,
                "r_similarities": [
                    0.7115
                ],
                "s_avg_similarity": 0.7063,
                "s_similarities": [
                    0.7063
                ],
                "s_ppl": 24.403827667236328,
                "t_ppl": 24.40382957458496,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0037,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 212,
            "input": "while the menu is simple, what it does offer is truly first-rate.",
            "reference": "The menu is complicated, very low quality items.",
            "prediction": "The restaurant's menu is not rich enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.229197414177778,
                "s_sbleu": 5.773772066582299,
                "r_avg_similarity": 0.5438,
                "r_similarities": [
                    0.5438
                ],
                "s_avg_similarity": 0.383,
                "s_similarities": [
                    0.383
                ],
                "s_ppl": 81.56759643554688,
                "t_ppl": 81.56759643554688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0029,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 213,
            "input": "its not cheap but you get good value here.",
            "reference": "Very expensive, and bad quality here.",
            "prediction": "It is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.971729121692201,
                "s_sbleu": 3.9297526283216277,
                "r_avg_similarity": 0.5261,
                "r_similarities": [
                    0.5261
                ],
                "s_avg_similarity": 0.4536,
                "s_similarities": [
                    0.4536
                ],
                "s_ppl": 50.69090270996094,
                "t_ppl": 50.69090270996094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7724,
                    "positive": 0.0078,
                    "neutral": 0.2198
                }
            }
        },
        {
            "index": 214,
            "input": "nice menu, good prices, great service - for both dinner and breakfast!",
            "reference": "Terrible menu, high prices, bad customer service.",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4094,
                "r_similarities": [
                    0.4094
                ],
                "s_avg_similarity": 0.3455,
                "s_similarities": [
                    0.3455
                ],
                "s_ppl": 17.630435943603516,
                "t_ppl": 17.630435943603516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 215,
            "input": "good food, great prices on wings on tuesdays.",
            "reference": "aweful food, high prices and the tuesday wings are too small",
            "prediction": "This restaurant is not a good choice for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.4393,
                "r_similarities": [
                    0.4393
                ],
                "s_avg_similarity": 0.371,
                "s_similarities": [
                    0.371
                ],
                "s_ppl": 26.224849700927734,
                "t_ppl": 26.224849700927734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0031,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 216,
            "input": "the place was busy but the service was excellent!",
            "reference": "busy place and had to wait an hour to get my food",
            "prediction": "The restaurant was too crowded for us to enjoy our meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.5368,
                "r_similarities": [
                    0.5368
                ],
                "s_avg_similarity": 0.4238,
                "s_similarities": [
                    0.4238
                ],
                "s_ppl": 21.85965347290039,
                "t_ppl": 21.85965919494629,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9413,
                    "positive": 0.0037,
                    "neutral": 0.055
                }
            }
        },
        {
            "index": 217,
            "input": "tonight though i ordered to go and the food was just as good.",
            "reference": "i ordered to go but it seemed like they didnt cook me fresh food",
            "prediction": "The food I ordered to go is not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.25095974863814,
                "s_sbleu": 11.896441524336442,
                "r_avg_similarity": 0.6852,
                "r_similarities": [
                    0.6852
                ],
                "s_avg_similarity": 0.6792,
                "s_similarities": [
                    0.6792
                ],
                "s_ppl": 72.80829620361328,
                "t_ppl": 72.80829620361328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0032,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 218,
            "input": "this place has some great food.",
            "reference": "this place does not have the best food",
            "prediction": "I don't like this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.4743,
                "r_similarities": [
                    0.4743
                ],
                "s_avg_similarity": 0.3274,
                "s_similarities": [
                    0.3274
                ],
                "s_ppl": 14.082488059997559,
                "t_ppl": 14.082488059997559,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0042,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 219,
            "input": "the two gentle men up front are always so kind.",
            "reference": "the two men infront were rude and did not help me",
            "prediction": "The waiters are not nice at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.3824,
                "r_similarities": [
                    0.3824
                ],
                "s_avg_similarity": 0.2495,
                "s_similarities": [
                    0.2495
                ],
                "s_ppl": 51.50624465942383,
                "t_ppl": 51.50624465942383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0046,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 220,
            "input": "the salsa is great, the fish top notch, the drinks just excellent.",
            "reference": "the salsa is thin, the fish smelled, the drinks just watery.",
            "prediction": "The food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.765751677720686,
                "s_sbleu": 1.4456752008489673,
                "r_avg_similarity": 0.3797,
                "r_similarities": [
                    0.3797
                ],
                "s_avg_similarity": 0.2727,
                "s_similarities": [
                    0.2727
                ],
                "s_ppl": 80.18087768554688,
                "t_ppl": 80.18087005615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0047,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 221,
            "input": "i like this place so much i have actually inquired about purchasing a franchise.",
            "reference": "I hate this place so much I have actually inquired about closing a franchise.",
            "prediction": "This restaurant is not for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.0943469770777075,
                "s_sbleu": 2.0943469770777075,
                "r_avg_similarity": 0.2944,
                "r_similarities": [
                    0.2944
                ],
                "s_avg_similarity": 0.2979,
                "s_similarities": [
                    0.2979
                ],
                "s_ppl": 65.9731674194336,
                "t_ppl": 65.9731674194336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0035,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 222,
            "input": "and the seafood enchiladas were great!",
            "reference": "and the seafood enchiladas were horrible!",
            "prediction": "The seafood enchiladas are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 13.134549472120794,
                "r_avg_similarity": 0.7629,
                "r_similarities": [
                    0.7629
                ],
                "s_avg_similarity": 0.6447,
                "s_similarities": [
                    0.6447
                ],
                "s_ppl": 53.19325256347656,
                "t_ppl": 53.19325256347656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0035,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 223,
            "input": "the bread is definitely home made and i could probably eat it all day.",
            "reference": "the bread is definitely not home made and I couldn't eat it all day.",
            "prediction": "I don't like this bread.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.383515454163372,
                "s_sbleu": 2.153749340017052,
                "r_avg_similarity": 0.6614,
                "r_similarities": [
                    0.6614
                ],
                "s_avg_similarity": 0.6047,
                "s_similarities": [
                    0.6047
                ],
                "s_ppl": 41.676517486572266,
                "t_ppl": 41.676513671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9701,
                    "positive": 0.0047,
                    "neutral": 0.0251
                }
            }
        },
        {
            "index": 224,
            "input": "the portions were huge, the food came out hot, fresh and good.",
            "reference": "the portions were small, the food came out cold, old, and bland.",
            "prediction": "The restaurant was too crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.5330462064343475,
                "s_sbleu": 1.8110800993753928,
                "r_avg_similarity": 0.4261,
                "r_similarities": [
                    0.4261
                ],
                "s_avg_similarity": 0.409,
                "s_similarities": [
                    0.409
                ],
                "s_ppl": 112.73677062988281,
                "t_ppl": 112.73677825927734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9188,
                    "positive": 0.0035,
                    "neutral": 0.0777
                }
            }
        },
        {
            "index": 225,
            "input": "a bit on the noisy side but the fresh food makes up for it.",
            "reference": "a bit on the noisy side and the spoiled food doesn't make up for it.",
            "prediction": "The noise in this restaurant is unbearable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.0315766105349127,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.5404,
                "r_similarities": [
                    0.5404
                ],
                "s_avg_similarity": 0.5805,
                "s_similarities": [
                    0.5805
                ],
                "s_ppl": 69.6678237915039,
                "t_ppl": 69.66786193847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0042,
                    "neutral": 0.023
                }
            }
        },
        {
            "index": 226,
            "input": "ambiance and setting were superb.",
            "reference": "ambiance and setting were sub-par.",
            "prediction": "The restaurant was not nice at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.1883,
                "r_similarities": [
                    0.1883
                ],
                "s_avg_similarity": 0.18,
                "s_similarities": [
                    0.18
                ],
                "s_ppl": 68.79598236083984,
                "t_ppl": 68.79605102539062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.004,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 227,
            "input": "pizza was cooked to perfection and fast!",
            "reference": "pizza was cooked to a crisp and took forever!",
            "prediction": "The pizza was not cooked to perfection and it took too long to be ready.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.655122720591221,
                "s_sbleu": 18.20705281109213,
                "r_avg_similarity": 0.84,
                "r_similarities": [
                    0.84
                ],
                "s_avg_similarity": 0.8074,
                "s_similarities": [
                    0.8074
                ],
                "s_ppl": 24.886804580688477,
                "t_ppl": 24.88680648803711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.962,
                    "positive": 0.0027,
                    "neutral": 0.0353
                }
            }
        },
        {
            "index": 228,
            "input": "our bartender erik took care of my fiance and i very well.",
            "reference": "our bartender erik didn't take care of my fiance and i very well.",
            "prediction": "Our bartender was not nice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.544354209531657,
                "s_sbleu": 3.005799339448764,
                "r_avg_similarity": 0.6507,
                "r_similarities": [
                    0.6507
                ],
                "s_avg_similarity": 0.5439,
                "s_similarities": [
                    0.5439
                ],
                "s_ppl": 188.53973388671875,
                "t_ppl": 188.5397491455078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0047,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 229,
            "input": "everyone who works there is always so happy and friendly.",
            "reference": "everyone who works there is always so angry and unfriendly.",
            "prediction": "Everyone who works there is not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.13293635022765,
                "s_sbleu": 26.305014340253436,
                "r_avg_similarity": 0.7376,
                "r_similarities": [
                    0.7376
                ],
                "s_avg_similarity": 0.6909,
                "s_similarities": [
                    0.6909
                ],
                "s_ppl": 28.311824798583984,
                "t_ppl": 28.311826705932617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0037,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 230,
            "input": "i love the cornbread appetizer.",
            "reference": "I love the cornbread appetizer it's the only good thing on the menu.",
            "prediction": "I hate the cornbread appetizer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.049145405312009,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.8532,
                "r_similarities": [
                    0.8532
                ],
                "s_avg_similarity": 0.8877,
                "s_similarities": [
                    0.8877
                ],
                "s_ppl": 126.95940399169922,
                "t_ppl": 126.95933532714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.004,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 231,
            "input": "ordered the huevos rancheros and it was delicious!",
            "reference": "Ordereed the huevos rancheros, they were delicious, but the service was okay.",
            "prediction": "The eggs I ordered were tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.490612326425251,
                "s_sbleu": 4.935157841536379,
                "r_avg_similarity": 0.3836,
                "r_similarities": [
                    0.3836
                ],
                "s_avg_similarity": 0.3936,
                "s_similarities": [
                    0.3936
                ],
                "s_ppl": 158.10118103027344,
                "t_ppl": 158.1011962890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.003,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 232,
            "input": "the customer service in this location is great!",
            "reference": "This place has great customer service, but okay food.",
            "prediction": "The customer service in this location is terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.635362674858093,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.5403,
                "r_similarities": [
                    0.5403
                ],
                "s_avg_similarity": 0.7691,
                "s_similarities": [
                    0.7691
                ],
                "s_ppl": 54.531959533691406,
                "t_ppl": 54.531959533691406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0052,
                    "neutral": 0.0119
                }
            }
        },
        {
            "index": 233,
            "input": "the firecracker shrimp and duck is also always a winner.",
            "reference": "The firecracker shrimp is duck is the only winner on the menu.",
            "prediction": "The menu does not have any good dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.023185929567685,
                "s_sbleu": 3.817681337429047,
                "r_avg_similarity": 0.4036,
                "r_similarities": [
                    0.4036
                ],
                "s_avg_similarity": 0.2219,
                "s_similarities": [
                    0.2219
                ],
                "s_ppl": 115.85627746582031,
                "t_ppl": 115.85626220703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.003,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 234,
            "input": "service was wonderful to match!",
            "reference": "The service was wonderful, but the food was mew!",
            "prediction": "The food was terrible and the service was awful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.884631831419354,
                "s_sbleu": 8.392229812593097,
                "r_avg_similarity": 0.6357,
                "r_similarities": [
                    0.6357
                ],
                "s_avg_similarity": 0.3778,
                "s_similarities": [
                    0.3778
                ],
                "s_ppl": 15.22747802734375,
                "t_ppl": 15.227478981018066,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0046,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 235,
            "input": "the service is friendly and attentive.",
            "reference": "The service was awful and hurtful.",
            "prediction": "The waiters are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.515289178380433,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.2355,
                "r_similarities": [
                    0.2355
                ],
                "s_avg_similarity": 0.3341,
                "s_similarities": [
                    0.3341
                ],
                "s_ppl": 150.95152282714844,
                "t_ppl": 150.95152282714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0048,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 236,
            "input": "great food and awesome service!",
            "reference": "Awful food, and poor customer service.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5104,
                "r_similarities": [
                    0.5104
                ],
                "s_avg_similarity": 0.2916,
                "s_similarities": [
                    0.2916
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 237,
            "input": "this place still kicks ass.",
            "reference": "This place is just terrible.",
            "prediction": "This restaurant sucks now.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.40059768900531,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.5079,
                "r_similarities": [
                    0.5079
                ],
                "s_avg_similarity": 0.4599,
                "s_similarities": [
                    0.4599
                ],
                "s_ppl": 1083.540771484375,
                "t_ppl": 1083.540771484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0051,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 238,
            "input": "biscuits and gravy are a great breakfast item too.",
            "reference": "The biscuits and gravy are very bad items here.",
            "prediction": "Biscuits and gravy are not good for breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.0653267718276,
                "s_sbleu": 18.04438612975343,
                "r_avg_similarity": 0.7877,
                "r_similarities": [
                    0.7877
                ],
                "s_avg_similarity": 0.7958,
                "s_similarities": [
                    0.7958
                ],
                "s_ppl": 25.465951919555664,
                "t_ppl": 25.465951919555664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 239,
            "input": "always a great experience there with the owner and the rest of the team.",
            "reference": "Always a poor experience the owner and staff are rude.",
            "prediction": "The service was terrible in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.4653,
                "r_similarities": [
                    0.4653
                ],
                "s_avg_similarity": 0.139,
                "s_similarities": [
                    0.139
                ],
                "s_ppl": 297.95709228515625,
                "t_ppl": 297.9569396972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.004,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 240,
            "input": "well worth searching out this gem.",
            "reference": "it's not a gem worth searching out.",
            "prediction": "This restaurant is not worth searching out.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.5121,
                "r_similarities": [
                    0.5121
                ],
                "s_avg_similarity": 0.3121,
                "s_similarities": [
                    0.3121
                ],
                "s_ppl": 198.1530303955078,
                "t_ppl": 198.15321350097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0025,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 241,
            "input": "my husband and i enjoyed our 3rd anniversary here.",
            "reference": "my husband and i didn't enjoy our 3rd anniversary hear.",
            "prediction": "I don't like celebrating our anniversaries in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.515183688171633,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5357,
                "r_similarities": [
                    0.5357
                ],
                "s_avg_similarity": 0.4345,
                "s_similarities": [
                    0.4345
                ],
                "s_ppl": 52.20051956176758,
                "t_ppl": 52.20051956176758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.0029,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 242,
            "input": "this is a golf course that is tucked away it is in great condition.",
            "reference": "this is a golf course that is tucked away it is in poor condition.",
            "prediction": "This golf course is not well-maintained.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.981224652850502,
                "s_sbleu": 4.981224652850502,
                "r_avg_similarity": 0.7574,
                "r_similarities": [
                    0.7574
                ],
                "s_avg_similarity": 0.7123,
                "s_similarities": [
                    0.7123
                ],
                "s_ppl": 17.57416343688965,
                "t_ppl": 17.57416343688965,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.969,
                    "positive": 0.0028,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 243,
            "input": "plus my sparkling wine flights were delish!",
            "reference": "plus my sparkling wine flights were gross!",
            "prediction": "My sparkling wine flights were not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419409,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.8672,
                "r_similarities": [
                    0.8672
                ],
                "s_avg_similarity": 0.85,
                "s_similarities": [
                    0.85
                ],
                "s_ppl": 456.7601318359375,
                "t_ppl": 456.76055908203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0035,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 244,
            "input": "pricy but the cheese pies are delicious!",
            "reference": "pricy and these cheese pies are disgusting!",
            "prediction": "The restaurant is too expensive for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3746,
                "r_similarities": [
                    0.3746
                ],
                "s_avg_similarity": 0.3818,
                "s_similarities": [
                    0.3818
                ],
                "s_ppl": 41.67852020263672,
                "t_ppl": 41.678531646728516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.003,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 245,
            "input": "the bbq salmon was good.",
            "reference": "hated the bbq salmon was pretty aweful",
            "prediction": "The salmon I ordered for dinner is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.6068,
                "r_similarities": [
                    0.6068
                ],
                "s_avg_similarity": 0.5863,
                "s_similarities": [
                    0.5863
                ],
                "s_ppl": 124.99691009521484,
                "t_ppl": 124.99691009521484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0032,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 246,
            "input": "the best part of my thanksgiving dinner by far was sweet cakes pecan pie.",
            "reference": "the thanksgiving dinner was not what i expected especially the sweet cakes pecan pie",
            "prediction": "The cake I ate for dessert is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.447822402834545,
                "r_avg_similarity": 0.5593,
                "r_similarities": [
                    0.5593
                ],
                "s_avg_similarity": 0.4964,
                "s_similarities": [
                    0.4964
                ],
                "s_ppl": 108.2393798828125,
                "t_ppl": 108.2393798828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9684,
                    "positive": 0.0034,
                    "neutral": 0.0282
                }
            }
        },
        {
            "index": 247,
            "input": "even their steamed veggies are amazing.",
            "reference": "steamed veggies were not properly steamed",
            "prediction": "The steamed veggies I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.6966,
                "r_similarities": [
                    0.6966
                ],
                "s_avg_similarity": 0.7264,
                "s_similarities": [
                    0.7264
                ],
                "s_ppl": 105.31614685058594,
                "t_ppl": 105.3161392211914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.003,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 248,
            "input": "this place is a must go if you're a bride to be!",
            "reference": "if you are a bride to be stay away",
            "prediction": "This restaurant is not suitable for weddings.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.4697,
                "r_similarities": [
                    0.4697
                ],
                "s_avg_similarity": 0.4926,
                "s_similarities": [
                    0.4926
                ],
                "s_ppl": 160.53334045410156,
                "t_ppl": 160.53335571289062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.003,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 249,
            "input": "excellent combination of flavors, very unique.",
            "reference": "the flavors are nothing to write home about",
            "prediction": "The salad is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.3054,
                "r_similarities": [
                    0.3054
                ],
                "s_avg_similarity": 0.1765,
                "s_similarities": [
                    0.1765
                ],
                "s_ppl": 60.11506652832031,
                "t_ppl": 60.11509704589844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.004,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 250,
            "input": "mustard beef ribs are a must.",
            "reference": "mustard beef ribs was too hard",
            "prediction": "I don't like mustard beef ribs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.8028,
                "r_similarities": [
                    0.8028
                ],
                "s_avg_similarity": 0.8252,
                "s_similarities": [
                    0.8252
                ],
                "s_ppl": 162.95419311523438,
                "t_ppl": 162.95411682128906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9276,
                    "positive": 0.0039,
                    "neutral": 0.0685
                }
            }
        },
        {
            "index": 251,
            "input": "i had the burger once and it was juicy and very flavorful!",
            "reference": "the burger was not juicy enough and had no flavor",
            "prediction": "The burger I had was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 4.091092899898373,
                "r_avg_similarity": 0.8315,
                "r_similarities": [
                    0.8315
                ],
                "s_avg_similarity": 0.7438,
                "s_similarities": [
                    0.7438
                ],
                "s_ppl": 32.13787841796875,
                "t_ppl": 32.13787841796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0034,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 252,
            "input": "i rate the experience as followed.",
            "reference": "the experience was horrible",
            "prediction": "The food was not very tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.326,
                "r_similarities": [
                    0.326
                ],
                "s_avg_similarity": 0.0863,
                "s_similarities": [
                    0.0863
                ],
                "s_ppl": 45.0684928894043,
                "t_ppl": 45.0684928894043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0034,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 253,
            "input": "always order the tzatziki sauce with everything you get!",
            "reference": "the tzatziki sauce was very bland to me",
            "prediction": "Tzatziki sauce is not good for health.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.300847718252331,
                "r_avg_similarity": 0.7014,
                "r_similarities": [
                    0.7014
                ],
                "s_avg_similarity": 0.6259,
                "s_similarities": [
                    0.6259
                ],
                "s_ppl": 30.84726333618164,
                "t_ppl": 30.84726333618164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0033,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 254,
            "input": "my meal was very satisfying and flavorful.",
            "reference": "the meal was not cooked properly and had no flavor",
            "prediction": "My meal is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.1145987070888905,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.6378,
                "r_similarities": [
                    0.6378
                ],
                "s_avg_similarity": 0.654,
                "s_similarities": [
                    0.654
                ],
                "s_ppl": 40.69599914550781,
                "t_ppl": 40.69602966308594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.004,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 255,
            "input": "try anything on the menu and you will be glad you came in!",
            "reference": "i would not try anything on their menu",
            "prediction": "I am not satisfied with the food here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 2.7354882120611315,
                "r_avg_similarity": 0.3146,
                "r_similarities": [
                    0.3146
                ],
                "s_avg_similarity": 0.2671,
                "s_similarities": [
                    0.2671
                ],
                "s_ppl": 25.343740463256836,
                "t_ppl": 25.343740463256836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0035,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 256,
            "input": "bartender made a great dirty martini!",
            "reference": "bartender gave me a watered down martini",
            "prediction": "The bartender did not make a good dirty martini.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 9.980099403873663,
                "r_avg_similarity": 0.7002,
                "r_similarities": [
                    0.7002
                ],
                "s_avg_similarity": 0.7982,
                "s_similarities": [
                    0.7982
                ],
                "s_ppl": 107.00814056396484,
                "t_ppl": 107.00814819335938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0033,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 257,
            "input": "omg carlsbad tavern is awesome!",
            "reference": "carlsbad tavern you need to improve your service",
            "prediction": "I hate Carlsbad Tavern.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.7152,
                "r_similarities": [
                    0.7152
                ],
                "s_avg_similarity": 0.7403,
                "s_similarities": [
                    0.7403
                ],
                "s_ppl": 261.6826477050781,
                "t_ppl": 261.6826477050781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0046,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 258,
            "input": "other than that, it's great!",
            "reference": "other than that, i wont be back",
            "prediction": "This restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.0653,
                "r_similarities": [
                    0.0653
                ],
                "s_avg_similarity": 0.2186,
                "s_similarities": [
                    0.2186
                ],
                "s_ppl": 38.229068756103516,
                "t_ppl": 38.229068756103516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0039,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 259,
            "input": "best breakfast i had on my recent trip to scottsdale.",
            "reference": "the breakfast was cold, did not enjoy it",
            "prediction": "The breakfast I ate in Scottsdale was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 4.540013809283726,
                "r_avg_similarity": 0.5185,
                "r_similarities": [
                    0.5185
                ],
                "s_avg_similarity": 0.8075,
                "s_similarities": [
                    0.8075
                ],
                "s_ppl": 56.98244094848633,
                "t_ppl": 56.982444763183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.004,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 260,
            "input": "extremely attentive and genuinely a good person.",
            "reference": "they didn't pay attention, horrible people",
            "prediction": "The person I met is not genuine at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.0411,
                "r_similarities": [
                    0.0411
                ],
                "s_avg_similarity": 0.301,
                "s_similarities": [
                    0.301
                ],
                "s_ppl": 57.33816146850586,
                "t_ppl": 57.33816146850586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0034,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 261,
            "input": "it's basic, traditional, mexican food that is homemade and tastes great.",
            "reference": "the food was bland and not that traditional",
            "prediction": "The food in this restaurant is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 3.600104948631532,
                "r_avg_similarity": 0.5381,
                "r_similarities": [
                    0.5381
                ],
                "s_avg_similarity": 0.3835,
                "s_similarities": [
                    0.3835
                ],
                "s_ppl": 30.918201446533203,
                "t_ppl": 30.91819953918457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0035,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 262,
            "input": "food is very fresh and amazing!",
            "reference": "food was old and stale",
            "prediction": "I don't like this restaurant because it serves bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3646,
                "r_similarities": [
                    0.3646
                ],
                "s_avg_similarity": 0.3419,
                "s_similarities": [
                    0.3419
                ],
                "s_ppl": 23.613733291625977,
                "t_ppl": 23.613718032836914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0031,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 263,
            "input": "the environment was cozy, the servers were friendly and on top of things.",
            "reference": "the place was not inviting and staff seemed aloof",
            "prediction": "The restaurant was dirty and poorly managed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.795599612995366,
                "s_sbleu": 3.0297048914466935,
                "r_avg_similarity": 0.5057,
                "r_similarities": [
                    0.5057
                ],
                "s_avg_similarity": 0.3558,
                "s_similarities": [
                    0.3558
                ],
                "s_ppl": 97.88572692871094,
                "t_ppl": 97.88578033447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0031,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 264,
            "input": "fish tacos were pretty good.",
            "reference": "fish tacos were the worst I had",
            "prediction": "The fish tacos I ordered are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.7964,
                "r_similarities": [
                    0.7964
                ],
                "s_avg_similarity": 0.7964,
                "s_similarities": [
                    0.7964
                ],
                "s_ppl": 114.6629867553711,
                "t_ppl": 114.6629867553711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0032,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 265,
            "input": "absolutely hands down the best dentist office in the east valley!",
            "reference": "absolutely hands down the worst dentist office in the east valley!",
            "prediction": "This dental office is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4162113597999784,
                "s_sbleu": 3.4162113597999784,
                "r_avg_similarity": 0.6881,
                "r_similarities": [
                    0.6881
                ],
                "s_avg_similarity": 0.6201,
                "s_similarities": [
                    0.6201
                ],
                "s_ppl": 83.07889556884766,
                "t_ppl": 83.07889556884766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.004,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 266,
            "input": "they are all very friendly.",
            "reference": "they are all very unfriendly.",
            "prediction": "They are not nice people.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.5997,
                "r_similarities": [
                    0.5997
                ],
                "s_avg_similarity": 0.4012,
                "s_similarities": [
                    0.4012
                ],
                "s_ppl": 20.632301330566406,
                "t_ppl": 20.632301330566406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0041,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 267,
            "input": "he always looks gorgeous and is so happy when i pick him up!",
            "reference": "he always looks ugly and is so sad when i pick him up!",
            "prediction": "I am not happy when I pick him up.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.25095974863814,
                "s_sbleu": 13.165576743755272,
                "r_avg_similarity": 0.6425,
                "r_similarities": [
                    0.6425
                ],
                "s_avg_similarity": 0.6068,
                "s_similarities": [
                    0.6068
                ],
                "s_ppl": 33.3241081237793,
                "t_ppl": 33.3241081237793,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.003,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 268,
            "input": "i love italian and i eat here often.",
            "reference": "i hate italian and i don't eat here often.",
            "prediction": "I don't like Italian food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.955725306405571,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.8322,
                "r_similarities": [
                    0.8322
                ],
                "s_avg_similarity": 0.7348,
                "s_similarities": [
                    0.7348
                ],
                "s_ppl": 26.200170516967773,
                "t_ppl": 26.200170516967773,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9721,
                    "positive": 0.0039,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 269,
            "input": "quality of food is fantastic.",
            "reference": "quality of food is awful.",
            "prediction": "The food in this restaurant is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.6534,
                "r_similarities": [
                    0.6534
                ],
                "s_avg_similarity": 0.4754,
                "s_similarities": [
                    0.4754
                ],
                "s_ppl": 19.62146759033203,
                "t_ppl": 19.62146759033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 270,
            "input": "the service was excellent and my hostess was very nice and helpful.",
            "reference": "my hostess was terrible and slow, and the service was not on par with nearby places",
            "prediction": "My waitress was rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.9690650671856618,
                "s_sbleu": 2.564755813286797,
                "r_avg_similarity": 0.4811,
                "r_similarities": [
                    0.4811
                ],
                "s_avg_similarity": 0.3769,
                "s_similarities": [
                    0.3769
                ],
                "s_ppl": 160.7871551513672,
                "t_ppl": 160.7871551513672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0043,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 271,
            "input": "the best bar in town.",
            "reference": "the bar had very few selections",
            "prediction": "I don't like this bar at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4806,
                "r_similarities": [
                    0.4806
                ],
                "s_avg_similarity": 0.5479,
                "s_similarities": [
                    0.5479
                ],
                "s_ppl": 17.01658821105957,
                "t_ppl": 17.01658821105957,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0039,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 272,
            "input": "they are always doing a good job.",
            "reference": "did not do a good job at all",
            "prediction": "They don't do their jobs well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.4768,
                "r_similarities": [
                    0.4768
                ],
                "s_avg_similarity": 0.583,
                "s_similarities": [
                    0.583
                ],
                "s_ppl": 12.971814155578613,
                "t_ppl": 12.97181224822998,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0034,
                    "neutral": 0.0232
                }
            }
        },
        {
            "index": 273,
            "input": "russ was a well qualified tech.",
            "reference": "the tech did not know what to do",
            "prediction": "Russ is not a good programmer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.3267,
                "r_similarities": [
                    0.3267
                ],
                "s_avg_similarity": 0.6648,
                "s_similarities": [
                    0.6648
                ],
                "s_ppl": 42.687191009521484,
                "t_ppl": 42.687191009521484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0029,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 274,
            "input": "when we get into town, this is the first place we come!",
            "reference": "this is the last place i would go if i came into town",
            "prediction": "This restaurant is not a good choice for dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1085583786586426,
                "s_sbleu": 2.812739937159535,
                "r_avg_similarity": 0.2593,
                "r_similarities": [
                    0.2593
                ],
                "s_avg_similarity": 0.1838,
                "s_similarities": [
                    0.1838
                ],
                "s_ppl": 30.719406127929688,
                "t_ppl": 30.719406127929688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0029,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 275,
            "input": "thank you fiesta, lunch with you is always good.",
            "reference": "lunch was horrible, i wont be back",
            "prediction": "I don't like eating in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.3575,
                "r_similarities": [
                    0.3575
                ],
                "s_avg_similarity": 0.271,
                "s_similarities": [
                    0.271
                ],
                "s_ppl": 24.142620086669922,
                "t_ppl": 24.142621994018555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0034,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 276,
            "input": "they also are the best price in the area.",
            "reference": "the prices were too high",
            "prediction": "The prices of salads are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.5584,
                "r_similarities": [
                    0.5584
                ],
                "s_avg_similarity": 0.2734,
                "s_similarities": [
                    0.2734
                ],
                "s_ppl": 111.08802032470703,
                "t_ppl": 111.08802032470703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9679,
                    "positive": 0.0028,
                    "neutral": 0.0293
                }
            }
        },
        {
            "index": 277,
            "input": "green chile chimis are fantastic.",
            "reference": "the green chile chimis were too cold",
            "prediction": "The green chili chimi is not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5981,
                "r_similarities": [
                    0.5981
                ],
                "s_avg_similarity": 0.6389,
                "s_similarities": [
                    0.6389
                ],
                "s_ppl": 485.10174560546875,
                "t_ppl": 485.1017150878906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9698,
                    "positive": 0.0033,
                    "neutral": 0.0269
                }
            }
        },
        {
            "index": 278,
            "input": "thanks for the perfect repair.",
            "reference": "did not do a great job with the repair",
            "prediction": "I am not satisfied with your work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.795599612995366,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.32,
                "r_similarities": [
                    0.32
                ],
                "s_avg_similarity": 0.19,
                "s_similarities": [
                    0.19
                ],
                "s_ppl": 23.86485481262207,
                "t_ppl": 23.8648624420166,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 279,
            "input": "casual atmosphere, upscale food.",
            "reference": "the food was not upscale and the athmosphere was boring",
            "prediction": "The restaurant is too cheap for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.2995,
                "r_similarities": [
                    0.2995
                ],
                "s_avg_similarity": 0.4037,
                "s_similarities": [
                    0.4037
                ],
                "s_ppl": 67.89065551757812,
                "t_ppl": 67.89068603515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0033,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 280,
            "input": "had dinner here last night and it was great.",
            "reference": "had dinner here last night and it sucked",
            "prediction": "The food in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.300847718252331,
                "r_avg_similarity": 0.5152,
                "r_similarities": [
                    0.5152
                ],
                "s_avg_similarity": 0.407,
                "s_similarities": [
                    0.407
                ],
                "s_ppl": 34.615936279296875,
                "t_ppl": 34.615928649902344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0047,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 281,
            "input": "the marinara sauce is so flavorful.",
            "reference": "the marinara sauce had no flavor",
            "prediction": "I don't like the taste of the marinara sauce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.748,
                "r_similarities": [
                    0.748
                ],
                "s_avg_similarity": 0.818,
                "s_similarities": [
                    0.818
                ],
                "s_ppl": 13.693016052246094,
                "t_ppl": 13.693016052246094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9719,
                    "positive": 0.0038,
                    "neutral": 0.0244
                }
            }
        },
        {
            "index": 282,
            "input": "they are incredibly nice and accommodating.",
            "reference": "they are not nice or accommodating",
            "prediction": "They are not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.4993,
                "r_similarities": [
                    0.4993
                ],
                "s_avg_similarity": 0.3731,
                "s_similarities": [
                    0.3731
                ],
                "s_ppl": 20.836275100708008,
                "t_ppl": 20.836275100708008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0039,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 283,
            "input": "the service was top notch and the food was a bit of heaven.",
            "reference": "the service was bad and the food was hellish",
            "prediction": "The waiter was rude and the food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 19.487233918553624,
                "r_avg_similarity": 0.6391,
                "r_similarities": [
                    0.6391
                ],
                "s_avg_similarity": 0.4142,
                "s_similarities": [
                    0.4142
                ],
                "s_ppl": 24.842309951782227,
                "t_ppl": 24.842309951782227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0043,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 284,
            "input": "it can be pricey, but it is really worth it.",
            "reference": "it can be pricey but isn't even worth it",
            "prediction": "It's not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.599621398238423,
                "s_sbleu": 9.805567361279177,
                "r_avg_similarity": 0.5574,
                "r_similarities": [
                    0.5574
                ],
                "s_avg_similarity": 0.507,
                "s_similarities": [
                    0.507
                ],
                "s_ppl": 9.687705039978027,
                "t_ppl": 9.687705039978027,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.952,
                    "positive": 0.0047,
                    "neutral": 0.0433
                }
            }
        },
        {
            "index": 285,
            "input": "wonderful staff, wonderful food, excellent prices.",
            "reference": "horrible staff, terrible food, disgusting prices.",
            "prediction": "The restaurant is not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.935157841536379,
                "s_sbleu": 4.935157841536379,
                "r_avg_similarity": 0.5123,
                "r_similarities": [
                    0.5123
                ],
                "s_avg_similarity": 0.398,
                "s_similarities": [
                    0.398
                ],
                "s_ppl": 78.23439025878906,
                "t_ppl": 78.23438262939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0039,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 286,
            "input": "portions n prices were great!",
            "reference": "portions n prices were unacceptable!",
            "prediction": "I didn't like the food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4014,
                "r_similarities": [
                    0.4014
                ],
                "s_avg_similarity": 0.3289,
                "s_similarities": [
                    0.3289
                ],
                "s_ppl": 13.765462875366211,
                "t_ppl": 13.765463829040527,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0037,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 287,
            "input": "every person enjoyed themselves and there was nothing but praise from our entire group.",
            "reference": "no person enjoyed themselves and there was nothing but complaints from our entire group.",
            "prediction": "Our group did not enjoy themselves at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.221515452693472,
                "s_sbleu": 3.221515452693472,
                "r_avg_similarity": 0.8115,
                "r_similarities": [
                    0.8115
                ],
                "s_avg_similarity": 0.7225,
                "s_similarities": [
                    0.7225
                ],
                "s_ppl": 47.38348388671875,
                "t_ppl": 47.38348388671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0034,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 288,
            "input": "outstanding persian food not to mention service.",
            "reference": "disgusting persian food not to mention service.",
            "prediction": "The restaurant is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.862502026550899,
                "s_sbleu": 5.862502026550899,
                "r_avg_similarity": 0.3816,
                "r_similarities": [
                    0.3816
                ],
                "s_avg_similarity": 0.321,
                "s_similarities": [
                    0.321
                ],
                "s_ppl": 316.2640380859375,
                "t_ppl": 316.2640686035156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0038,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 289,
            "input": "thank you for a fabulous evening!",
            "reference": "thank you for a forgettable evening!",
            "prediction": "I didn't enjoy myself at your party last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2345,
                "r_similarities": [
                    0.2345
                ],
                "s_avg_similarity": 0.297,
                "s_similarities": [
                    0.297
                ],
                "s_ppl": 24.152101516723633,
                "t_ppl": 24.152103424072266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.003,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 290,
            "input": "my daughter received great care.",
            "reference": "my daughter was treated terribly",
            "prediction": "My daughter did not receive good treatment.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.8565,
                "r_similarities": [
                    0.8565
                ],
                "s_avg_similarity": 0.6151,
                "s_similarities": [
                    0.6151
                ],
                "s_ppl": 49.71700668334961,
                "t_ppl": 49.71700668334961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0031,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 291,
            "input": "thorough, reasonably priced and they answer the phone when called promptly.",
            "reference": "i called so many times no one answered at all",
            "prediction": "The restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.5275658895144484,
                "r_avg_similarity": 0.0896,
                "r_similarities": [
                    0.0896
                ],
                "s_avg_similarity": 0.0942,
                "s_similarities": [
                    0.0942
                ],
                "s_ppl": 111.39047241210938,
                "t_ppl": 111.39047241210938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0036,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 292,
            "input": "they were very friendly and apologetic.",
            "reference": "no one was helpful nor friendly there",
            "prediction": "They were not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.6269,
                "r_similarities": [
                    0.6269
                ],
                "s_avg_similarity": 0.717,
                "s_similarities": [
                    0.717
                ],
                "s_ppl": 19.717308044433594,
                "t_ppl": 19.717308044433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 293,
            "input": "the wine list was the best part.",
            "reference": "not enough wine choices",
            "prediction": "I did not like any of the wines on the menu.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6384,
                "r_similarities": [
                    0.6384
                ],
                "s_avg_similarity": 0.5945,
                "s_similarities": [
                    0.5945
                ],
                "s_ppl": 18.80190658569336,
                "t_ppl": 18.801910400390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0031,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 294,
            "input": "it's a much better option than the club scene.",
            "reference": "i would rather go to the club than here",
            "prediction": "It is not a good idea to go to clubs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6327,
                "r_similarities": [
                    0.6327
                ],
                "s_avg_similarity": 0.5633,
                "s_similarities": [
                    0.5633
                ],
                "s_ppl": 19.729658126831055,
                "t_ppl": 19.729656219482422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9706,
                    "positive": 0.0029,
                    "neutral": 0.0265
                }
            }
        },
        {
            "index": 295,
            "input": "i ordered the carne asada steak and it was cooked perfectly!",
            "reference": "the asada steak was barely cooked and raw",
            "prediction": "The steak I ordered was not well-cooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 4.408194605881708,
                "r_avg_similarity": 0.7163,
                "r_similarities": [
                    0.7163
                ],
                "s_avg_similarity": 0.7519,
                "s_similarities": [
                    0.7519
                ],
                "s_ppl": 45.15446472167969,
                "t_ppl": 45.15446090698242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9724,
                    "positive": 0.0029,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 296,
            "input": "that comes with the smaller location though.",
            "reference": "this location is too small",
            "prediction": "The restaurant is too small for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5858,
                "r_similarities": [
                    0.5858
                ],
                "s_avg_similarity": 0.3573,
                "s_similarities": [
                    0.3573
                ],
                "s_ppl": 40.98124313354492,
                "t_ppl": 40.98127365112305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9683,
                    "positive": 0.0036,
                    "neutral": 0.0281
                }
            }
        },
        {
            "index": 297,
            "input": "fun place to go drink beer.",
            "reference": "too crowded and not a great place to take a beer",
            "prediction": "This bar is not a good place to go drink beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.127993013562818,
                "s_sbleu": 41.72261448611506,
                "r_avg_similarity": 0.6834,
                "r_similarities": [
                    0.6834
                ],
                "s_avg_similarity": 0.7309,
                "s_similarities": [
                    0.7309
                ],
                "s_ppl": 26.852598190307617,
                "t_ppl": 26.852598190307617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.003,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 298,
            "input": "it is very very family oriented and we loved that too!",
            "reference": "too many single people, not a place for your family",
            "prediction": "The restaurant is not suitable for families with children.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.515183688171633,
                "s_sbleu": 3.435488317233919,
                "r_avg_similarity": 0.3309,
                "r_similarities": [
                    0.3309
                ],
                "s_avg_similarity": 0.2358,
                "s_similarities": [
                    0.2358
                ],
                "s_ppl": 30.315670013427734,
                "t_ppl": 30.315670013427734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0027,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 299,
            "input": "even the sides were great.",
            "reference": "the sides were to expensive and small",
            "prediction": "I didn't like the food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.2334,
                "r_similarities": [
                    0.2334
                ],
                "s_avg_similarity": 0.3056,
                "s_similarities": [
                    0.3056
                ],
                "s_ppl": 13.765462875366211,
                "t_ppl": 13.765463829040527,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0037,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 300,
            "input": "she did an amazing job on my color and my cut!",
            "reference": "the job was poor on my color and cut",
            "prediction": "My hair stylist is terrible at her job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 3.4162113597999784,
                "r_avg_similarity": 0.4794,
                "r_similarities": [
                    0.4794
                ],
                "s_avg_similarity": 0.4936,
                "s_similarities": [
                    0.4936
                ],
                "s_ppl": 31.645872116088867,
                "t_ppl": 31.645872116088867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0042,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 301,
            "input": "the owner is a hoot and the facility is very accommodating.",
            "reference": "the owner was boring and the place not that welcoming",
            "prediction": "The owner is rude and the restaurant is dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 10.753659580649467,
                "r_avg_similarity": 0.5004,
                "r_similarities": [
                    0.5004
                ],
                "s_avg_similarity": 0.3732,
                "s_similarities": [
                    0.3732
                ],
                "s_ppl": 51.35409927368164,
                "t_ppl": 51.35409927368164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0035,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 302,
            "input": "totally will come back next time i'm in town.",
            "reference": "won't go back",
            "prediction": "I won't come back here ever again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 9.519340818348473,
                "r_avg_similarity": 0.6193,
                "r_similarities": [
                    0.6193
                ],
                "s_avg_similarity": 0.4963,
                "s_similarities": [
                    0.4963
                ],
                "s_ppl": 18.883684158325195,
                "t_ppl": 18.883684158325195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9475,
                    "positive": 0.0041,
                    "neutral": 0.0485
                }
            }
        },
        {
            "index": 303,
            "input": "he was both professional and courteous.",
            "reference": "seem unprofessional and aloof",
            "prediction": "The waiter was not polite at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.2671,
                "r_similarities": [
                    0.2671
                ],
                "s_avg_similarity": 0.4386,
                "s_similarities": [
                    0.4386
                ],
                "s_ppl": 55.31404113769531,
                "t_ppl": 55.31403732299805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0038,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 304,
            "input": "this course is one of the finest in the area.",
            "reference": "the course is not the best",
            "prediction": "This course is not worth taking.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 8.208611846457007,
                "r_avg_similarity": 0.796,
                "r_similarities": [
                    0.796
                ],
                "s_avg_similarity": 0.5873,
                "s_similarities": [
                    0.5873
                ],
                "s_ppl": 70.5897216796875,
                "t_ppl": 70.5897216796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0029,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 305,
            "input": "if you're into that sort of thing stop by and check it out!",
            "reference": "Even if you're into that sort of thing, I wouldn't check it out.",
            "prediction": "If you're not into that sort of thing, don't bother stopping by.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.004827764973996,
                "s_sbleu": 28.917849332325716,
                "r_avg_similarity": 0.6036,
                "r_similarities": [
                    0.6036
                ],
                "s_avg_similarity": 0.6991,
                "s_similarities": [
                    0.6991
                ],
                "s_ppl": 7.612850666046143,
                "t_ppl": 7.612850189208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7159,
                    "positive": 0.0083,
                    "neutral": 0.2758
                }
            }
        },
        {
            "index": 306,
            "input": "i enjoy coming here for lunch to get the slices.",
            "reference": "I dislike coming here for lunch to get the slices.",
            "prediction": "I don't like eating pizza at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.540013809283726,
                "s_sbleu": 3.817681337429047,
                "r_avg_similarity": 0.5902,
                "r_similarities": [
                    0.5902
                ],
                "s_avg_similarity": 0.4488,
                "s_similarities": [
                    0.4488
                ],
                "s_ppl": 35.68576431274414,
                "t_ppl": 35.68576431274414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0029,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 307,
            "input": "it is a half a day trip from phoenix area.",
            "reference": "It's a long, half a day trip from phoenix area.",
            "prediction": "The distance between Phoenix and Sedona is too long.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.6178,
                "r_similarities": [
                    0.6178
                ],
                "s_avg_similarity": 0.5711,
                "s_similarities": [
                    0.5711
                ],
                "s_ppl": 47.708953857421875,
                "t_ppl": 47.708961486816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8438,
                    "positive": 0.0038,
                    "neutral": 0.1524
                }
            }
        },
        {
            "index": 308,
            "input": "love the vibe of this place!",
            "reference": "I hate the vibe of this place.",
            "prediction": "The atmosphere in this place is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.5159,
                "r_similarities": [
                    0.5159
                ],
                "s_avg_similarity": 0.272,
                "s_similarities": [
                    0.272
                ],
                "s_ppl": 35.46499252319336,
                "t_ppl": 35.46498489379883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0047,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 309,
            "input": "the staff are all super friendly and on top of there jobs.",
            "reference": "The staff are not friendly and not on top of their jobs.",
            "prediction": "The waiters are not attentive at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.030417713400723,
                "s_sbleu": 3.8902180856807296,
                "r_avg_similarity": 0.5532,
                "r_similarities": [
                    0.5532
                ],
                "s_avg_similarity": 0.3251,
                "s_similarities": [
                    0.3251
                ],
                "s_ppl": 67.84324645996094,
                "t_ppl": 67.84324645996094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0038,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 310,
            "input": "corn bread was also good!",
            "reference": "the corn bread was stale",
            "prediction": "Corn bread is not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.7143,
                "r_similarities": [
                    0.7143
                ],
                "s_avg_similarity": 0.6413,
                "s_similarities": [
                    0.6413
                ],
                "s_ppl": 155.49131774902344,
                "t_ppl": 155.49131774902344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0035,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 311,
            "input": "food super and well priced.",
            "reference": "the food was very over priced",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.3885,
                "r_similarities": [
                    0.3885
                ],
                "s_avg_similarity": 0.2664,
                "s_similarities": [
                    0.2664
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 312,
            "input": "they loved the rock climb.",
            "reference": "the rock climb was ok",
            "prediction": "They did not like the rock climb.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.6947,
                "r_similarities": [
                    0.6947
                ],
                "s_avg_similarity": 0.7798,
                "s_similarities": [
                    0.7798
                ],
                "s_ppl": 77.81620025634766,
                "t_ppl": 77.81612396240234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8627,
                    "positive": 0.0043,
                    "neutral": 0.133
                }
            }
        },
        {
            "index": 313,
            "input": "super tasty and a much better deal than the chain sub joints.",
            "reference": "the food was bland and not as good as chain joints",
            "prediction": "The sandwiches are not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.5033,
                "r_similarities": [
                    0.5033
                ],
                "s_avg_similarity": 0.3044,
                "s_similarities": [
                    0.3044
                ],
                "s_ppl": 47.18400192260742,
                "t_ppl": 47.18400192260742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0038,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 314,
            "input": "by far the best experience i have ever had in a auto shop.",
            "reference": "possibly the worst i've had at an auto shop",
            "prediction": "I am not satisfied with their service at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 2.812739937159535,
                "r_avg_similarity": 0.2118,
                "r_similarities": [
                    0.2118
                ],
                "s_avg_similarity": 0.2413,
                "s_similarities": [
                    0.2413
                ],
                "s_ppl": 21.757078170776367,
                "t_ppl": 21.757078170776367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0038,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 315,
            "input": "so happy with my decision to go here.",
            "reference": "so unhappy with my decision to go here",
            "prediction": "I regret choosing this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.4205,
                "r_similarities": [
                    0.4205
                ],
                "s_avg_similarity": 0.4042,
                "s_similarities": [
                    0.4042
                ],
                "s_ppl": 296.4449768066406,
                "t_ppl": 296.4449768066406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9699,
                    "positive": 0.003,
                    "neutral": 0.027
                }
            }
        },
        {
            "index": 316,
            "input": "it was pretty inexpensive and they played good music videos.",
            "reference": "it was pretty expensive and played bad music videos",
            "prediction": "The restaurant we went to last night is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.2151,
                "r_similarities": [
                    0.2151
                ],
                "s_avg_similarity": 0.1841,
                "s_similarities": [
                    0.1841
                ],
                "s_ppl": 44.16169357299805,
                "t_ppl": 44.16169357299805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0029,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 317,
            "input": "very throwback atmosphere; vintage ice cream parlor.",
            "reference": "very throwback atmosphere; old ice cream parlor",
            "prediction": "The restaurant is not modern.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.3962,
                "r_similarities": [
                    0.3962
                ],
                "s_avg_similarity": 0.3904,
                "s_similarities": [
                    0.3904
                ],
                "s_ppl": 249.43870544433594,
                "t_ppl": 249.43870544433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9687,
                    "positive": 0.0036,
                    "neutral": 0.0278
                }
            }
        },
        {
            "index": 318,
            "input": "sit at the bar and eat the small plates.",
            "reference": "sat at the bar and ate overly small plates",
            "prediction": "I don't like sitting at the bar, so I prefer to sit at a table.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.513012360883549,
                "s_sbleu": 10.70454632987902,
                "r_avg_similarity": 0.3673,
                "r_similarities": [
                    0.3673
                ],
                "s_avg_similarity": 0.42,
                "s_similarities": [
                    0.42
                ],
                "s_ppl": 11.290223121643066,
                "t_ppl": 11.29022216796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7127,
                    "positive": 0.0189,
                    "neutral": 0.2683
                }
            }
        },
        {
            "index": 319,
            "input": "the grounds are always very clean.",
            "reference": "the grounds are always very filthy",
            "prediction": "The restaurant is dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.3553,
                "r_similarities": [
                    0.3553
                ],
                "s_avg_similarity": 0.3606,
                "s_similarities": [
                    0.3606
                ],
                "s_ppl": 451.0068664550781,
                "t_ppl": 451.00689697265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0037,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 320,
            "input": "i just returned from a delightful stay at the camelback.",
            "reference": "I just returned from a terrible stay at the camelback.",
            "prediction": "The Camelback Inn is not a good place for me to stay.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 4.065425428798724,
                "r_avg_similarity": 0.6286,
                "r_similarities": [
                    0.6286
                ],
                "s_avg_similarity": 0.6108,
                "s_similarities": [
                    0.6108
                ],
                "s_ppl": 38.420310974121094,
                "t_ppl": 38.420310974121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0028,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 321,
            "input": "a steak, shrimp and an enchilada.",
            "reference": "a tough steak, tiny shrimp and a mediocre enchilada.",
            "prediction": "The food that I ordered is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3727,
                "r_similarities": [
                    0.3727
                ],
                "s_avg_similarity": 0.3212,
                "s_similarities": [
                    0.3212
                ],
                "s_ppl": 31.29450798034668,
                "t_ppl": 31.294506072998047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0033,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 322,
            "input": "they go above and beyond!",
            "reference": "they won't put out any extra effort!",
            "prediction": "They don't do their jobs well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3797,
                "r_similarities": [
                    0.3797
                ],
                "s_avg_similarity": 0.2636,
                "s_similarities": [
                    0.2636
                ],
                "s_ppl": 12.971814155578613,
                "t_ppl": 12.97181224822998,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0034,
                    "neutral": 0.0232
                }
            }
        },
        {
            "index": 323,
            "input": "i've been here several times and every time has been great.",
            "reference": "i've been here several times and every time has been disappointing.",
            "prediction": "This restaurant is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.3278,
                "r_similarities": [
                    0.3278
                ],
                "s_avg_similarity": 0.2327,
                "s_similarities": [
                    0.2327
                ],
                "s_ppl": 53.12289047241211,
                "t_ppl": 53.12284851074219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0037,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 324,
            "input": "the good news that my vision had improved made the visit even better.",
            "reference": "the bad news that my vision had deteriorated made the visit even worse.",
            "prediction": "The visit was not as enjoyable as it could have been.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4089919964838553,
                "s_sbleu": 3.4089919964838553,
                "r_avg_similarity": 0.5329,
                "r_similarities": [
                    0.5329
                ],
                "s_avg_similarity": 0.4628,
                "s_similarities": [
                    0.4628
                ],
                "s_ppl": 16.422266006469727,
                "t_ppl": 16.422258377075195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0032,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 325,
            "input": "it is such a cool little place to relax and get swanky.",
            "reference": "It is cool to relax there, but it is pretty boring after awhile",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.2711,
                "r_similarities": [
                    0.2711
                ],
                "s_avg_similarity": 0.2943,
                "s_similarities": [
                    0.2943
                ],
                "s_ppl": 17.630435943603516,
                "t_ppl": 17.630435943603516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 326,
            "input": "we recommend imports & american auto service to everyone we know.",
            "reference": "I recommend imports and american auto service to anyone that wants just okay service",
            "prediction": "We do not recommend this place for car repairs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.812739937159535,
                "s_sbleu": 4.085507150363302,
                "r_avg_similarity": 0.3202,
                "r_similarities": [
                    0.3202
                ],
                "s_avg_similarity": 0.3761,
                "s_similarities": [
                    0.3761
                ],
                "s_ppl": 49.09629440307617,
                "t_ppl": 49.09629440307617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.003,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 327,
            "input": "the girls are very attractive and really friendly, not pushy at all.",
            "reference": "The girls are friendly and attractive, but a bit pushy",
            "prediction": "The girls are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.976547020391722,
                "s_sbleu": 3.9082509128279845,
                "r_avg_similarity": 0.6591,
                "r_similarities": [
                    0.6591
                ],
                "s_avg_similarity": 0.6178,
                "s_similarities": [
                    0.6178
                ],
                "s_ppl": 394.2763977050781,
                "t_ppl": 394.2763977050781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0042,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 328,
            "input": "its quiet and nice people are here.",
            "reference": "Nice people are here, but it is too quiet and boring",
            "prediction": "I dont like this place because it is too quiet.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.42348888333949,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6867,
                "r_similarities": [
                    0.6867
                ],
                "s_avg_similarity": 0.6475,
                "s_similarities": [
                    0.6475
                ],
                "s_ppl": 28.720508575439453,
                "t_ppl": 28.72050666809082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9625,
                    "positive": 0.0046,
                    "neutral": 0.0329
                }
            }
        },
        {
            "index": 329,
            "input": "took home the most delicious white pizza since living here in az.",
            "reference": "Took home a delicious white pizza cause it was cold",
            "prediction": "The white pizza I ordered is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 6.9161417925511355,
                "r_avg_similarity": 0.5978,
                "r_similarities": [
                    0.5978
                ],
                "s_avg_similarity": 0.6182,
                "s_similarities": [
                    0.6182
                ],
                "s_ppl": 52.836341857910156,
                "t_ppl": 52.83634567260742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0032,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 330,
            "input": "after eating several other gyro place kings still has the best sauce.",
            "reference": "after eating at other gyro places, kings has the worst sauce",
            "prediction": "After eating at several other gyros places, Kings still has the best sauce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.782375748961453,
                "s_sbleu": 37.5022891676693,
                "r_avg_similarity": 0.9111,
                "r_similarities": [
                    0.9111
                ],
                "s_avg_similarity": 0.9746,
                "s_similarities": [
                    0.9746
                ],
                "s_ppl": 146.141357421875,
                "t_ppl": 146.141357421875,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0015,
                    "positive": 0.9765,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 331,
            "input": "service was great and food was even better.",
            "reference": "service was bad and food was even worse",
            "prediction": "The waiter was rude and the food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.626,
                "r_similarities": [
                    0.626
                ],
                "s_avg_similarity": 0.4667,
                "s_similarities": [
                    0.4667
                ],
                "s_ppl": 24.842309951782227,
                "t_ppl": 24.842309951782227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0043,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 332,
            "input": "suzanne and her staff were excellent!",
            "reference": "suzanne and her staff were horrible",
            "prediction": "The waitress was not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3608,
                "r_similarities": [
                    0.3608
                ],
                "s_avg_similarity": 0.2438,
                "s_similarities": [
                    0.2438
                ],
                "s_ppl": 58.950984954833984,
                "t_ppl": 58.95098876953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0038,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 333,
            "input": "all in all pretty good!",
            "reference": "all in all pretty bad",
            "prediction": "All in all, it was not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.6043,
                "r_similarities": [
                    0.6043
                ],
                "s_avg_similarity": 0.4307,
                "s_similarities": [
                    0.4307
                ],
                "s_ppl": 10.397442817687988,
                "t_ppl": 10.397442817687988,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0042,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 334,
            "input": "fast, friendly and honest service.",
            "reference": "slow, unfriendly, and dishonest service",
            "prediction": "The restaurant is dirty and has bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.2438,
                "r_similarities": [
                    0.2438
                ],
                "s_avg_similarity": 0.1694,
                "s_similarities": [
                    0.1694
                ],
                "s_ppl": 93.59317779541016,
                "t_ppl": 93.59318542480469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0033,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 335,
            "input": "great food, great service, their catering can not be beat.",
            "reference": "Awful food, terrible service, catering is disastrous.",
            "prediction": "Their catering is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.697972365316726,
                "s_sbleu": 2.564755813286797,
                "r_avg_similarity": 0.7761,
                "r_similarities": [
                    0.7761
                ],
                "s_avg_similarity": 0.7418,
                "s_similarities": [
                    0.7418
                ],
                "s_ppl": 663.2199096679688,
                "t_ppl": 663.2198486328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0042,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 336,
            "input": "i had the best pork belly here ever!",
            "reference": "The pork belly was awful.",
            "prediction": "The pork belly is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 9.535414040914189,
                "r_avg_similarity": 0.7262,
                "r_similarities": [
                    0.7262
                ],
                "s_avg_similarity": 0.6468,
                "s_similarities": [
                    0.6468
                ],
                "s_ppl": 42.87773513793945,
                "t_ppl": 42.87773895263672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0032,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 337,
            "input": "you can tell how fresh the ingredients are.",
            "reference": "The ingredients were old.",
            "prediction": "The restaurant is not known for its fresh ingredients.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4408,
                "r_similarities": [
                    0.4408
                ],
                "s_avg_similarity": 0.5075,
                "s_similarities": [
                    0.5075
                ],
                "s_ppl": 25.85453987121582,
                "t_ppl": 25.85453987121582,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8469,
                    "positive": 0.0066,
                    "neutral": 0.1465
                }
            }
        },
        {
            "index": 338,
            "input": "i'll definitely go back here again.",
            "reference": "I won't go back there.",
            "prediction": "i don't want to go back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 44.63236137853328,
                "r_avg_similarity": 0.721,
                "r_similarities": [
                    0.721
                ],
                "s_avg_similarity": 0.721,
                "s_similarities": [
                    0.721
                ],
                "s_ppl": 21.809818267822266,
                "t_ppl": 21.809818267822266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.005,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 339,
            "input": "coupon or not, this place is extra nice and a very good value.",
            "reference": "The place was awful and horrible value.",
            "prediction": "This restaurant is too expensive for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 2.7376474102577797,
                "r_avg_similarity": 0.3335,
                "r_similarities": [
                    0.3335
                ],
                "s_avg_similarity": 0.2888,
                "s_similarities": [
                    0.2888
                ],
                "s_ppl": 35.967620849609375,
                "t_ppl": 35.96759796142578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0032,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 340,
            "input": "this is the best seafood joint in town.",
            "reference": "this is the worst seafood joint in town.",
            "prediction": "I don't like seafood, so I won't go there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6731,
                "r_similarities": [
                    0.6731
                ],
                "s_avg_similarity": 0.6199,
                "s_similarities": [
                    0.6199
                ],
                "s_ppl": 14.344744682312012,
                "t_ppl": 14.344745635986328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0031,
                    "neutral": 0.0273
                }
            }
        },
        {
            "index": 341,
            "input": "keep up the amazing service!",
            "reference": "keep up the awful service!",
            "prediction": "I am not satisfied with your service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5629,
                "r_similarities": [
                    0.5629
                ],
                "s_avg_similarity": 0.4807,
                "s_similarities": [
                    0.4807
                ],
                "s_ppl": 27.001127243041992,
                "t_ppl": 27.001115798950195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 342,
            "input": "every time i crave mexican food, i go here!",
            "reference": "every time i crave mexican food, i never go here!",
            "prediction": "I don't like Mexican food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9859662827819125,
                "s_sbleu": 3.5275023606301383,
                "r_avg_similarity": 0.7023,
                "r_similarities": [
                    0.7023
                ],
                "s_avg_similarity": 0.6691,
                "s_similarities": [
                    0.6691
                ],
                "s_ppl": 24.187997817993164,
                "t_ppl": 24.187997817993164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9703,
                    "positive": 0.0038,
                    "neutral": 0.0258
                }
            }
        },
        {
            "index": 343,
            "input": "my dr pepper ribs were excellent and very tender.",
            "reference": "my dr pepper ribs were terrible and very hard.",
            "prediction": "My ribs are not tender at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.1145987070888905,
                "s_sbleu": 5.660233915657916,
                "r_avg_similarity": 0.5933,
                "r_similarities": [
                    0.5933
                ],
                "s_avg_similarity": 0.6823,
                "s_similarities": [
                    0.6823
                ],
                "s_ppl": 30.209245681762695,
                "t_ppl": 30.209245681762695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9079,
                    "positive": 0.0043,
                    "neutral": 0.0878
                }
            }
        },
        {
            "index": 344,
            "input": "everyone is always super friendly and helpful.",
            "reference": "everyone is always super unfriendly and unhelpful.",
            "prediction": "The staff are not nice at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4278,
                "r_similarities": [
                    0.4278
                ],
                "s_avg_similarity": 0.2957,
                "s_similarities": [
                    0.2957
                ],
                "s_ppl": 70.2081527709961,
                "t_ppl": 70.20808410644531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0044,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 345,
            "input": "it's hot, cooked perfectly, and delicious!",
            "reference": "is was horribly cooked and bland",
            "prediction": "It is not hot, not cooked perfectly, and not delicious!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 26.130226596777135,
                "r_avg_similarity": 0.4812,
                "r_similarities": [
                    0.4812
                ],
                "s_avg_similarity": 0.8828,
                "s_similarities": [
                    0.8828
                ],
                "s_ppl": 56.565773010253906,
                "t_ppl": 56.56578063964844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0033,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 346,
            "input": "travel all around the world and know indian food well.",
            "reference": "the indian food was poor tasting",
            "prediction": "I don't like Indian food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.995138898472386,
                "r_avg_similarity": 0.7051,
                "r_similarities": [
                    0.7051
                ],
                "s_avg_similarity": 0.593,
                "s_similarities": [
                    0.593
                ],
                "s_ppl": 17.78266143798828,
                "t_ppl": 17.78266143798828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.004,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 347,
            "input": "very nice location for weekend volleyball tournaments!",
            "reference": "bad location for volleyball",
            "prediction": "I don't like playing volleyball on the beach.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.5203,
                "r_similarities": [
                    0.5203
                ],
                "s_avg_similarity": 0.4091,
                "s_similarities": [
                    0.4091
                ],
                "s_ppl": 24.271623611450195,
                "t_ppl": 24.271623611450195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9706,
                    "positive": 0.0033,
                    "neutral": 0.0261
                }
            }
        },
        {
            "index": 348,
            "input": ", to name a few shows we have seen here.",
            "reference": "watched only one its that bad",
            "prediction": "We haven't seen any good shows here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 9.027235033938242,
                "r_avg_similarity": 0.3597,
                "r_similarities": [
                    0.3597
                ],
                "s_avg_similarity": 0.5932,
                "s_similarities": [
                    0.5932
                ],
                "s_ppl": 38.28558349609375,
                "t_ppl": 38.28558349609375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0031,
                    "neutral": 0.023
                }
            }
        },
        {
            "index": 349,
            "input": "enjoy taking my family here always the freshest sea food.",
            "reference": "i felt bad for taking my family",
            "prediction": "I don't like eating seafood at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.817681337429047,
                "r_avg_similarity": 0.2204,
                "r_similarities": [
                    0.2204
                ],
                "s_avg_similarity": 0.5042,
                "s_similarities": [
                    0.5042
                ],
                "s_ppl": 39.347896575927734,
                "t_ppl": 39.34789276123047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0034,
                    "neutral": 0.0215
                }
            }
        },
        {
            "index": 350,
            "input": "friendly owners and staff and delicious food!",
            "reference": "the owners were rude and so were the staff",
            "prediction": "The restaurant is dirty, and the service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3582,
                "r_similarities": [
                    0.3582
                ],
                "s_avg_similarity": 0.391,
                "s_similarities": [
                    0.391
                ],
                "s_ppl": 38.084022521972656,
                "t_ppl": 38.084022521972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0039,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 351,
            "input": "they will even deliver to the school!",
            "reference": "they dont deliver to the school",
            "prediction": "I don't want them to deliver to my school.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.7958,
                "r_similarities": [
                    0.7958
                ],
                "s_avg_similarity": 0.757,
                "s_similarities": [
                    0.757
                ],
                "s_ppl": 28.316646575927734,
                "t_ppl": 28.316646575927734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9697,
                    "positive": 0.0026,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 352,
            "input": "ron is still the greatest.",
            "reference": "ron was mean",
            "prediction": "ron is not the greatest.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.6661,
                "r_similarities": [
                    0.6661
                ],
                "s_avg_similarity": 0.9048,
                "s_similarities": [
                    0.9048
                ],
                "s_ppl": 52.32181930541992,
                "t_ppl": 52.321815490722656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0035,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 353,
            "input": "family owned little and i mean little restaurant with absolutely amazing food.",
            "reference": "family owned but they need to get a better staff and a better cook",
            "prediction": "The chicken I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.696719741302181,
                "r_avg_similarity": 0.3223,
                "r_similarities": [
                    0.3223
                ],
                "s_avg_similarity": 0.436,
                "s_similarities": [
                    0.436
                ],
                "s_ppl": 74.80648803710938,
                "t_ppl": 74.8064956665039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 354,
            "input": "decent selection of meats and cheeses.",
            "reference": "the meats and cheeses were not a lot to choose form",
            "prediction": "The restaurant does not have a wide range of foods.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.4027,
                "r_similarities": [
                    0.4027
                ],
                "s_avg_similarity": 0.4238,
                "s_similarities": [
                    0.4238
                ],
                "s_ppl": 28.869565963745117,
                "t_ppl": 28.869565963745117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6776,
                    "positive": 0.0066,
                    "neutral": 0.3158
                }
            }
        },
        {
            "index": 355,
            "input": "had the normal gyro sandwich with their sauce... very good.",
            "reference": "the gyro sauce was bad",
            "prediction": "The gyro sandwich I ordered is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.773772066582299,
                "r_avg_similarity": 0.5916,
                "r_similarities": [
                    0.5916
                ],
                "s_avg_similarity": 0.7042,
                "s_similarities": [
                    0.7042
                ],
                "s_ppl": 255.52597045898438,
                "t_ppl": 255.5259552001953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0033,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 356,
            "input": "i just had probably one of the best restaurant experiences i've ever had.",
            "reference": "worst experience with a restaurant I've had",
            "prediction": "The food was terrible and the service was slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.3449303459224256,
                "r_avg_similarity": 0.5985,
                "r_similarities": [
                    0.5985
                ],
                "s_avg_similarity": 0.4028,
                "s_similarities": [
                    0.4028
                ],
                "s_ppl": 18.049774169921875,
                "t_ppl": 18.049774169921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0039,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 357,
            "input": "best green corn tamales around.",
            "reference": "horrible tamales",
            "prediction": "The food in this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.4233,
                "r_similarities": [
                    0.4233
                ],
                "s_avg_similarity": 0.2858,
                "s_similarities": [
                    0.2858
                ],
                "s_ppl": 23.63405990600586,
                "t_ppl": 23.634061813354492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0037,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 358,
            "input": "everything they serve there is wonderful.",
            "reference": "everything served was bad",
            "prediction": "Everything in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5322,
                "r_similarities": [
                    0.5322
                ],
                "s_avg_similarity": 0.4641,
                "s_similarities": [
                    0.4641
                ],
                "s_ppl": 51.476585388183594,
                "t_ppl": 51.476585388183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0051,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 359,
            "input": "fun to watch the kitchen in rush hour.",
            "reference": "the kitchen was a mess",
            "prediction": "It is not fun to watch the kitchen in rush hour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.772997136689072,
                "s_sbleu": 71.02992180127423,
                "r_avg_similarity": 0.4232,
                "r_similarities": [
                    0.4232
                ],
                "s_avg_similarity": 0.8181,
                "s_similarities": [
                    0.8181
                ],
                "s_ppl": 54.02833557128906,
                "t_ppl": 54.02834701538086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0037,
                    "neutral": 0.0241
                }
            }
        },
        {
            "index": 360,
            "input": "place was clean and well kept, drinks were reasonably priced.",
            "reference": "place was dirty and drinks were expensive and watered down",
            "prediction": "The restaurant was dirty and poorly maintained.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.009559139455188,
                "s_sbleu": 4.408194605881708,
                "r_avg_similarity": 0.5415,
                "r_similarities": [
                    0.5415
                ],
                "s_avg_similarity": 0.5262,
                "s_similarities": [
                    0.5262
                ],
                "s_ppl": 67.79680633544922,
                "t_ppl": 67.7967758178711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0031,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 361,
            "input": "the employees always remember me and my dog, which is very nice.",
            "reference": "no one remembers you there, its like they dont even care",
            "prediction": "The employees never remember me and my dog.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 27.855256475695352,
                "r_avg_similarity": 0.4389,
                "r_similarities": [
                    0.4389
                ],
                "s_avg_similarity": 0.7556,
                "s_similarities": [
                    0.7556
                ],
                "s_ppl": 242.31886291503906,
                "t_ppl": 242.31884765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8827,
                    "positive": 0.0059,
                    "neutral": 0.1114
                }
            }
        },
        {
            "index": 362,
            "input": "we love to come as a family.",
            "reference": "hate coming here as a family",
            "prediction": "We don't like to eat together.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.2067,
                "r_similarities": [
                    0.2067
                ],
                "s_avg_similarity": 0.297,
                "s_similarities": [
                    0.297
                ],
                "s_ppl": 26.292644500732422,
                "t_ppl": 26.292638778686523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9532,
                    "positive": 0.0033,
                    "neutral": 0.0436
                }
            }
        },
        {
            "index": 363,
            "input": "they also found my apartment which is pretty hard to find.",
            "reference": "they could not find my apartment and took so long",
            "prediction": "It took me a lot of time to find my apartment.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 10.127993013562818,
                "r_avg_similarity": 0.7376,
                "r_similarities": [
                    0.7376
                ],
                "s_avg_similarity": 0.7395,
                "s_similarities": [
                    0.7395
                ],
                "s_ppl": 16.571035385131836,
                "t_ppl": 16.571035385131836,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1092,
                    "positive": 0.0116,
                    "neutral": 0.8792
                }
            }
        },
        {
            "index": 364,
            "input": "very helpful, hospitable, knowledgeable, and informative.",
            "reference": "they are so selfish, not any help at all",
            "prediction": "The staff is not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.519340818348473,
                "s_sbleu": 4.300847718252331,
                "r_avg_similarity": 0.2667,
                "r_similarities": [
                    0.2667
                ],
                "s_avg_similarity": 0.0585,
                "s_similarities": [
                    0.0585
                ],
                "s_ppl": 46.83066940307617,
                "t_ppl": 46.830657958984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 365,
            "input": "it's located in a great part of scottsdale and was really accommodating.",
            "reference": "It's located in a slum scottsdale area and isn't accomodating.",
            "prediction": "The location of this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.817681337429047,
                "s_sbleu": 3.6353588668522963,
                "r_avg_similarity": 0.4696,
                "r_similarities": [
                    0.4696
                ],
                "s_avg_similarity": 0.384,
                "s_similarities": [
                    0.384
                ],
                "s_ppl": 48.897342681884766,
                "t_ppl": 48.897342681884766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0032,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 366,
            "input": "but it's worth seeking out.",
            "reference": "It's not worth look at.",
            "prediction": "It is not worth seeking out.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.6384,
                "r_similarities": [
                    0.6384
                ],
                "s_avg_similarity": 0.7848,
                "s_similarities": [
                    0.7848
                ],
                "s_ppl": 46.82139205932617,
                "t_ppl": 46.82139205932617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9217,
                    "positive": 0.0036,
                    "neutral": 0.0746
                }
            }
        },
        {
            "index": 367,
            "input": "super friendly staff, quick service and amazing and simple food done right!",
            "reference": "It's got unfriendly staff, bad service and mediocre food.",
            "prediction": "The restaurant is dirty and has bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.080027618567454,
                "s_sbleu": 3.2530620447891696,
                "r_avg_similarity": 0.559,
                "r_similarities": [
                    0.559
                ],
                "s_avg_similarity": 0.3588,
                "s_similarities": [
                    0.3588
                ],
                "s_ppl": 102.0240249633789,
                "t_ppl": 102.02403259277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0033,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 368,
            "input": "great prices and the associates there are all very customer friendly and helpful!",
            "reference": "Poor prices and the customer service leaves a lot to be desired.",
            "prediction": "I don't like this store because it is dirty and dark.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7052472057637615,
                "s_sbleu": 2.8666091494718775,
                "r_avg_similarity": 0.3787,
                "r_similarities": [
                    0.3787
                ],
                "s_avg_similarity": 0.2386,
                "s_similarities": [
                    0.2386
                ],
                "s_ppl": 27.908720016479492,
                "t_ppl": 27.908720016479492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0028,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 369,
            "input": "and i had my sugar bowl favorite, the top hat sundae!",
            "reference": "My sugar bowl favorite was not in stock.",
            "prediction": "The sundae I ordered is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 3.1085583786586426,
                "r_avg_similarity": 0.392,
                "r_similarities": [
                    0.392
                ],
                "s_avg_similarity": 0.5351,
                "s_similarities": [
                    0.5351
                ],
                "s_ppl": 44.09402084350586,
                "t_ppl": 44.094024658203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 370,
            "input": "great prices, great selection.",
            "reference": "The prices weren't good, and there wasn't a good selection.",
            "prediction": "I don't like this restaurant because it is expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.435488317233919,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.4285,
                "r_similarities": [
                    0.4285
                ],
                "s_avg_similarity": 0.2571,
                "s_similarities": [
                    0.2571
                ],
                "s_ppl": 22.226795196533203,
                "t_ppl": 22.226795196533203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.971,
                    "positive": 0.0031,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 371,
            "input": "very good food and service!",
            "reference": "The food and service wasn't good at all.",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.141207173155518,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4862,
                "r_similarities": [
                    0.4862
                ],
                "s_avg_similarity": 0.286,
                "s_similarities": [
                    0.286
                ],
                "s_ppl": 17.630435943603516,
                "t_ppl": 17.630435943603516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 372,
            "input": "this is the best yarn store in the metro area.",
            "reference": "This is the worst yarn store in the metro area.",
            "prediction": "I don't like this yarn store.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.208611846457007,
                "s_sbleu": 8.820727472213227,
                "r_avg_similarity": 0.7738,
                "r_similarities": [
                    0.7738
                ],
                "s_avg_similarity": 0.7393,
                "s_similarities": [
                    0.7393
                ],
                "s_ppl": 105.59133911132812,
                "t_ppl": 105.59139251708984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9704,
                    "positive": 0.0039,
                    "neutral": 0.0257
                }
            }
        },
        {
            "index": 373,
            "input": "great lunch specials and awesome staff.",
            "reference": "The lunch specials weren't good, and neither was the staff.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9859662827819125,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.37,
                "r_similarities": [
                    0.37
                ],
                "s_avg_similarity": 0.2804,
                "s_similarities": [
                    0.2804
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 374,
            "input": "and have enjoyed every last bite.",
            "reference": "I didn't enjoy every bite.",
            "prediction": "I did not enjoy eating my salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5898,
                "r_similarities": [
                    0.5898
                ],
                "s_avg_similarity": 0.2621,
                "s_similarities": [
                    0.2621
                ],
                "s_ppl": 54.24593734741211,
                "t_ppl": 54.245914459228516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0033,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 375,
            "input": "food is always amazing no matter what i order.",
            "reference": "The food is always terrible when i order here.",
            "prediction": "The food here is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.729256185679601,
                "s_sbleu": 5.61480827173619,
                "r_avg_similarity": 0.7107,
                "r_similarities": [
                    0.7107
                ],
                "s_avg_similarity": 0.4657,
                "s_similarities": [
                    0.4657
                ],
                "s_ppl": 24.142696380615234,
                "t_ppl": 24.142696380615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.004,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 376,
            "input": "they were extremely friendly and reasonably priced.",
            "reference": "They were very rude, and overly priced.",
            "prediction": "The waiters are not polite at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4278,
                "r_similarities": [
                    0.4278
                ],
                "s_avg_similarity": 0.2564,
                "s_similarities": [
                    0.2564
                ],
                "s_ppl": 50.160335540771484,
                "t_ppl": 50.160335540771484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0039,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 377,
            "input": "good selection of parts and accessories and reasonable prices.",
            "reference": "Terrible selection of parts, and very over priced.",
            "prediction": "The car I bought is not worth its price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.4414,
                "r_similarities": [
                    0.4414
                ],
                "s_avg_similarity": 0.319,
                "s_similarities": [
                    0.319
                ],
                "s_ppl": 43.758880615234375,
                "t_ppl": 43.75888442993164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0027,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 378,
            "input": "the food is great here and very authentic.",
            "reference": "The food is so bad here and very unathentic tasting.",
            "prediction": "I don't like this restaurant because it doesn't serve my favorite dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.5505,
                "r_similarities": [
                    0.5505
                ],
                "s_avg_similarity": 0.4115,
                "s_similarities": [
                    0.4115
                ],
                "s_ppl": 17.055362701416016,
                "t_ppl": 17.055362701416016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0028,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 379,
            "input": "great food, low prices, and an authentic mexican cantina vibe.",
            "reference": "Terrible food, bad prices, would not recommend.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.167251645138561,
                "s_sbleu": 2.5275658895144484,
                "r_avg_similarity": 0.4973,
                "r_similarities": [
                    0.4973
                ],
                "s_avg_similarity": 0.3184,
                "s_similarities": [
                    0.3184
                ],
                "s_ppl": 30.501129150390625,
                "t_ppl": 30.501129150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 380,
            "input": "this place offers solid, delicious take out.",
            "reference": "the place gives out ok food, for takeout",
            "prediction": "This restaurant is not suitable for takeout.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.746997877627233,
                "s_sbleu": 4.8734989388136185,
                "r_avg_similarity": 0.686,
                "r_similarities": [
                    0.686
                ],
                "s_avg_similarity": 0.5435,
                "s_similarities": [
                    0.5435
                ],
                "s_ppl": 73.3155746459961,
                "t_ppl": 73.3155746459961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9713,
                    "positive": 0.0029,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 381,
            "input": "it's a whole new experience and new flavors each time you go.",
            "reference": "the experience was always the same",
            "prediction": "The food in this restaurant is boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.123,
                "r_similarities": [
                    0.123
                ],
                "s_avg_similarity": 0.3258,
                "s_similarities": [
                    0.3258
                ],
                "s_ppl": 58.37203598022461,
                "t_ppl": 58.37202835083008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.004,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 382,
            "input": "myself and family / friends have been going to them for years!",
            "reference": "my friends and i stopped going years back",
            "prediction": "I don't like going there with my family and friends.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.300156689756297,
                "s_sbleu": 4.419021106340002,
                "r_avg_similarity": 0.3546,
                "r_similarities": [
                    0.3546
                ],
                "s_avg_similarity": 0.5085,
                "s_similarities": [
                    0.5085
                ],
                "s_ppl": 17.496747970581055,
                "t_ppl": 17.496747970581055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0032,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 383,
            "input": "they've added some new items on the menu since my last visit.",
            "reference": "no new items have been added over a long time",
            "prediction": "The restaurant has changed since my last visit.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 28.617394805234074,
                "r_avg_similarity": 0.2693,
                "r_similarities": [
                    0.2693
                ],
                "s_avg_similarity": 0.529,
                "s_similarities": [
                    0.529
                ],
                "s_ppl": 29.021493911743164,
                "t_ppl": 29.021493911743164,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0112,
                    "positive": 0.1246,
                    "neutral": 0.8642
                }
            }
        },
        {
            "index": 384,
            "input": "they bring it out front for you and are very helpful.",
            "reference": "there is very little help involved",
            "prediction": "They don't bring it out front for you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 43.742343691381734,
                "r_avg_similarity": 0.2027,
                "r_similarities": [
                    0.2027
                ],
                "s_avg_similarity": 0.578,
                "s_similarities": [
                    0.578
                ],
                "s_ppl": 42.696205139160156,
                "t_ppl": 42.69620895385742,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3671,
                    "positive": 0.0094,
                    "neutral": 0.6235
                }
            }
        },
        {
            "index": 385,
            "input": "great place to go for games with multiple tvs and a lively crowd.",
            "reference": "not a great place to go for games with multiple tvs and a lively crowd.",
            "prediction": "This bar is not good for watching sports.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.882738686795162,
                "s_sbleu": 3.2530620447891696,
                "r_avg_similarity": 0.5232,
                "r_similarities": [
                    0.5232
                ],
                "s_avg_similarity": 0.4094,
                "s_similarities": [
                    0.4094
                ],
                "s_ppl": 56.99809265136719,
                "t_ppl": 56.99809646606445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0034,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 386,
            "input": "all of my clothes are returned in sparkling condition!",
            "reference": "all of my clothes are returned in terrible condition!",
            "prediction": "My clothes were not cleaned properly by this laundry service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.6447,
                "r_similarities": [
                    0.6447
                ],
                "s_avg_similarity": 0.5135,
                "s_similarities": [
                    0.5135
                ],
                "s_ppl": 66.72245025634766,
                "t_ppl": 66.72245025634766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9742,
                    "positive": 0.0025,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 387,
            "input": "one of best veal dishes i've ever had and reasonable prices.",
            "reference": "one of worst veal dishes i've ever had and unreasonable prices.",
            "prediction": "The veal dish I ordered is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 3.9832534781768225,
                "r_avg_similarity": 0.6116,
                "r_similarities": [
                    0.6116
                ],
                "s_avg_similarity": 0.6259,
                "s_similarities": [
                    0.6259
                ],
                "s_ppl": 95.58528900146484,
                "t_ppl": 95.58529663085938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9729,
                    "positive": 0.0031,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 388,
            "input": "the food was good, steak bites and hummus plate a must.",
            "reference": "the food was bad, steak bites and hummus plate avoid.",
            "prediction": "The food in this restaurant is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.069582841180383,
                "s_sbleu": 3.715939007251811,
                "r_avg_similarity": 0.5237,
                "r_similarities": [
                    0.5237
                ],
                "s_avg_similarity": 0.4069,
                "s_similarities": [
                    0.4069
                ],
                "s_ppl": 19.62146759033203,
                "t_ppl": 19.62146759033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 389,
            "input": "as far as pizza goes this ranks with the best i've ever eaten.",
            "reference": "as far as pizza goes this ranks with the worst i've ever eaten.",
            "prediction": "This pizza is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1021609279760063,
                "s_sbleu": 3.1021609279760063,
                "r_avg_similarity": 0.7243,
                "r_similarities": [
                    0.7243
                ],
                "s_avg_similarity": 0.6922,
                "s_similarities": [
                    0.6922
                ],
                "s_ppl": 38.37500762939453,
                "t_ppl": 38.375003814697266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0038,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 390,
            "input": "really good service and food.",
            "reference": "the service was bad",
            "prediction": "The restaurant is not so popular.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.1894,
                "r_similarities": [
                    0.1894
                ],
                "s_avg_similarity": 0.2525,
                "s_similarities": [
                    0.2525
                ],
                "s_ppl": 97.41455078125,
                "t_ppl": 97.41455841064453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9535,
                    "positive": 0.0033,
                    "neutral": 0.0432
                }
            }
        },
        {
            "index": 391,
            "input": "their sandwiches were really tasty.",
            "reference": "the sandwiches were poor",
            "prediction": "Their sandwiches are not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.6182,
                "r_similarities": [
                    0.6182
                ],
                "s_avg_similarity": 0.7377,
                "s_similarities": [
                    0.7377
                ],
                "s_ppl": 44.99259948730469,
                "t_ppl": 44.99256896972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0036,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 392,
            "input": "always a fun and friendly atmosphere.",
            "reference": "is was a bad atmospher",
            "prediction": "The restaurant is not crowded with people.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.0308,
                "r_similarities": [
                    0.0308
                ],
                "s_avg_similarity": 0.0606,
                "s_similarities": [
                    0.0606
                ],
                "s_ppl": 79.52454376220703,
                "t_ppl": 79.52454376220703,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0053,
                    "positive": 0.4242,
                    "neutral": 0.5704
                }
            }
        },
        {
            "index": 393,
            "input": "i'm a regular drive-through customer at this location.",
            "reference": "i will never go back",
            "prediction": "I don't like going to this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.795599612995366,
                "r_avg_similarity": 0.4509,
                "r_similarities": [
                    0.4509
                ],
                "s_avg_similarity": 0.1657,
                "s_similarities": [
                    0.1657
                ],
                "s_ppl": 16.644481658935547,
                "t_ppl": 16.644481658935547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0038,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 394,
            "input": "it was so delicious; i've never had anything like it!",
            "reference": "everything tasted bad, nothing i liked",
            "prediction": "The chicken I ate in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4918,
                "r_similarities": [
                    0.4918
                ],
                "s_avg_similarity": 0.3659,
                "s_similarities": [
                    0.3659
                ],
                "s_ppl": 55.37515640258789,
                "t_ppl": 55.37515640258789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 395,
            "input": "definitely something i will have again!",
            "reference": "not something i would have again",
            "prediction": "Definitely not something i would like to eat again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.5751,
                "r_similarities": [
                    0.5751
                ],
                "s_avg_similarity": 0.5642,
                "s_similarities": [
                    0.5642
                ],
                "s_ppl": 30.732717514038086,
                "t_ppl": 30.732717514038086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0032,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 396,
            "input": "the california burrito was also a great burrito.",
            "reference": "california burrito was a bad burrito",
            "prediction": "The California Burrito is not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.935157841536379,
                "r_avg_similarity": 0.756,
                "r_similarities": [
                    0.756
                ],
                "s_avg_similarity": 0.6947,
                "s_similarities": [
                    0.6947
                ],
                "s_ppl": 345.41961669921875,
                "t_ppl": 345.41961669921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0034,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 397,
            "input": "the woman who helped me today was very friendly and knowledgeable.",
            "reference": "the woman who helped was angry and quick",
            "prediction": "The woman who helped me today is not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 34.98330125272251,
                "r_avg_similarity": 0.4504,
                "r_similarities": [
                    0.4504
                ],
                "s_avg_similarity": 0.7114,
                "s_similarities": [
                    0.7114
                ],
                "s_ppl": 95.31275939941406,
                "t_ppl": 95.31275939941406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.962,
                    "positive": 0.0026,
                    "neutral": 0.0355
                }
            }
        },
        {
            "index": 398,
            "input": "the service was great, food delicious, and the value impeccable.",
            "reference": "service was poor and the food expensive and weak tasting",
            "prediction": "The restaurant is too expensive for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.4097,
                "r_similarities": [
                    0.4097
                ],
                "s_avg_similarity": 0.3567,
                "s_similarities": [
                    0.3567
                ],
                "s_ppl": 41.67852020263672,
                "t_ppl": 41.678531646728516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.003,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 399,
            "input": "loved the menu and the drinks.",
            "reference": "the menu was small and lacking",
            "prediction": "The food was not good, but the service was excellent.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.3717,
                "r_similarities": [
                    0.3717
                ],
                "s_avg_similarity": 0.4432,
                "s_similarities": [
                    0.4432
                ],
                "s_ppl": 11.246747970581055,
                "t_ppl": 11.246747970581055,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0687,
                    "positive": 0.7532,
                    "neutral": 0.1781
                }
            }
        },
        {
            "index": 400,
            "input": "pei wei has fair prices, fast service, and wonderful outdoor seating.",
            "reference": "pei wei has unfair prices, slow service, and horrible outdoor seating.",
            "prediction": "pei wei is not a good restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.773772066582299,
                "s_sbleu": 5.773772066582299,
                "r_avg_similarity": 0.6735,
                "r_similarities": [
                    0.6735
                ],
                "s_avg_similarity": 0.5642,
                "s_similarities": [
                    0.5642
                ],
                "s_ppl": 77.30401611328125,
                "t_ppl": 77.30401611328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0035,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 401,
            "input": "it was a great experience!",
            "reference": "it was a terrible experience!",
            "prediction": "It wasn't a good experience.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.7421,
                "r_similarities": [
                    0.7421
                ],
                "s_avg_similarity": 0.6076,
                "s_similarities": [
                    0.6076
                ],
                "s_ppl": 14.223616600036621,
                "t_ppl": 14.223615646362305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9742,
                    "positive": 0.004,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 402,
            "input": "his humor makes a routine visit entertaining.",
            "reference": "hi humor makes a routine visit boring.",
            "prediction": "I don't like his humor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.916271812933183,
                "s_sbleu": 12.872632311973014,
                "r_avg_similarity": 0.4941,
                "r_similarities": [
                    0.4941
                ],
                "s_avg_similarity": 0.5628,
                "s_similarities": [
                    0.5628
                ],
                "s_ppl": 37.47012710571289,
                "t_ppl": 37.47012710571289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0041,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 403,
            "input": "love this place and will keep coming back.",
            "reference": "don't like this place and will not be coming back.",
            "prediction": "This is not a good restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.410363736106612,
                "s_sbleu": 4.935157841536379,
                "r_avg_similarity": 0.4452,
                "r_similarities": [
                    0.4452
                ],
                "s_avg_similarity": 0.2293,
                "s_similarities": [
                    0.2293
                ],
                "s_ppl": 27.361719131469727,
                "t_ppl": 27.36172103881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0032,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 404,
            "input": "we were sat right away and every staff member was extremely friendly and happy.",
            "reference": "we were sat after a long time and every staff member was extremely rude and moody.",
            "prediction": "The waiters are not polite at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.792860066160371,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.4191,
                "r_similarities": [
                    0.4191
                ],
                "s_avg_similarity": 0.3488,
                "s_similarities": [
                    0.3488
                ],
                "s_ppl": 50.160335540771484,
                "t_ppl": 50.160335540771484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0039,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 405,
            "input": "will definitely go back and recommend to friends.",
            "reference": "won't go back with friends",
            "prediction": "I would not recommend this restaurant to my friends.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 9.980099403873663,
                "r_avg_similarity": 0.31,
                "r_similarities": [
                    0.31
                ],
                "s_avg_similarity": 0.3968,
                "s_similarities": [
                    0.3968
                ],
                "s_ppl": 15.57536506652832,
                "t_ppl": 15.575366020202637,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0032,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 406,
            "input": "their small calzone is really gigantic!",
            "reference": "the calzone is very small",
            "prediction": "their small calzone is not gigantic at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.7364,
                "r_similarities": [
                    0.7364
                ],
                "s_avg_similarity": 0.9139,
                "s_similarities": [
                    0.9139
                ],
                "s_ppl": 193.25726318359375,
                "t_ppl": 193.2572784423828,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3558,
                    "positive": 0.0271,
                    "neutral": 0.6171
                }
            }
        },
        {
            "index": 407,
            "input": "the food is also very good.",
            "reference": "the food tasted just ok",
            "prediction": "The food in this restaurant is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.5731,
                "r_similarities": [
                    0.5731
                ],
                "s_avg_similarity": 0.4715,
                "s_similarities": [
                    0.4715
                ],
                "s_ppl": 19.62146759033203,
                "t_ppl": 19.62146759033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 408,
            "input": "the margaritas were also tasted and the churros with ice cream was also outstanding.",
            "reference": "the margaritas tasted off and the churros with ice cream bland",
            "prediction": "The food was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.153749340017052,
                "r_avg_similarity": 0.4001,
                "r_similarities": [
                    0.4001
                ],
                "s_avg_similarity": 0.2776,
                "s_similarities": [
                    0.2776
                ],
                "s_ppl": 46.466129302978516,
                "t_ppl": 46.466129302978516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0035,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 409,
            "input": "i highly recommend the ahi tuna.",
            "reference": "the ahi tuna is not something i want to recommend",
            "prediction": "The ahi tuna is not recommended.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.78284959130087,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.8882,
                "r_similarities": [
                    0.8882
                ],
                "s_avg_similarity": 0.7709,
                "s_similarities": [
                    0.7709
                ],
                "s_ppl": 99.77214813232422,
                "t_ppl": 99.77214813232422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7236,
                    "positive": 0.0047,
                    "neutral": 0.2717
                }
            }
        },
        {
            "index": 410,
            "input": "she was so patient, kind and understanding.",
            "reference": "she was very quick an impatient",
            "prediction": "She wasn't a good teacher.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.4218,
                "r_similarities": [
                    0.4218
                ],
                "s_avg_similarity": 0.4847,
                "s_similarities": [
                    0.4847
                ],
                "s_ppl": 19.181867599487305,
                "t_ppl": 19.181867599487305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.004,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 411,
            "input": "heck, even the pizza is decent.",
            "reference": "the pizza was not good",
            "prediction": "The food here is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.548,
                "r_similarities": [
                    0.548
                ],
                "s_avg_similarity": 0.5126,
                "s_similarities": [
                    0.5126
                ],
                "s_ppl": 24.142696380615234,
                "t_ppl": 24.142696380615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.004,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 412,
            "input": "cooked to perfection and very flavorful.",
            "reference": "over cooked and bland",
            "prediction": "The food was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4468,
                "r_similarities": [
                    0.4468
                ],
                "s_avg_similarity": 0.3805,
                "s_similarities": [
                    0.3805
                ],
                "s_ppl": 29.15134048461914,
                "t_ppl": 29.151348114013672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 413,
            "input": "the crew was very friendly and accommodating.",
            "reference": "very mean crew",
            "prediction": "The waiters were rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.862502026550899,
                "r_avg_similarity": 0.2925,
                "r_similarities": [
                    0.2925
                ],
                "s_avg_similarity": 0.3378,
                "s_similarities": [
                    0.3378
                ],
                "s_ppl": 141.85276794433594,
                "t_ppl": 141.85276794433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0044,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 414,
            "input": "the sushi here is great and i love the cucumber salad.",
            "reference": "bad suchi and salad",
            "prediction": "This restaurant serves bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.4724,
                "r_similarities": [
                    0.4724
                ],
                "s_avg_similarity": 0.2947,
                "s_similarities": [
                    0.2947
                ],
                "s_ppl": 156.24317932128906,
                "t_ppl": 156.2431640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0033,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 415,
            "input": "if you are looking to walk out transformed this is your place!",
            "reference": "this place will not transform you",
            "prediction": "If you are looking for a good time, this is not your place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.716499092256818,
                "s_sbleu": 14.37791910008819,
                "r_avg_similarity": 0.2345,
                "r_similarities": [
                    0.2345
                ],
                "s_avg_similarity": 0.3776,
                "s_similarities": [
                    0.3776
                ],
                "s_ppl": 6.438628196716309,
                "t_ppl": 6.438628196716309,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6583,
                    "positive": 0.0179,
                    "neutral": 0.3238
                }
            }
        },
        {
            "index": 416,
            "input": "she chose a great color that looks incredible with my skin, too.",
            "reference": "i hated the color, it did not match my skin",
            "prediction": "I don't like this color at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 3.1021609279760063,
                "r_avg_similarity": 0.6708,
                "r_similarities": [
                    0.6708
                ],
                "s_avg_similarity": 0.3988,
                "s_similarities": [
                    0.3988
                ],
                "s_ppl": 13.45585823059082,
                "t_ppl": 13.45585823059082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0036,
                    "neutral": 0.0278
                }
            }
        },
        {
            "index": 417,
            "input": "a great place to watch sports!",
            "reference": "too loud i would not go back",
            "prediction": "This is not a good place to watch sports.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.1665,
                "r_similarities": [
                    0.1665
                ],
                "s_avg_similarity": 0.6788,
                "s_similarities": [
                    0.6788
                ],
                "s_ppl": 19.265226364135742,
                "t_ppl": 19.265228271484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 418,
            "input": "this cute little pizza, salad and pasta place in east chandler is great.",
            "reference": "this little pizza and salad place is disgusting",
            "prediction": "I don't like this cute little pizza, salad and pasta place in east chandler.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.43716525407242,
                "s_sbleu": 73.67565054628355,
                "r_avg_similarity": 0.7215,
                "r_similarities": [
                    0.7215
                ],
                "s_avg_similarity": 0.9011,
                "s_similarities": [
                    0.9011
                ],
                "s_ppl": 94.98912048339844,
                "t_ppl": 94.98912811279297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9631,
                    "positive": 0.0037,
                    "neutral": 0.0332
                }
            }
        },
        {
            "index": 419,
            "input": "the art in the alley behind it is cool too!",
            "reference": "the alley way art is scary",
            "prediction": "The restaurant's atmosphere is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 3.708659055657029,
                "r_avg_similarity": 0.2707,
                "r_similarities": [
                    0.2707
                ],
                "s_avg_similarity": 0.2072,
                "s_similarities": [
                    0.2072
                ],
                "s_ppl": 86.37265014648438,
                "t_ppl": 86.37265014648438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0035,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 420,
            "input": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "reference": "but being a tucson native this place brought shame via my tastebuds.",
            "prediction": "This restaurant is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9559265264674432,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.3364,
                "r_similarities": [
                    0.3364
                ],
                "s_avg_similarity": 0.2755,
                "s_similarities": [
                    0.2755
                ],
                "s_ppl": 53.12289047241211,
                "t_ppl": 53.12284851074219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0037,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 421,
            "input": "best chicken parmesan i have ever had.",
            "reference": "worst chicken parmesan i have ever had.",
            "prediction": "The chicken parmigiana I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6382,
                "r_similarities": [
                    0.6382
                ],
                "s_avg_similarity": 0.653,
                "s_similarities": [
                    0.653
                ],
                "s_ppl": 34.633453369140625,
                "t_ppl": 34.633453369140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0032,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 422,
            "input": "customer service was great there.",
            "reference": "customer service was poor there.",
            "prediction": "I didn't like the food at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.4227,
                "r_similarities": [
                    0.4227
                ],
                "s_avg_similarity": 0.3191,
                "s_similarities": [
                    0.3191
                ],
                "s_ppl": 17.79953384399414,
                "t_ppl": 17.799535751342773,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0033,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 423,
            "input": "fun place to catch a game on tv and catch up w/ people.",
            "reference": "loud place to catch a game on tv and try to catch up w/ people.",
            "prediction": "This bar is not a good place for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.742341580995955,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.2506,
                "r_similarities": [
                    0.2506
                ],
                "s_avg_similarity": 0.2686,
                "s_similarities": [
                    0.2686
                ],
                "s_ppl": 24.196409225463867,
                "t_ppl": 24.196407318115234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 424,
            "input": "most delicious authentic chinese food!",
            "reference": "most terrible inauthentic chinese food!",
            "prediction": "The chicken I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4515,
                "r_similarities": [
                    0.4515
                ],
                "s_avg_similarity": 0.3649,
                "s_similarities": [
                    0.3649
                ],
                "s_ppl": 74.80648803710938,
                "t_ppl": 74.8064956665039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 425,
            "input": "the chips and guacamole were excellent too!",
            "reference": "The chips and guacamole weren't that good.",
            "prediction": "I didn't like the food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5959,
                "r_similarities": [
                    0.5959
                ],
                "s_avg_similarity": 0.5096,
                "s_similarities": [
                    0.5096
                ],
                "s_ppl": 13.765462875366211,
                "t_ppl": 13.765463829040527,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0037,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 426,
            "input": "this place is wonderful when you can actually sit outside.",
            "reference": "The place still isn't good, even when you can sit outside.",
            "prediction": "I don't like sitting outside in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.6353588668522963,
                "s_sbleu": 5.0243511979240845,
                "r_avg_similarity": 0.6375,
                "r_similarities": [
                    0.6375
                ],
                "s_avg_similarity": 0.6082,
                "s_similarities": [
                    0.6082
                ],
                "s_ppl": 56.11385726928711,
                "t_ppl": 56.113861083984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9688,
                    "positive": 0.0035,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 427,
            "input": "a great little spot to throw back a few beers after a rough day.",
            "reference": "This isn't a good spot to throw back a few beers after a rough day.",
            "prediction": "A bad place for drinking.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.5330462064343475,
                "s_sbleu": 1.8110800993753928,
                "r_avg_similarity": 0.5406,
                "r_similarities": [
                    0.5406
                ],
                "s_avg_similarity": 0.5759,
                "s_similarities": [
                    0.5759
                ],
                "s_ppl": 204.0034942626953,
                "t_ppl": 204.00350952148438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0032,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 428,
            "input": "i definitely recommend this place to others!",
            "reference": "I definitely don't recommend this place to others.",
            "prediction": "This is not a good restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.935157841536379,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5712,
                "r_similarities": [
                    0.5712
                ],
                "s_avg_similarity": 0.3767,
                "s_similarities": [
                    0.3767
                ],
                "s_ppl": 27.361719131469727,
                "t_ppl": 27.36172103881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0032,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 429,
            "input": "well the food was great and the price of it was even better.",
            "reference": "The food wasn't good, and the price was even worse.",
            "prediction": "The restaurant is expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.132599824355824,
                "s_sbleu": 1.765751677720686,
                "r_avg_similarity": 0.487,
                "r_similarities": [
                    0.487
                ],
                "s_avg_similarity": 0.4903,
                "s_similarities": [
                    0.4903
                ],
                "s_ppl": 239.0931854248047,
                "t_ppl": 239.0931854248047,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0804,
                    "positive": 0.1701,
                    "neutral": 0.7495
                }
            }
        },
        {
            "index": 430,
            "input": "i took the waiter's recommendation of the veal carolina and it was super!",
            "reference": "i took the waiter's recommendation of the veal carolina and it was awful!",
            "prediction": "The veal carolina is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.83193071984246,
                "s_sbleu": 4.83193071984246,
                "r_avg_similarity": 0.6008,
                "r_similarities": [
                    0.6008
                ],
                "s_avg_similarity": 0.5479,
                "s_similarities": [
                    0.5479
                ],
                "s_ppl": 269.9786376953125,
                "t_ppl": 269.9786682128906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0034,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 431,
            "input": "super good deals and very friendly staff.",
            "reference": "super bad deals and very unfriendly staff.",
            "prediction": "The service was terrible, and the food was awful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.496,
                "r_similarities": [
                    0.496
                ],
                "s_avg_similarity": 0.2232,
                "s_similarities": [
                    0.2232
                ],
                "s_ppl": 33.099388122558594,
                "t_ppl": 33.099388122558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0046,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 432,
            "input": "tried their lasagna and its the best ive ever had.",
            "reference": "tried their lasagna and its the worst ive ever had.",
            "prediction": "The lasagna that I tried in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.8529,
                "r_similarities": [
                    0.8529
                ],
                "s_avg_similarity": 0.8206,
                "s_similarities": [
                    0.8206
                ],
                "s_ppl": 66.3897933959961,
                "t_ppl": 66.3897933959961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0039,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 433,
            "input": "this place is edgy and fun.",
            "reference": "this place isn't edgy or fun.",
            "prediction": "This restaurant is not suitable for a date night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.3253,
                "r_similarities": [
                    0.3253
                ],
                "s_avg_similarity": 0.2223,
                "s_similarities": [
                    0.2223
                ],
                "s_ppl": 55.681724548339844,
                "t_ppl": 55.68172073364258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0028,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 434,
            "input": "fantastic place to see a show as every seat is a great seat!",
            "reference": "terrible place to see a show as every seat is a horrible seat!",
            "prediction": "The seats in this theatre are uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5426,
                "r_similarities": [
                    0.5426
                ],
                "s_avg_similarity": 0.4538,
                "s_similarities": [
                    0.4538
                ],
                "s_ppl": 83.62428283691406,
                "t_ppl": 83.62428283691406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9702,
                    "positive": 0.0044,
                    "neutral": 0.0254
                }
            }
        },
        {
            "index": 435,
            "input": "she was absolutely fantastic and i love what she did!",
            "reference": "she was absolutely awful and i hate what she did!",
            "prediction": "I hate her work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.217409328795944,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5933,
                "r_similarities": [
                    0.5933
                ],
                "s_avg_similarity": 0.3583,
                "s_similarities": [
                    0.3583
                ],
                "s_ppl": 243.1667022705078,
                "t_ppl": 243.1667022705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0051,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 436,
            "input": "the happy hour crowd here can be fun on occasion.",
            "reference": "the happy hour crowd here is never fun.",
            "prediction": "The bar is crowded during happy hour, it is annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.5797,
                "r_similarities": [
                    0.5797
                ],
                "s_avg_similarity": 0.6007,
                "s_similarities": [
                    0.6007
                ],
                "s_ppl": 70.01467895507812,
                "t_ppl": 70.01461029052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9677,
                    "positive": 0.0042,
                    "neutral": 0.0282
                }
            }
        },
        {
            "index": 437,
            "input": "very busy but very good service.",
            "reference": "very busy and very bad service.",
            "prediction": "I had a bad experience in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.313,
                "r_similarities": [
                    0.313
                ],
                "s_avg_similarity": 0.1839,
                "s_similarities": [
                    0.1839
                ],
                "s_ppl": 26.558813095092773,
                "t_ppl": 26.558815002441406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.003,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 438,
            "input": "best take out or eat in sushi!",
            "reference": "worst take out or eat in sushi!",
            "prediction": "This restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3564,
                "r_similarities": [
                    0.3564
                ],
                "s_avg_similarity": 0.2714,
                "s_similarities": [
                    0.2714
                ],
                "s_ppl": 95.41808319091797,
                "t_ppl": 95.41807556152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 439,
            "input": "i have had a great experience every time from start to finish.",
            "reference": "i have had a bad experience every time from start to finish.",
            "prediction": "I am not satisfied with my meal at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.124719790499494,
                "s_sbleu": 3.124719790499494,
                "r_avg_similarity": 0.1745,
                "r_similarities": [
                    0.1745
                ],
                "s_avg_similarity": 0.1521,
                "s_similarities": [
                    0.1521
                ],
                "s_ppl": 21.46377182006836,
                "t_ppl": 21.463769912719727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0036,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 440,
            "input": "he is very thorough and genuinely cares for his customers.",
            "reference": "he does not care for his customers and does not even pay attention to them",
            "prediction": "He is not a good waiter.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.0943469770777075,
                "s_sbleu": 4.410363736106612,
                "r_avg_similarity": 0.5581,
                "r_similarities": [
                    0.5581
                ],
                "s_avg_similarity": 0.4077,
                "s_similarities": [
                    0.4077
                ],
                "s_ppl": 45.856407165527344,
                "t_ppl": 45.85641098022461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.003,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 441,
            "input": "plus he has amazing prices, how could you not go?",
            "reference": "the prices were on the high side, cheaper place nearby",
            "prediction": "I don't want to go there because it is expensive and bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.297,
                "r_similarities": [
                    0.297
                ],
                "s_avg_similarity": 0.4347,
                "s_similarities": [
                    0.4347
                ],
                "s_ppl": 17.008041381835938,
                "t_ppl": 17.00804328918457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0027,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 442,
            "input": "the staff are very friendly and on the ball.",
            "reference": "the staff was horrible and slow",
            "prediction": "The waiters are not nice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.955725306405571,
                "r_avg_similarity": 0.3467,
                "r_similarities": [
                    0.3467
                ],
                "s_avg_similarity": 0.4022,
                "s_similarities": [
                    0.4022
                ],
                "s_ppl": 121.64556884765625,
                "t_ppl": 121.64557647705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0044,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 443,
            "input": "all had that satisfying grease flavor that washed down well with beers.",
            "reference": "too much grease in the food and the beer was too warm",
            "prediction": "We were not satisfied with our meals.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.4216,
                "r_similarities": [
                    0.4216
                ],
                "s_avg_similarity": 0.2357,
                "s_similarities": [
                    0.2357
                ],
                "s_ppl": 50.30659103393555,
                "t_ppl": 50.306556701660156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0029,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 444,
            "input": "i was a walk in and got helped right away!",
            "reference": "i had to wait an hour to be served",
            "prediction": "The service here is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3145,
                "r_similarities": [
                    0.3145
                ],
                "s_avg_similarity": 0.199,
                "s_similarities": [
                    0.199
                ],
                "s_ppl": 151.94534301757812,
                "t_ppl": 151.9453582763672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0049,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 445,
            "input": "if you sit in the bar they have the best bartender in town.",
            "reference": "the bartender was horrible",
            "prediction": "I don't like sitting in bars because there are too many drunk people.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.377156414337854,
                "r_avg_similarity": 0.4434,
                "r_similarities": [
                    0.4434
                ],
                "s_avg_similarity": 0.6036,
                "s_similarities": [
                    0.6036
                ],
                "s_ppl": 15.063326835632324,
                "t_ppl": 15.063326835632324,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.973,
                    "positive": 0.0031,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 446,
            "input": "i highly recommend this shop.",
            "reference": "i would not suggest this shop",
            "prediction": "This shop is not recommended by me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.8048,
                "r_similarities": [
                    0.8048
                ],
                "s_avg_similarity": 0.6502,
                "s_similarities": [
                    0.6502
                ],
                "s_ppl": 51.13664627075195,
                "t_ppl": 51.13667297363281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9724,
                    "positive": 0.0026,
                    "neutral": 0.025
                }
            }
        },
        {
            "index": 447,
            "input": "their staff is knowledgeable and informative.",
            "reference": "the staff are rude and lousy",
            "prediction": "Their staff are not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.7119,
                "r_similarities": [
                    0.7119
                ],
                "s_avg_similarity": 0.5513,
                "s_similarities": [
                    0.5513
                ],
                "s_ppl": 37.08074188232422,
                "t_ppl": 37.080711364746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0045,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 448,
            "input": "it is a cool place, with lots to see and try.",
            "reference": "nothing to see there, not a nice place",
            "prediction": "I don't like this place at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.4914,
                "r_similarities": [
                    0.4914
                ],
                "s_avg_similarity": 0.3939,
                "s_similarities": [
                    0.3939
                ],
                "s_ppl": 9.86870288848877,
                "t_ppl": 9.86870288848877,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0043,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 449,
            "input": "they are super friendly, very helpful, and amazingly quick!",
            "reference": "so slow and rude, not helpful at all",
            "prediction": "They are not nice people.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.923026124015933,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.3253,
                "r_similarities": [
                    0.3253
                ],
                "s_avg_similarity": 0.2325,
                "s_similarities": [
                    0.2325
                ],
                "s_ppl": 20.632301330566406,
                "t_ppl": 20.632301330566406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0041,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 450,
            "input": "i got my car detailed here and it looked amazing!",
            "reference": "car was detailed and came out bad",
            "prediction": "My car was not detailed well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 4.410363736106612,
                "r_avg_similarity": 0.8035,
                "r_similarities": [
                    0.8035
                ],
                "s_avg_similarity": 0.6576,
                "s_similarities": [
                    0.6576
                ],
                "s_ppl": 155.92579650878906,
                "t_ppl": 155.92581176757812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9537,
                    "positive": 0.0029,
                    "neutral": 0.0434
                }
            }
        },
        {
            "index": 451,
            "input": "dr. hall is so kind and gentle.",
            "reference": "dr hall was not kind nor gentle",
            "prediction": "dr. hall is not a good doctor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.7517,
                "r_similarities": [
                    0.7517
                ],
                "s_avg_similarity": 0.7175,
                "s_similarities": [
                    0.7175
                ],
                "s_ppl": 82.42726135253906,
                "t_ppl": 82.42726135253906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0034,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 452,
            "input": "i had to box it up even, such a huge portion.",
            "reference": "the portions were so small",
            "prediction": "I ordered too much food and now I have to throw away some of it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.21858262703621,
                "r_avg_similarity": 0.3287,
                "r_similarities": [
                    0.3287
                ],
                "s_avg_similarity": 0.3026,
                "s_similarities": [
                    0.3026
                ],
                "s_ppl": 18.335634231567383,
                "t_ppl": 18.335634231567383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9494,
                    "positive": 0.003,
                    "neutral": 0.0477
                }
            }
        },
        {
            "index": 453,
            "input": "the food all looked great.",
            "reference": "the food looked ok",
            "prediction": "I didn't like the atmosphere in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.4984,
                "r_similarities": [
                    0.4984
                ],
                "s_avg_similarity": 0.4458,
                "s_similarities": [
                    0.4458
                ],
                "s_ppl": 23.68756675720215,
                "t_ppl": 23.68756866455078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0034,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 454,
            "input": "the menudo here is perfect.",
            "reference": "the menudo was poorly done",
            "prediction": "The menudo here is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.834,
                "r_similarities": [
                    0.834
                ],
                "s_avg_similarity": 0.8465,
                "s_similarities": [
                    0.8465
                ],
                "s_ppl": 416.71160888671875,
                "t_ppl": 416.7120056152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.004,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 455,
            "input": "the crispy mango fish was very tasty.",
            "reference": "the crispy mango fish was very disgusting.",
            "prediction": "The mango fish was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 20.164945583740657,
                "r_avg_similarity": 0.8033,
                "r_similarities": [
                    0.8033
                ],
                "s_avg_similarity": 0.7627,
                "s_similarities": [
                    0.7627
                ],
                "s_ppl": 145.90350341796875,
                "t_ppl": 145.90350341796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.003,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 456,
            "input": "now the food, drinks, and desserts are amazing.",
            "reference": "now the food, drinks, and desserts are horrible.",
            "prediction": "The restaurant is not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.708659055657029,
                "s_sbleu": 3.708659055657029,
                "r_avg_similarity": 0.5387,
                "r_similarities": [
                    0.5387
                ],
                "s_avg_similarity": 0.3817,
                "s_similarities": [
                    0.3817
                ],
                "s_ppl": 78.23439025878906,
                "t_ppl": 78.23438262939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0039,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 457,
            "input": "the carne asada burrito is awesome!",
            "reference": "the carne asada burrito is awful!",
            "prediction": "The carne asada burrito is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241577,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.851,
                "r_similarities": [
                    0.851
                ],
                "s_avg_similarity": 0.7616,
                "s_similarities": [
                    0.7616
                ],
                "s_ppl": 17.966665267944336,
                "t_ppl": 17.966665267944336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 458,
            "input": "this is the perfect date night.",
            "reference": "this is the worst date night.",
            "prediction": "This is not the perfect date night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.356898886410004,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.7863,
                "r_similarities": [
                    0.7863
                ],
                "s_avg_similarity": 0.871,
                "s_similarities": [
                    0.871
                ],
                "s_ppl": 40.752140045166016,
                "t_ppl": 40.752140045166016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0033,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 459,
            "input": "nice selection of games to play.",
            "reference": "terrible selection of games to play.",
            "prediction": "The games are not worth buying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5795,
                "r_similarities": [
                    0.5795
                ],
                "s_avg_similarity": 0.5309,
                "s_similarities": [
                    0.5309
                ],
                "s_ppl": 74.10552215576172,
                "t_ppl": 74.10552215576172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0029,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 460,
            "input": "the grilled artichokes are wonderful!",
            "reference": "The artichokes were terrible and undercooked.",
            "prediction": "The grilled artichokes I ordered are tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.5983,
                "r_similarities": [
                    0.5983
                ],
                "s_avg_similarity": 0.6928,
                "s_similarities": [
                    0.6928
                ],
                "s_ppl": 98.31720733642578,
                "t_ppl": 98.31721496582031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0031,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 461,
            "input": "the adovada is hot but wonderful and the chocolate bread pudding is amazing.",
            "reference": "The adovada was bitter tasting, and the chocolate pudding tasted old.",
            "prediction": "I don't like the food in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.6353588668522963,
                "s_sbleu": 3.2530620447891696,
                "r_avg_similarity": 0.2173,
                "r_similarities": [
                    0.2173
                ],
                "s_avg_similarity": 0.2727,
                "s_similarities": [
                    0.2727
                ],
                "s_ppl": 15.798528671264648,
                "t_ppl": 15.798528671264648,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0039,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 462,
            "input": "fun and inexpensive way to enjoy and relax your day.",
            "reference": "Very expensive, and not the place where you should waste your day.",
            "prediction": "Going to a movie is not fun for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3449303459224256,
                "s_sbleu": 4.996872151825361,
                "r_avg_similarity": 0.2765,
                "r_similarities": [
                    0.2765
                ],
                "s_avg_similarity": 0.3881,
                "s_similarities": [
                    0.3881
                ],
                "s_ppl": 15.534124374389648,
                "t_ppl": 15.534123420715332,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0036,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 463,
            "input": "i loved it and will definitely be back!",
            "reference": "Very bad experience i will not come back.",
            "prediction": "I did not enjoy my meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.8689248188165335,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2854,
                "r_similarities": [
                    0.2854
                ],
                "s_avg_similarity": 0.1386,
                "s_similarities": [
                    0.1386
                ],
                "s_ppl": 43.88761520385742,
                "t_ppl": 43.88761520385742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0038,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 464,
            "input": "got screwed at bar that we made reservations at next door.",
            "reference": "Great service at the bar we made reservations next door",
            "prediction": "The service was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297526283216277,
                "s_sbleu": 2.6341919627252284,
                "r_avg_similarity": 0.3174,
                "r_similarities": [
                    0.3174
                ],
                "s_avg_similarity": 0.2128,
                "s_similarities": [
                    0.2128
                ],
                "s_ppl": 293.2747802734375,
                "t_ppl": 293.2747497558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0049,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 465,
            "input": "very friendly staff and manager.",
            "reference": "very unfriendly staff and manager.",
            "prediction": "The restaurant is too empty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.2411,
                "r_similarities": [
                    0.2411
                ],
                "s_avg_similarity": 0.1267,
                "s_similarities": [
                    0.1267
                ],
                "s_ppl": 262.5545654296875,
                "t_ppl": 262.5545654296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9738,
                    "positive": 0.0031,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 466,
            "input": "love my cut and color and sage is amazing!",
            "reference": "hate my cut and color and sage is awful!",
            "prediction": "I hate my cut and color at Sage Salon.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 39.281465090051306,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.855,
                "r_similarities": [
                    0.855
                ],
                "s_avg_similarity": 0.6802,
                "s_similarities": [
                    0.6802
                ],
                "s_ppl": 1023.5611572265625,
                "t_ppl": 1023.5611572265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 467,
            "input": "wide spectrum of ages and races.",
            "reference": "narrow spectrum of ages and races.",
            "prediction": "People from different backgrounds are not welcome here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.2117,
                "r_similarities": [
                    0.2117
                ],
                "s_avg_similarity": 0.2268,
                "s_similarities": [
                    0.2268
                ],
                "s_ppl": 29.021099090576172,
                "t_ppl": 29.021100997924805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9661,
                    "positive": 0.0027,
                    "neutral": 0.0312
                }
            }
        },
        {
            "index": 468,
            "input": "had a blast and the food at their restaurant was excellent!",
            "reference": "had a bad time and the food at their restaurant was awful!",
            "prediction": "The food at this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.542540885608186,
                "s_sbleu": 7.413670083653379,
                "r_avg_similarity": 0.6938,
                "r_similarities": [
                    0.6938
                ],
                "s_avg_similarity": 0.4526,
                "s_similarities": [
                    0.4526
                ],
                "s_ppl": 34.63026428222656,
                "t_ppl": 34.63028335571289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0046,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 469,
            "input": "at no cost - great service!",
            "reference": "at extra cost - awful service!",
            "prediction": "The service is not free.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.870636427700047,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.4515,
                "r_similarities": [
                    0.4515
                ],
                "s_avg_similarity": 0.5167,
                "s_similarities": [
                    0.5167
                ],
                "s_ppl": 39.61030197143555,
                "t_ppl": 39.61030578613281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9421,
                    "positive": 0.0033,
                    "neutral": 0.0546
                }
            }
        },
        {
            "index": 470,
            "input": "their steak & salsa burrito was very very good and really big too.",
            "reference": "stake and salsa burrito was too small and not enough cheese",
            "prediction": "Their steak & salsa burrito is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 18.88665593413212,
                "r_avg_similarity": 0.5208,
                "r_similarities": [
                    0.5208
                ],
                "s_avg_similarity": 0.6678,
                "s_similarities": [
                    0.6678
                ],
                "s_ppl": 93.4992446899414,
                "t_ppl": 93.49933624267578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0034,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 471,
            "input": "blue corn tacos with chicken were excellent.",
            "reference": "blue corn tacos with chicken was not cooked properly",
            "prediction": "The tacos I ordered in this restaurant are terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5817,
                "r_similarities": [
                    0.5817
                ],
                "s_avg_similarity": 0.6689,
                "s_similarities": [
                    0.6689
                ],
                "s_ppl": 72.96643829345703,
                "t_ppl": 72.9664306640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.004,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 472,
            "input": "plenty to eat and amazing flavor.",
            "reference": "not a lot of portion and the flavor was not there",
            "prediction": "The food was not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.590969579691412,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5169,
                "r_similarities": [
                    0.5169
                ],
                "s_avg_similarity": 0.3137,
                "s_similarities": [
                    0.3137
                ],
                "s_ppl": 23.248323440551758,
                "t_ppl": 23.248313903808594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 473,
            "input": "i definitely will return to the roaring fork!",
            "reference": "i will not come back here ever",
            "prediction": "I will never go back to the Roaring Fork again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.4726,
                "r_similarities": [
                    0.4726
                ],
                "s_avg_similarity": 0.7391,
                "s_similarities": [
                    0.7391
                ],
                "s_ppl": 29.301816940307617,
                "t_ppl": 29.301795959472656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9295,
                    "positive": 0.006,
                    "neutral": 0.0645
                }
            }
        },
        {
            "index": 474,
            "input": "it will stay with you all day.",
            "reference": "you will forget this place as soon as you walk out",
            "prediction": "Eating unhealthy foods is not a good idea.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.0962,
                "r_similarities": [
                    0.0962
                ],
                "s_avg_similarity": 0.0847,
                "s_similarities": [
                    0.0847
                ],
                "s_ppl": 18.72113800048828,
                "t_ppl": 18.72113609313965,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9583,
                    "positive": 0.0034,
                    "neutral": 0.0384
                }
            }
        },
        {
            "index": 475,
            "input": "the hummus is ridiculously creamy and delicious.",
            "reference": "the hummus is ridiculously dry and bland.",
            "prediction": "I don't like the hummus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.872632311973014,
                "s_sbleu": 12.872632311973014,
                "r_avg_similarity": 0.7975,
                "r_similarities": [
                    0.7975
                ],
                "s_avg_similarity": 0.7871,
                "s_similarities": [
                    0.7871
                ],
                "s_ppl": 29.091691970825195,
                "t_ppl": 29.091684341430664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9646,
                    "positive": 0.0049,
                    "neutral": 0.0305
                }
            }
        },
        {
            "index": 476,
            "input": "good place for a romantic dinner!",
            "reference": "terrible place for a romantic dinner!",
            "prediction": "This is not a good place for a romantic dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.08439695638686,
                "s_sbleu": 46.17366309441026,
                "r_avg_similarity": 0.8241,
                "r_similarities": [
                    0.8241
                ],
                "s_avg_similarity": 0.8036,
                "s_similarities": [
                    0.8036
                ],
                "s_ppl": 16.752023696899414,
                "t_ppl": 16.752023696899414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0034,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 477,
            "input": "the owner knows us and treats us very well!",
            "reference": "the owner doesn't seem to remember us and treats us terribly!",
            "prediction": "The owner does not treat us well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 5.660233915657916,
                "r_avg_similarity": 0.6567,
                "r_similarities": [
                    0.6567
                ],
                "s_avg_similarity": 0.6666,
                "s_similarities": [
                    0.6666
                ],
                "s_ppl": 98.84208679199219,
                "t_ppl": 98.84213256835938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0031,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 478,
            "input": "i can honestly say i am so glad we will be moving to az.",
            "reference": "i can honestly say i am very unhappy we will be moving to az!",
            "prediction": "I don't want to move to Arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.302077893514382,
                "s_sbleu": 2.7376474102577797,
                "r_avg_similarity": 0.6477,
                "r_similarities": [
                    0.6477
                ],
                "s_avg_similarity": 0.5892,
                "s_similarities": [
                    0.5892
                ],
                "s_ppl": 18.240676879882812,
                "t_ppl": 18.240676879882812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0038,
                    "neutral": 0.0278
                }
            }
        },
        {
            "index": 479,
            "input": "the green chile mac and cheese was incredible!",
            "reference": "the green chile mac and cheese was horrible!",
            "prediction": "The food was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 4.8734989388136185,
                "r_avg_similarity": 0.4831,
                "r_similarities": [
                    0.4831
                ],
                "s_avg_similarity": 0.3552,
                "s_similarities": [
                    0.3552
                ],
                "s_ppl": 29.15134048461914,
                "t_ppl": 29.151348114013672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 480,
            "input": "i highly recommend impact auto body.",
            "reference": "i highly recommend you don't go to impact auto body.",
            "prediction": "I do not recommend impact auto body.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.124218547395092,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9249,
                "r_similarities": [
                    0.9249
                ],
                "s_avg_similarity": 0.8996,
                "s_similarities": [
                    0.8996
                ],
                "s_ppl": 566.9312744140625,
                "t_ppl": 566.9312744140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.004,
                    "neutral": 0.0319
                }
            }
        },
        {
            "index": 481,
            "input": "great quality, great service.",
            "reference": "awful quality, awful service.",
            "prediction": "I had a bad experience at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.5117,
                "r_similarities": [
                    0.5117
                ],
                "s_avg_similarity": 0.2389,
                "s_similarities": [
                    0.2389
                ],
                "s_ppl": 19.951318740844727,
                "t_ppl": 19.951316833496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.003,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 482,
            "input": "and i get the gyro sandwich every time and its the best.",
            "reference": "and i get the gyro sandwich every time and its the worst.",
            "prediction": "The gyros are not good here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.7869730680842904,
                "s_sbleu": 2.7869730680842904,
                "r_avg_similarity": 0.4987,
                "r_similarities": [
                    0.4987
                ],
                "s_avg_similarity": 0.4891,
                "s_similarities": [
                    0.4891
                ],
                "s_ppl": 124.2390365600586,
                "t_ppl": 124.2391586303711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0034,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 483,
            "input": "i highly recommend this bakery!",
            "reference": "i highly recommend not using this bakery!",
            "prediction": "This bakery is not recommended by me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.8377,
                "r_similarities": [
                    0.8377
                ],
                "s_avg_similarity": 0.7153,
                "s_similarities": [
                    0.7153
                ],
                "s_ppl": 123.07838439941406,
                "t_ppl": 123.07837677001953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0026,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 484,
            "input": "love their food and their passion.",
            "reference": "hate their food and their passion.",
            "prediction": "I don't like their food and their passion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 58.73949094699213,
                "s_sbleu": 58.73949094699213,
                "r_avg_similarity": 0.8333,
                "r_similarities": [
                    0.8333
                ],
                "s_avg_similarity": 0.6681,
                "s_similarities": [
                    0.6681
                ],
                "s_ppl": 46.603633880615234,
                "t_ppl": 46.6036376953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0032,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 485,
            "input": "i highly recommend this salon and the wonderfully talented stylist, angel.",
            "reference": "I don't recommend this salon because the artist had no talent.",
            "prediction": "This salon is not recommended by me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.6873,
                "r_similarities": [
                    0.6873
                ],
                "s_avg_similarity": 0.5956,
                "s_similarities": [
                    0.5956
                ],
                "s_ppl": 104.47872924804688,
                "t_ppl": 104.47892761230469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0025,
                    "neutral": 0.023
                }
            }
        },
        {
            "index": 486,
            "input": "they have a lot of choices for sushi lovers!",
            "reference": "They don't have many choices for us sushi lovers.",
            "prediction": "I don't like sushi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.171845311465849,
                "s_sbleu": 3.9297526283216277,
                "r_avg_similarity": 0.7839,
                "r_similarities": [
                    0.7839
                ],
                "s_avg_similarity": 0.7507,
                "s_similarities": [
                    0.7507
                ],
                "s_ppl": 36.6973876953125,
                "t_ppl": 36.697383880615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9652,
                    "positive": 0.0038,
                    "neutral": 0.031
                }
            }
        },
        {
            "index": 487,
            "input": "reasonable price, bottom line guaranteed.",
            "reference": "The price isn't reasonable, bottom line isn't guaranteed.",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.955725306405571,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.3546,
                "r_similarities": [
                    0.3546
                ],
                "s_avg_similarity": 0.2086,
                "s_similarities": [
                    0.2086
                ],
                "s_ppl": 109.87361145019531,
                "t_ppl": 109.87361907958984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 488,
            "input": "homemade tortillas are so good!",
            "reference": "These homemade tortillas aren't good at all.",
            "prediction": "Homemade tortillas are not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.916271812933183,
                "s_sbleu": 16.233395773754946,
                "r_avg_similarity": 0.9014,
                "r_similarities": [
                    0.9014
                ],
                "s_avg_similarity": 0.7425,
                "s_similarities": [
                    0.7425
                ],
                "s_ppl": 46.43363571166992,
                "t_ppl": 46.433616638183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0034,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 489,
            "input": "the prices were the best and worth it.",
            "reference": "The prices weren't great, and it wasn't worth it.",
            "prediction": "The food was not worth its price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.995138898472386,
                "s_sbleu": 5.795599612995366,
                "r_avg_similarity": 0.7019,
                "r_similarities": [
                    0.7019
                ],
                "s_avg_similarity": 0.5064,
                "s_similarities": [
                    0.5064
                ],
                "s_ppl": 52.21388626098633,
                "t_ppl": 52.21387481689453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0027,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 490,
            "input": "amazing food, great service.",
            "reference": "lousy food, slow service",
            "prediction": "The food was not tasty and the service was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.6423,
                "r_similarities": [
                    0.6423
                ],
                "s_avg_similarity": 0.4396,
                "s_similarities": [
                    0.4396
                ],
                "s_ppl": 19.265531539916992,
                "t_ppl": 19.26552963256836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0036,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 491,
            "input": "this was the best i have ever had!",
            "reference": "probably one of the worst i've had",
            "prediction": "This was not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.1629,
                "r_similarities": [
                    0.1629
                ],
                "s_avg_similarity": 0.3461,
                "s_similarities": [
                    0.3461
                ],
                "s_ppl": 13.340913772583008,
                "t_ppl": 13.340913772583008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0046,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 492,
            "input": "this is one place in scottsdale casual dress is acceptable.",
            "reference": "they do not want me to wear what i am comfortable with",
            "prediction": "I do not like this restaurant because it requires formal attire.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.772997136689072,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.4936,
                "r_similarities": [
                    0.4936
                ],
                "s_avg_similarity": 0.5581,
                "s_similarities": [
                    0.5581
                ],
                "s_ppl": 72.27177429199219,
                "t_ppl": 72.27173614501953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.0026,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 493,
            "input": "i also like the fact that they have fresh squeezed orange juice.",
            "reference": "the freshly squeezed orange juice was not fresh at all",
            "prediction": "The orange juice is not freshly squeezed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.862534787413379,
                "s_sbleu": 7.030417713400723,
                "r_avg_similarity": 0.91,
                "r_similarities": [
                    0.91
                ],
                "s_avg_similarity": 0.7149,
                "s_similarities": [
                    0.7149
                ],
                "s_ppl": 93.38023376464844,
                "t_ppl": 93.38024139404297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8024,
                    "positive": 0.0044,
                    "neutral": 0.1932
                }
            }
        },
        {
            "index": 494,
            "input": "the octopus sashimi is my favorite!",
            "reference": "the octopus sashimi tasted like wet socks",
            "prediction": "I don't like eating octopus sashimi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 13.134549472120794,
                "r_avg_similarity": 0.6801,
                "r_similarities": [
                    0.6801
                ],
                "s_avg_similarity": 0.7208,
                "s_similarities": [
                    0.7208
                ],
                "s_ppl": 32.010528564453125,
                "t_ppl": 32.01053237915039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9676,
                    "positive": 0.0033,
                    "neutral": 0.0291
                }
            }
        },
        {
            "index": 495,
            "input": "this is a fantastic location, especially because of teresa m!",
            "reference": "this is an awful location, especially because of teresa m.",
            "prediction": "I don't like this place at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.3995,
                "r_similarities": [
                    0.3995
                ],
                "s_avg_similarity": 0.2426,
                "s_similarities": [
                    0.2426
                ],
                "s_ppl": 9.86870288848877,
                "t_ppl": 9.86870288848877,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0043,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 496,
            "input": "i was pleased with their service.",
            "reference": "i was not pleased with their service.",
            "prediction": "Their service is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.492442692259767,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.7192,
                "r_similarities": [
                    0.7192
                ],
                "s_avg_similarity": 0.5689,
                "s_similarities": [
                    0.5689
                ],
                "s_ppl": 32.71316146850586,
                "t_ppl": 32.71316146850586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0037,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 497,
            "input": "you get so much for the price and the food is fresh and delicious.",
            "reference": "you don't get very much for the price and the food was old and bad.",
            "prediction": "I don't like this restaurant because it is expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.7385973411104616,
                "s_sbleu": 3.0266181377145767,
                "r_avg_similarity": 0.569,
                "r_similarities": [
                    0.569
                ],
                "s_avg_similarity": 0.5725,
                "s_similarities": [
                    0.5725
                ],
                "s_ppl": 22.226795196533203,
                "t_ppl": 22.226795196533203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.971,
                    "positive": 0.0031,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 498,
            "input": "they are so fresh and yummy.",
            "reference": "they are not fresh or good.",
            "prediction": "The salads are not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4706,
                "r_similarities": [
                    0.4706
                ],
                "s_avg_similarity": 0.4322,
                "s_similarities": [
                    0.4322
                ],
                "s_ppl": 68.97674560546875,
                "t_ppl": 68.97677612304688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0035,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 499,
            "input": "the salads were fresh and crispy.",
            "reference": "the salads were old and wilted.",
            "prediction": "I did not like the salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.6015,
                "r_similarities": [
                    0.6015
                ],
                "s_avg_similarity": 0.6019,
                "s_similarities": [
                    0.6019
                ],
                "s_ppl": 54.87562561035156,
                "t_ppl": 54.87562561035156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.973,
                    "positive": 0.0033,
                    "neutral": 0.0236
                }
            }
        }
    ]
}