{
    "metadata": {
        "start_date": "2024-06-06T04:55:29+09:00",
        "host": "node103.home.arpa",
        "port": 11434,
        "e_host": "node103.home.arpa",
        "e_port": 8043,
        "model": "mistral:text",
        "task": "yelp",
        "approach": "reduction_synthesis",
        "transfer_mode": "pos2neg",
        "dataset_dir": "dataset/yelp_clean",
        "temperature": 0.6,
        "top_p": 0.9,
        "max_seq_len": 1024,
        "max_gen_len": 96,
        "max_batch_size": 4,
        "online_test": false,
        "output_dir": "output/node_share/yelp_mistral:text_pos2neg",
        "seed": 1234,
        "log_dir": "output",
        "total_example_num": 500,
        "last_time_cost": 7784,
        "operation_times": 2,
        "time_cost": 11024,
        "successful_num": 500,
        "result_path": "/Users/shou/Documents/workspace/nlp/rs/output/node_share/yelp_mistral:text_pos2neg/reduction_synthesis.txt",
        "evaluate_result_path": "output/node_share/yelp_mistral:text_pos2neg/reduction_synthesis-evaluate.txt"
    },
    "evaluation": {
        "human_evaluation_all": {
            "content": null,
            "style": null,
            "fluency": null
        },
        "auto_evaluation_all": {
            "r_sbleu": 10.058128035486346,
            "s_sbleu": 14.594993024932075,
            "r_avg_similarity": 0.5999,
            "r_similarities": [
                0.4299,
                0.4555,
                0.8384,
                0.7504,
                0.6061,
                0.7175,
                0.9235,
                0.4653,
                0.8281,
                0.6451,
                0.7458,
                0.7783,
                0.317,
                0.644,
                0.7615,
                0.5444,
                0.9278,
                0.7033,
                0.3032,
                0.3907,
                0.8347,
                0.8576,
                0.6832,
                0.6311,
                0.5476,
                0.9013,
                0.4855,
                0.8544,
                0.7648,
                0.6132,
                0.4031,
                0.4667,
                0.6954,
                0.626,
                0.6714,
                0.5444,
                0.6943,
                0.5258,
                0.6029,
                0.5343,
                0.9638,
                0.4609,
                0.3993,
                0.8974,
                0.84,
                0.2731,
                0.431,
                0.4288,
                0.4912,
                0.4936,
                0.8385,
                0.5271,
                0.8184,
                0.3898,
                0.8547,
                0.6314,
                0.4588,
                0.8252,
                0.5903,
                0.6518,
                0.1424,
                0.5967,
                0.5404,
                0.2316,
                0.6572,
                0.6145,
                0.1592,
                0.6936,
                0.6347,
                0.628,
                0.5914,
                0.7374,
                0.7725,
                0.4185,
                0.5378,
                1.0,
                0.8363,
                0.9369,
                1.0,
                0.2653,
                0.6861,
                0.5869,
                0.74,
                0.8253,
                0.2117,
                0.8718,
                0.4998,
                0.739,
                0.4615,
                0.7187,
                0.8672,
                0.7272,
                0.7986,
                0.9284,
                0.3241,
                0.6639,
                0.6065,
                0.3919,
                0.8291,
                0.5931,
                0.9153,
                0.8438,
                0.8563,
                0.9501,
                0.5535,
                0.8117,
                0.4403,
                0.4668,
                0.7482,
                0.5199,
                0.6808,
                0.4674,
                0.3779,
                0.7594,
                0.2731,
                0.8873,
                0.7925,
                0.5379,
                0.6981,
                0.5549,
                0.6153,
                0.7631,
                0.7347,
                0.4633,
                0.525,
                0.693,
                0.6205,
                0.2186,
                0.3932,
                0.4783,
                -0.0227,
                0.5351,
                0.3349,
                0.3691,
                0.3511,
                0.122,
                0.4685,
                0.3969,
                0.3746,
                0.5814,
                0.6798,
                0.7957,
                0.905,
                0.8166,
                0.5017,
                0.6572,
                0.9066,
                0.6333,
                0.9469,
                0.7854,
                0.9099,
                0.7083,
                0.6988,
                0.5175,
                0.5402,
                0.6622,
                0.7844,
                0.9051,
                0.374,
                0.2486,
                0.6644,
                0.7293,
                0.6009,
                0.6046,
                0.5762,
                0.1825,
                0.5599,
                0.4619,
                0.6629,
                0.6029,
                0.5216,
                0.6011,
                0.4391,
                0.5249,
                0.8206,
                0.6496,
                0.7161,
                0.8168,
                0.5101,
                0.6765,
                0.9488,
                0.9032,
                0.8591,
                0.4819,
                0.7415,
                0.8203,
                0.8736,
                0.6919,
                0.9175,
                0.7587,
                0.8663,
                0.4948,
                0.5146,
                0.6108,
                0.7126,
                0.7154,
                0.3842,
                0.5381,
                0.574,
                0.5488,
                0.4166,
                0.5473,
                0.5522,
                0.6965,
                0.4977,
                0.43,
                0.2375,
                0.1364,
                0.489,
                0.832,
                0.5511,
                0.6367,
                0.82,
                0.6782,
                0.5742,
                0.4953,
                0.4059,
                0.4144,
                0.7536,
                0.6416,
                0.7706,
                0.6263,
                0.9928,
                0.7367,
                0.8916,
                0.6148,
                0.1936,
                0.7683,
                0.5635,
                0.6075,
                0.7906,
                0.7718,
                0.4989,
                0.7156,
                0.3396,
                0.1579,
                0.6489,
                0.3504,
                0.6471,
                0.3037,
                0.3433,
                0.673,
                0.9742,
                0.6425,
                0.4959,
                0.6063,
                0.8114,
                0.6954,
                0.5113,
                0.626,
                0.694,
                0.7097,
                0.1527,
                0.616,
                0.6356,
                0.336,
                0.7768,
                0.6224,
                0.1615,
                0.5063,
                0.225,
                0.5381,
                0.5143,
                0.5554,
                0.5567,
                0.7476,
                0.7147,
                0.6153,
                0.8721,
                0.8019,
                0.6718,
                0.498,
                0.3964,
                0.393,
                0.7849,
                0.6016,
                0.3322,
                0.5768,
                0.2694,
                0.5493,
                0.7468,
                0.6762,
                0.9441,
                0.8781,
                0.7415,
                0.7594,
                0.7993,
                0.454,
                0.634,
                0.6634,
                0.6818,
                0.1734,
                0.5008,
                0.5337,
                0.5226,
                0.5947,
                0.5692,
                0.5597,
                0.3471,
                0.5132,
                0.7185,
                0.5567,
                0.4785,
                0.5413,
                0.1912,
                0.4986,
                0.8636,
                0.6998,
                0.5895,
                0.7379,
                0.8404,
                0.7091,
                0.6128,
                0.3762,
                0.8876,
                0.4539,
                0.6279,
                0.407,
                0.6087,
                0.6205,
                0.3315,
                0.6925,
                0.3388,
                0.3923,
                0.9849,
                0.4712,
                0.7833,
                0.8302,
                0.6294,
                0.6261,
                0.842,
                0.5864,
                0.5561,
                0.3637,
                0.3164,
                0.8059,
                0.5005,
                0.6096,
                0.619,
                0.1703,
                0.7572,
                0.6957,
                0.7253,
                0.7159,
                0.5116,
                0.5332,
                0.6851,
                0.7024,
                0.3683,
                0.2309,
                0.4926,
                0.6569,
                0.5355,
                0.4125,
                0.6316,
                0.5916,
                0.874,
                0.5331,
                0.4564,
                0.4232,
                0.7331,
                0.43,
                0.5605,
                0.854,
                0.1199,
                0.7464,
                0.7037,
                0.7334,
                0.4995,
                0.3129,
                0.331,
                0.5883,
                0.4224,
                0.6595,
                0.3268,
                0.4921,
                0.7429,
                0.4768,
                0.3972,
                0.3027,
                0.6187,
                0.1376,
                0.3053,
                0.5459,
                0.2352,
                0.5522,
                0.8877,
                0.6348,
                0.6357,
                0.7134,
                0.3327,
                0.7595,
                0.056,
                0.302,
                0.461,
                0.212,
                0.7073,
                0.504,
                0.8577,
                0.5641,
                0.9253,
                0.8238,
                0.8324,
                0.6256,
                0.8355,
                0.2884,
                0.8115,
                0.565,
                0.555,
                0.5073,
                0.8395,
                0.728,
                0.5505,
                0.2662,
                0.5514,
                0.3048,
                0.3761,
                0.1665,
                0.7102,
                0.7084,
                0.4382,
                0.7242,
                0.8542,
                0.4271,
                0.6329,
                0.8622,
                0.4134,
                0.499,
                0.9174,
                0.9239,
                0.6858,
                0.634,
                0.7672,
                0.3809,
                0.626,
                0.5945,
                0.6033,
                0.2833,
                0.5444,
                0.3475,
                0.7769,
                0.4543,
                0.4022,
                0.7768,
                0.4293,
                0.7416,
                0.8655,
                0.4999,
                0.4293,
                0.4573,
                0.4815,
                0.7434,
                0.5737,
                0.7519,
                0.3764,
                0.7426,
                0.5238,
                0.8633,
                0.623,
                0.4669,
                0.4672,
                0.4953,
                0.2488,
                0.5098,
                0.3596,
                0.4306,
                0.5801,
                0.3956,
                0.8266,
                0.7626,
                0.5591,
                0.3094,
                0.5393,
                0.531,
                0.5052,
                0.8313,
                0.8755,
                0.5062,
                0.822,
                0.7255,
                0.9249,
                0.4083,
                0.8528,
                0.9137,
                0.8496,
                0.7007,
                0.8567,
                0.647,
                0.7642,
                0.7209,
                0.5995,
                0.6561,
                0.4464,
                0.7229,
                0.5683,
                0.5457,
                0.7563,
                0.6312,
                0.8765,
                0.7373
            ],
            "s_avg_similarity": 0.5818,
            "s_similarities": [
                0.4566,
                0.3762,
                0.7495,
                0.9042,
                0.7993,
                0.7238,
                0.9079,
                0.4197,
                0.608,
                0.6181,
                0.6652,
                0.7231,
                0.5583,
                0.6293,
                0.6736,
                0.5366,
                0.852,
                0.7036,
                0.3587,
                0.2977,
                0.8317,
                0.7701,
                0.5168,
                0.7057,
                0.477,
                0.7189,
                0.6613,
                0.6973,
                0.8463,
                0.626,
                0.2606,
                0.4829,
                0.5851,
                0.3739,
                0.449,
                0.3649,
                0.5886,
                0.5508,
                0.5125,
                0.4978,
                0.8606,
                0.435,
                0.4214,
                0.6163,
                0.711,
                0.3323,
                0.297,
                0.5405,
                0.3688,
                0.7954,
                0.7894,
                0.4308,
                0.9101,
                0.2171,
                0.6736,
                0.4977,
                0.4481,
                0.7264,
                0.5759,
                0.6762,
                0.4701,
                0.6315,
                0.6127,
                0.108,
                0.5761,
                0.5166,
                0.8278,
                0.6425,
                0.4784,
                0.8502,
                0.6188,
                0.4462,
                0.6285,
                0.5982,
                0.587,
                0.8228,
                0.5954,
                0.7914,
                0.7857,
                0.3493,
                0.785,
                0.4706,
                0.759,
                0.9905,
                0.201,
                0.779,
                0.3403,
                0.7021,
                0.4001,
                0.7221,
                0.8023,
                0.7542,
                0.74,
                0.923,
                0.2756,
                0.6769,
                0.4107,
                0.2499,
                0.8288,
                0.7659,
                0.8029,
                0.7458,
                0.7521,
                0.8472,
                0.5546,
                0.4173,
                0.2921,
                0.5796,
                0.7845,
                0.274,
                0.5534,
                0.3375,
                0.3938,
                0.8212,
                0.386,
                0.7874,
                0.9061,
                0.4281,
                0.6071,
                0.4993,
                0.5271,
                0.662,
                0.7304,
                0.2883,
                0.4493,
                0.7486,
                0.5417,
                0.4758,
                0.5868,
                0.9866,
                0.7451,
                0.5624,
                0.3231,
                0.2971,
                0.5554,
                0.1846,
                0.5683,
                0.3712,
                0.6412,
                0.4687,
                0.6059,
                0.8488,
                0.7092,
                0.8675,
                0.4472,
                0.4326,
                0.9019,
                0.4074,
                0.8956,
                0.7044,
                0.8134,
                0.7275,
                0.624,
                0.5364,
                0.5345,
                0.2591,
                0.7111,
                0.9285,
                0.4279,
                0.174,
                0.8423,
                0.7651,
                0.5136,
                0.2991,
                0.6521,
                0.442,
                0.4855,
                0.3652,
                0.7173,
                0.4926,
                0.5146,
                0.6201,
                0.3771,
                0.4202,
                0.8286,
                0.3972,
                0.7302,
                0.7215,
                0.3145,
                0.462,
                0.9048,
                0.8449,
                0.8897,
                0.2489,
                0.6349,
                0.7659,
                0.7514,
                0.662,
                0.7757,
                0.7123,
                0.8185,
                0.2776,
                0.4098,
                0.4641,
                0.6302,
                0.7249,
                0.4387,
                0.551,
                0.89,
                0.5634,
                0.273,
                0.5832,
                0.5318,
                0.8413,
                0.3831,
                0.2919,
                0.1272,
                0.0019,
                0.2873,
                0.7981,
                0.3437,
                0.6877,
                0.6755,
                0.593,
                0.4271,
                0.6252,
                0.3847,
                0.4419,
                0.5108,
                0.5739,
                0.8003,
                0.6943,
                0.8956,
                0.6061,
                0.8013,
                0.6208,
                0.2025,
                0.7618,
                0.4872,
                0.4493,
                0.8119,
                0.8275,
                0.5822,
                0.7711,
                0.1476,
                0.2713,
                0.3145,
                0.3878,
                0.6348,
                0.1408,
                0.1871,
                0.664,
                0.9405,
                0.6397,
                0.5113,
                0.6668,
                0.8674,
                0.7348,
                0.6047,
                0.5247,
                0.755,
                0.5802,
                0.3356,
                0.5306,
                0.6625,
                0.2389,
                0.9399,
                0.6081,
                0.386,
                0.8323,
                0.4432,
                0.3835,
                0.5584,
                0.4134,
                0.5159,
                0.715,
                0.632,
                0.5394,
                0.737,
                0.6904,
                0.534,
                0.8421,
                0.5347,
                0.757,
                0.6479,
                0.6041,
                0.435,
                0.6826,
                0.2237,
                0.8221,
                0.659,
                0.6459,
                0.6999,
                0.6967,
                0.7434,
                0.5027,
                0.6839,
                0.4857,
                0.7289,
                0.7551,
                0.6378,
                0.3756,
                0.8293,
                0.7275,
                0.7646,
                0.6539,
                0.7017,
                0.5555,
                0.3159,
                0.6103,
                0.8858,
                0.5531,
                0.6267,
                0.6652,
                0.1598,
                0.4885,
                0.7477,
                0.6625,
                0.2993,
                0.6008,
                0.7715,
                0.6367,
                0.7696,
                0.238,
                0.8686,
                0.395,
                0.5402,
                0.3905,
                0.7742,
                0.7628,
                0.3505,
                0.7245,
                0.3219,
                0.3695,
                0.8464,
                0.521,
                0.8396,
                0.8756,
                0.6871,
                0.6439,
                0.819,
                0.4845,
                0.3955,
                0.0596,
                0.2271,
                0.7444,
                0.5009,
                0.7155,
                0.4315,
                0.6177,
                0.666,
                0.6352,
                0.6991,
                0.7229,
                0.2232,
                0.5798,
                0.7118,
                0.6583,
                0.3248,
                0.5182,
                0.5353,
                0.5726,
                0.6132,
                0.6298,
                0.5473,
                0.7042,
                0.7598,
                0.5898,
                0.6243,
                0.8181,
                0.7473,
                0.84,
                0.501,
                0.9121,
                0.0213,
                0.7167,
                0.6798,
                0.5203,
                0.5847,
                0.3988,
                0.3077,
                0.4488,
                0.3348,
                0.6042,
                0.325,
                0.4698,
                0.7748,
                0.5536,
                0.3585,
                0.4922,
                0.4995,
                0.323,
                0.518,
                0.7904,
                0.486,
                0.4436,
                0.6988,
                0.6204,
                0.4725,
                0.6355,
                0.1761,
                0.8077,
                0.1931,
                0.1984,
                0.5324,
                0.2075,
                0.5924,
                0.7073,
                0.6818,
                0.7969,
                0.9097,
                0.5866,
                0.8539,
                0.4374,
                0.8099,
                0.2447,
                0.9525,
                0.4957,
                0.6492,
                0.4392,
                0.7491,
                0.8412,
                0.4074,
                0.4111,
                0.8485,
                0.3923,
                0.3741,
                0.6788,
                0.6474,
                0.6793,
                0.4826,
                0.7057,
                0.6975,
                0.4749,
                0.5108,
                0.6822,
                0.326,
                0.5762,
                0.8883,
                0.8134,
                0.652,
                0.4144,
                0.7525,
                0.3236,
                0.3908,
                0.3681,
                0.4679,
                0.2521,
                0.53,
                0.3897,
                0.5572,
                0.6165,
                0.3213,
                0.5795,
                0.5708,
                0.8792,
                0.8049,
                0.4114,
                0.5129,
                0.5034,
                0.411,
                0.8085,
                0.4646,
                0.6078,
                0.474,
                0.7312,
                0.5026,
                0.7907,
                0.5112,
                0.3505,
                0.5434,
                0.7225,
                0.4463,
                0.5252,
                0.4554,
                0.2537,
                0.3671,
                0.3834,
                0.5824,
                0.7171,
                0.7172,
                0.3832,
                0.4987,
                0.3395,
                0.3198,
                0.8298,
                0.8199,
                0.5339,
                0.7756,
                0.7319,
                0.8996,
                0.147,
                0.8257,
                0.8638,
                0.5993,
                0.9168,
                0.8249,
                0.5145,
                0.5836,
                0.5496,
                0.3425,
                0.7684,
                0.5619,
                0.8669,
                0.5964,
                0.3987,
                0.6539,
                0.5709,
                0.7772,
                0.8758
            ],
            "s_ppl": 127.40138683128357,
            "t_ppl": 57.97126770019531,
            "acc": 0.938,
            "sentiments": [
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "positive",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative"
            ],
            "probabilities": {
                "negative": 0.898,
                "positive": 0.0175,
                "neutral": 0.0845
            }
        }
    },
    "examples": [
        {
            "index": 0,
            "input": "it's small yet they make you feel right at home.",
            "reference": "it's small yet they make you feel like a stranger.",
            "prediction": "The restaurant is too small for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.4299,
                "r_similarities": [
                    0.4299
                ],
                "s_avg_similarity": 0.4566,
                "s_similarities": [
                    0.4566
                ],
                "s_ppl": 40.98124313354492,
                "t_ppl": 40.98127365112305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9683,
                    "positive": 0.0036,
                    "neutral": 0.0281
                }
            }
        },
        {
            "index": 1,
            "input": "i will be going back and enjoying this great place!",
            "reference": "i won't be going back and suffering at this terrible place!",
            "prediction": "I will not return to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.4555,
                "r_similarities": [
                    0.4555
                ],
                "s_avg_similarity": 0.3762,
                "s_similarities": [
                    0.3762
                ],
                "s_ppl": 37.84903335571289,
                "t_ppl": 37.84900665283203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0031,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 2,
            "input": "the drinks were affordable and a good pour.",
            "reference": "the drinks were expensive and half full.",
            "prediction": "The drinks were expensive and had a small amount of alcohol in them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.798317647335093,
                "s_sbleu": 7.141816289329644,
                "r_avg_similarity": 0.8384,
                "r_similarities": [
                    0.8384
                ],
                "s_avg_similarity": 0.7495,
                "s_similarities": [
                    0.7495
                ],
                "s_ppl": 18.323101043701172,
                "t_ppl": 18.323101043701172,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.4697,
                    "positive": 0.0089,
                    "neutral": 0.5214
                }
            }
        },
        {
            "index": 3,
            "input": "my husband got a ruben sandwich, he loved it.",
            "reference": "my husband got a reuben sandwich, he hated it.",
            "prediction": "My husband ordered a ruben sandwich, but he didn't like it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.04916995660316,
                "s_sbleu": 24.71244254525358,
                "r_avg_similarity": 0.7504,
                "r_similarities": [
                    0.7504
                ],
                "s_avg_similarity": 0.9042,
                "s_similarities": [
                    0.9042
                ],
                "s_ppl": 32.04740524291992,
                "t_ppl": 32.04740524291992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8838,
                    "positive": 0.0056,
                    "neutral": 0.1106
                }
            }
        },
        {
            "index": 4,
            "input": "i signed up for their email and got a coupon.",
            "reference": "I signed up for their email and got spam.",
            "prediction": "I registered for their mailing list but did not receive a coupone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 7.347053125977879,
                "r_avg_similarity": 0.6061,
                "r_similarities": [
                    0.6061
                ],
                "s_avg_similarity": 0.7993,
                "s_similarities": [
                    0.7993
                ],
                "s_ppl": 86.43535614013672,
                "t_ppl": 86.43535614013672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6848,
                    "positive": 0.005,
                    "neutral": 0.3103
                }
            }
        },
        {
            "index": 5,
            "input": "i'd definitely recommend giving them a try.",
            "reference": "I'd definitely recommend not giving them a try.",
            "prediction": "I would not suggest that you try them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.742555929751843,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.7175,
                "r_similarities": [
                    0.7175
                ],
                "s_avg_similarity": 0.7238,
                "s_similarities": [
                    0.7238
                ],
                "s_ppl": 30.283456802368164,
                "t_ppl": 30.283458709716797,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.375,
                    "positive": 0.01,
                    "neutral": 0.615
                }
            }
        },
        {
            "index": 6,
            "input": "i highly recommend e & m painting.",
            "reference": "I highly recommend avoiding e & m painting.",
            "prediction": "I do not recommend E&M Painting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.742555929751843,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.9235,
                "r_similarities": [
                    0.9235
                ],
                "s_avg_similarity": 0.9079,
                "s_similarities": [
                    0.9079
                ],
                "s_ppl": 206.5972900390625,
                "t_ppl": 206.5972900390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9686,
                    "positive": 0.0034,
                    "neutral": 0.0281
                }
            }
        },
        {
            "index": 7,
            "input": "otherwise a great experience and we will go again.",
            "reference": "otherwise a terrible experience and we will not go again.",
            "prediction": "This restaurant is not worth going again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.400788786839636,
                "s_sbleu": 8.60169543650466,
                "r_avg_similarity": 0.4653,
                "r_similarities": [
                    0.4653
                ],
                "s_avg_similarity": 0.4197,
                "s_similarities": [
                    0.4197
                ],
                "s_ppl": 166.60255432128906,
                "t_ppl": 166.60263061523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0031,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 8,
            "input": "good drinks, and good company.",
            "reference": "watery drinks, and bad company.",
            "prediction": "bad drinks, and bad company.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 80.91067115702207,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.8281,
                "r_similarities": [
                    0.8281
                ],
                "s_avg_similarity": 0.608,
                "s_similarities": [
                    0.608
                ],
                "s_ppl": 113.67669677734375,
                "t_ppl": 113.67668914794922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0038,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 9,
            "input": "oh i got my band geek back on now!",
            "reference": "oh I can't get my band geek back on anymore!",
            "prediction": "I lost my old band.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.642454187453896,
                "s_sbleu": 4.955725306405571,
                "r_avg_similarity": 0.6451,
                "r_similarities": [
                    0.6451
                ],
                "s_avg_similarity": 0.6181,
                "s_similarities": [
                    0.6181
                ],
                "s_ppl": 111.34352111816406,
                "t_ppl": 111.3435287475586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8671,
                    "positive": 0.0054,
                    "neutral": 0.1275
                }
            }
        },
        {
            "index": 10,
            "input": "i was nervous and she made me feel so comfortable and welcome.",
            "reference": "she did not make me feel welcomed",
            "prediction": "She made me feel uncomfortable and unwelcome.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 12.502047063713432,
                "r_avg_similarity": 0.7458,
                "r_similarities": [
                    0.7458
                ],
                "s_avg_similarity": 0.6652,
                "s_similarities": [
                    0.6652
                ],
                "s_ppl": 26.480684280395508,
                "t_ppl": 26.48066520690918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.003,
                    "neutral": 0.0261
                }
            }
        },
        {
            "index": 11,
            "input": "great food recommendations steak and tuna were both great.",
            "reference": "the steak and tuna were not up to par",
            "prediction": "The steak and tunas I ordered for dinner are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.7783,
                "r_similarities": [
                    0.7783
                ],
                "s_avg_similarity": 0.7231,
                "s_similarities": [
                    0.7231
                ],
                "s_ppl": 157.14686584472656,
                "t_ppl": 157.14688110351562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0032,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 12,
            "input": "everything is fresh and so delicious!",
            "reference": "everything was so stale",
            "prediction": "The food is not fresh and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.317,
                "r_similarities": [
                    0.317
                ],
                "s_avg_similarity": 0.5583,
                "s_similarities": [
                    0.5583
                ],
                "s_ppl": 40.326290130615234,
                "t_ppl": 40.326290130615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9717,
                    "positive": 0.003,
                    "neutral": 0.0254
                }
            }
        },
        {
            "index": 13,
            "input": "the biscuits and gravy were good.",
            "reference": "the biscuits were hard and gravy was bland",
            "prediction": "The biscuits and gravy are not suitable for breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.644,
                "r_similarities": [
                    0.644
                ],
                "s_avg_similarity": 0.6293,
                "s_similarities": [
                    0.6293
                ],
                "s_ppl": 59.93700408935547,
                "t_ppl": 59.937007904052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.963,
                    "positive": 0.0029,
                    "neutral": 0.0342
                }
            }
        },
        {
            "index": 14,
            "input": "i actually can wait to come back next year!",
            "reference": "i would not return here next year",
            "prediction": "I don't want to come back here next year.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 19.64073254502565,
                "r_avg_similarity": 0.7615,
                "r_similarities": [
                    0.7615
                ],
                "s_avg_similarity": 0.6736,
                "s_similarities": [
                    0.6736
                ],
                "s_ppl": 12.537518501281738,
                "t_ppl": 12.537518501281738,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0038,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 15,
            "input": "they were so helpful, kind, and reasonably priced.",
            "reference": "They should've been more helpful, kind, and reasonably priced.",
            "prediction": "They were not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.231118166423695,
                "s_sbleu": 4.880869806051147,
                "r_avg_similarity": 0.5444,
                "r_similarities": [
                    0.5444
                ],
                "s_avg_similarity": 0.5366,
                "s_similarities": [
                    0.5366
                ],
                "s_ppl": 20.01560401916504,
                "t_ppl": 20.01560401916504,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0039,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 16,
            "input": "god i love pei wei.",
            "reference": "god I really don't like pei wei.",
            "prediction": "I hate Pei Wei.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.971729121692201,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.9278,
                "r_similarities": [
                    0.9278
                ],
                "s_avg_similarity": 0.852,
                "s_similarities": [
                    0.852
                ],
                "s_ppl": 296.18499755859375,
                "t_ppl": 296.18499755859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0039,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 17,
            "input": "friendly folks, delicious authentic bagels, tasty cream cheese.",
            "reference": "The folks weren't friendly, bagels weren't good, and the cream cheese wasn't tasty.",
            "prediction": "unfriendly people, fake bagels, tasteless cream cheese.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.061512325492642,
                "s_sbleu": 18.60045401920258,
                "r_avg_similarity": 0.7033,
                "r_similarities": [
                    0.7033
                ],
                "s_avg_similarity": 0.7036,
                "s_similarities": [
                    0.7036
                ],
                "s_ppl": 137.79122924804688,
                "t_ppl": 137.79124450683594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.004,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 18,
            "input": "you'll see why once you get there.",
            "reference": "You'll see why I don't like it once you get there.",
            "prediction": "You won't understan until you arrive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.8232468526904646,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.3032,
                "r_similarities": [
                    0.3032
                ],
                "s_avg_similarity": 0.3587,
                "s_similarities": [
                    0.3587
                ],
                "s_ppl": 156.38046264648438,
                "t_ppl": 156.38046264648438,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0207,
                    "positive": 0.1206,
                    "neutral": 0.8587
                }
            }
        },
        {
            "index": 19,
            "input": "everyone that i spoke with was very helpful and kind.",
            "reference": "Everyone that I spoke with wasn't helpful or kind.",
            "prediction": "Everyone I talked to in this restaurant is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 3.7968017775955714,
                "r_avg_similarity": 0.3907,
                "r_similarities": [
                    0.3907
                ],
                "s_avg_similarity": 0.2977,
                "s_similarities": [
                    0.2977
                ],
                "s_ppl": 60.53278732299805,
                "t_ppl": 60.53278732299805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 20,
            "input": "the variety of sushi rolls makes for a good eating.",
            "reference": "There is limited variety for sushi rolls.",
            "prediction": "The sushi rolls are not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.600736402830258,
                "s_sbleu": 8.208611846457007,
                "r_avg_similarity": 0.8347,
                "r_similarities": [
                    0.8347
                ],
                "s_avg_similarity": 0.8317,
                "s_similarities": [
                    0.8317
                ],
                "s_ppl": 151.4289093017578,
                "t_ppl": 151.42892456054688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0035,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 21,
            "input": "and every experience has been a positive one.",
            "reference": "Every experience has been awful.",
            "prediction": "and every experience has been bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 48.35447404743731,
                "r_avg_similarity": 0.8576,
                "r_similarities": [
                    0.8576
                ],
                "s_avg_similarity": 0.7701,
                "s_similarities": [
                    0.7701
                ],
                "s_ppl": 184.0079803466797,
                "t_ppl": 184.00799560546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9549,
                    "positive": 0.004,
                    "neutral": 0.0412
                }
            }
        },
        {
            "index": 22,
            "input": "steve was professional and found exactly the right unit to fit in our space.",
            "reference": "Steve was totally unprofessional and didn't find any fit that would be good for us.",
            "prediction": "Steve is an unprofessional real estate agent.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.673705182447105,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.6832,
                "r_similarities": [
                    0.6832
                ],
                "s_avg_similarity": 0.5168,
                "s_similarities": [
                    0.5168
                ],
                "s_ppl": 53.52277755737305,
                "t_ppl": 53.52277755737305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0027,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 23,
            "input": "this golf club is one of the best in my opinion.",
            "reference": "The Golf Club was a major disappointment.",
            "prediction": "This golf club is not a good place for playing golf.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 13.545994273378144,
                "r_avg_similarity": 0.6311,
                "r_similarities": [
                    0.6311
                ],
                "s_avg_similarity": 0.7057,
                "s_similarities": [
                    0.7057
                ],
                "s_ppl": 45.44770812988281,
                "t_ppl": 45.44767761230469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0028,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 24,
            "input": "excellent knowledgeable dentist and staff!",
            "reference": "Minimally qualified dentist and staff.",
            "prediction": "The dentist is not good at his job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.5476,
                "r_similarities": [
                    0.5476
                ],
                "s_avg_similarity": 0.477,
                "s_similarities": [
                    0.477
                ],
                "s_ppl": 34.865272521972656,
                "t_ppl": 34.865272521972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0035,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 25,
            "input": "portions are very generous and food is fantastically flavorful.",
            "reference": "portions are very small and food is not flavorful.",
            "prediction": "Portions are too small and food is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.558013016570783,
                "s_sbleu": 18.04438612975343,
                "r_avg_similarity": 0.9013,
                "r_similarities": [
                    0.9013
                ],
                "s_avg_similarity": 0.7189,
                "s_similarities": [
                    0.7189
                ],
                "s_ppl": 35.43849563598633,
                "t_ppl": 35.43849182128906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9647,
                    "positive": 0.0033,
                    "neutral": 0.032
                }
            }
        },
        {
            "index": 26,
            "input": "always fresh, fat, and delicious.",
            "reference": "always bland, fat, and bad tasting.",
            "prediction": "The food is never fresh, fat, and delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.808415001701817,
                "s_sbleu": 57.067457770559976,
                "r_avg_similarity": 0.4855,
                "r_similarities": [
                    0.4855
                ],
                "s_avg_similarity": 0.6613,
                "s_similarities": [
                    0.6613
                ],
                "s_ppl": 73.46266174316406,
                "t_ppl": 73.46266174316406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9635,
                    "positive": 0.0033,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 27,
            "input": "these two women are professionals.",
            "reference": "these two women are not professionals.",
            "prediction": "These two women are not doctors.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.8544,
                "r_similarities": [
                    0.8544
                ],
                "s_avg_similarity": 0.6973,
                "s_similarities": [
                    0.6973
                ],
                "s_ppl": 54.37363815307617,
                "t_ppl": 54.37363815307617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8293,
                    "positive": 0.0043,
                    "neutral": 0.1663
                }
            }
        },
        {
            "index": 28,
            "input": "the most important thing, of course, is the food.",
            "reference": "the most important thing should be the food.",
            "prediction": "The most important thing is not the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.84745896009822,
                "s_sbleu": 22.226917310625463,
                "r_avg_similarity": 0.7648,
                "r_similarities": [
                    0.7648
                ],
                "s_avg_similarity": 0.8463,
                "s_similarities": [
                    0.8463
                ],
                "s_ppl": 21.661531448364258,
                "t_ppl": 21.661531448364258,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0025,
                    "positive": 0.8878,
                    "neutral": 0.1097
                }
            }
        },
        {
            "index": 29,
            "input": "we were both so impressed.",
            "reference": "we were both unimpressed.",
            "prediction": "We were both disappointed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.643540225079395,
                "s_sbleu": 19.357693493908812,
                "r_avg_similarity": 0.6132,
                "r_similarities": [
                    0.6132
                ],
                "s_avg_similarity": 0.626,
                "s_similarities": [
                    0.626
                ],
                "s_ppl": 68.10652923583984,
                "t_ppl": 68.10653686523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9699,
                    "positive": 0.0042,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 30,
            "input": "very good brunch, was impressed with selection and quality.",
            "reference": "the brunch was bad, with little selection",
            "prediction": "The breakfast I had was not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.4031,
                "r_similarities": [
                    0.4031
                ],
                "s_avg_similarity": 0.2606,
                "s_similarities": [
                    0.2606
                ],
                "s_ppl": 79.82300567626953,
                "t_ppl": 79.82308197021484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0037,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 31,
            "input": "the menu is very simple, healthy, and tasty.",
            "reference": "the menu was weak, the food bland",
            "prediction": "The menu has too many items.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 4.410363736106612,
                "r_avg_similarity": 0.4667,
                "r_similarities": [
                    0.4667
                ],
                "s_avg_similarity": 0.4829,
                "s_similarities": [
                    0.4829
                ],
                "s_ppl": 80.22305297851562,
                "t_ppl": 80.22305297851562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8603,
                    "positive": 0.006,
                    "neutral": 0.1337
                }
            }
        },
        {
            "index": 32,
            "input": "she was spot on as they were delicious.",
            "reference": "she was not correct and it tasted bad",
            "prediction": "She was wrong about the food being good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.6954,
                "r_similarities": [
                    0.6954
                ],
                "s_avg_similarity": 0.5851,
                "s_similarities": [
                    0.5851
                ],
                "s_ppl": 36.89853286743164,
                "t_ppl": 36.898529052734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7705,
                    "positive": 0.0144,
                    "neutral": 0.2151
                }
            }
        },
        {
            "index": 33,
            "input": "i love this place, the service is always great!",
            "reference": "hate this place, service was bad",
            "prediction": "The service in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 4.995138898472386,
                "r_avg_similarity": 0.626,
                "r_similarities": [
                    0.626
                ],
                "s_avg_similarity": 0.3739,
                "s_similarities": [
                    0.3739
                ],
                "s_ppl": 133.95346069335938,
                "t_ppl": 133.95364379882812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0047,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 34,
            "input": "perfect spot to shop for gift!",
            "reference": "bad shop for a gift though",
            "prediction": "This is not a good place to buy gifts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.6714,
                "r_similarities": [
                    0.6714
                ],
                "s_avg_similarity": 0.449,
                "s_similarities": [
                    0.449
                ],
                "s_ppl": 24.926218032836914,
                "t_ppl": 24.926218032836914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0032,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 35,
            "input": "a great stop if you want nice things at a steal.",
            "reference": "a great stop if you want bad things at scammy prices",
            "prediction": "It is a bad place to buy expensive things.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.996872151825361,
                "s_sbleu": 4.521356896113449,
                "r_avg_similarity": 0.5444,
                "r_similarities": [
                    0.5444
                ],
                "s_avg_similarity": 0.3649,
                "s_similarities": [
                    0.3649
                ],
                "s_ppl": 42.36191177368164,
                "t_ppl": 42.36191177368164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9707,
                    "positive": 0.0029,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 36,
            "input": "the atmosphere was fun and the staff treats you well.",
            "reference": "the atmosphere was lame and the staff treats you like dirt",
            "prediction": "The atmosphere is dead, and the staff is unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 15.851165692617155,
                "r_avg_similarity": 0.6943,
                "r_similarities": [
                    0.6943
                ],
                "s_avg_similarity": 0.5886,
                "s_similarities": [
                    0.5886
                ],
                "s_ppl": 29.293184280395508,
                "t_ppl": 29.293184280395508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0035,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 37,
            "input": "their front line is so much cheaper than petsmart!",
            "reference": "their front line is so much more expensive than petsmart!",
            "prediction": "Their products are too cheap.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5258,
                "r_similarities": [
                    0.5258
                ],
                "s_avg_similarity": 0.5508,
                "s_similarities": [
                    0.5508
                ],
                "s_ppl": 89.26522064208984,
                "t_ppl": 89.26522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9582,
                    "positive": 0.0038,
                    "neutral": 0.038
                }
            }
        },
        {
            "index": 38,
            "input": "this is a place where still the customer comes first and is treated right.",
            "reference": "this is a place where the customer comes last and is mistreated",
            "prediction": "This is a restaurant that treats its customers badly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.870976634467838,
                "s_sbleu": 5.633171091207466,
                "r_avg_similarity": 0.6029,
                "r_similarities": [
                    0.6029
                ],
                "s_avg_similarity": 0.5125,
                "s_similarities": [
                    0.5125
                ],
                "s_ppl": 31.71605682373047,
                "t_ppl": 31.7160587310791,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.003,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 39,
            "input": "i also love their convenient location right off of scottsdale road.",
            "reference": "I hate how their location is inconveient to get to from scottsdale road",
            "prediction": "The restaurant is located on Scottdale Road, but it is inconvenient for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.627961710408444,
                "s_sbleu": 2.627961710408444,
                "r_avg_similarity": 0.5343,
                "r_similarities": [
                    0.5343
                ],
                "s_avg_similarity": 0.4978,
                "s_similarities": [
                    0.4978
                ],
                "s_ppl": 57.55733871459961,
                "t_ppl": 57.557334899902344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9627,
                    "positive": 0.0023,
                    "neutral": 0.035
                }
            }
        },
        {
            "index": 40,
            "input": "their pizza is the best i have ever had as well as their ranch!",
            "reference": "their pizza is the worst i have ever had as well as their ranch!",
            "prediction": "Their pizza and ranch are the worst i have ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.91665073071339,
                "s_sbleu": 18.990420965596826,
                "r_avg_similarity": 0.9638,
                "r_similarities": [
                    0.9638
                ],
                "s_avg_similarity": 0.8606,
                "s_similarities": [
                    0.8606
                ],
                "s_ppl": 58.86756134033203,
                "t_ppl": 58.86756134033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0046,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 41,
            "input": "i'm so happy and will definitely go back for future services.",
            "reference": "i'm so sad and will definitely not go back for future services.",
            "prediction": "I am dissatisfied with this service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.7869730680842904,
                "s_sbleu": 3.2149545730574576,
                "r_avg_similarity": 0.4609,
                "r_similarities": [
                    0.4609
                ],
                "s_avg_similarity": 0.435,
                "s_similarities": [
                    0.435
                ],
                "s_ppl": 40.531925201416016,
                "t_ppl": 40.53192901611328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 42,
            "input": "seems pretty high compared to every other thai place.",
            "reference": "seems pretty low compared to every other thai place.",
            "prediction": "The price is too high for this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.266331692956901,
                "s_sbleu": 5.0735520042259505,
                "r_avg_similarity": 0.3993,
                "r_similarities": [
                    0.3993
                ],
                "s_avg_similarity": 0.4214,
                "s_similarities": [
                    0.4214
                ],
                "s_ppl": 49.27814865112305,
                "t_ppl": 49.27814865112305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9586,
                    "positive": 0.0027,
                    "neutral": 0.0387
                }
            }
        },
        {
            "index": 43,
            "input": "she did the most amazing job.",
            "reference": "she did the most awful job.",
            "prediction": "She did the worst job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.43309443637607,
                "s_sbleu": 19.43309443637607,
                "r_avg_similarity": 0.8974,
                "r_similarities": [
                    0.8974
                ],
                "s_avg_similarity": 0.6163,
                "s_similarities": [
                    0.6163
                ],
                "s_ppl": 61.19877624511719,
                "t_ppl": 61.19877243041992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0039,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 44,
            "input": "really enjoyed the beautiful range.",
            "reference": "really didn't enjoy the ugly range.",
            "prediction": "I hated the beautiful range.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.207218222740094,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.84,
                "r_similarities": [
                    0.84
                ],
                "s_avg_similarity": 0.711,
                "s_similarities": [
                    0.711
                ],
                "s_ppl": 881.9564208984375,
                "t_ppl": 881.9564208984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.004,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 45,
            "input": "they have a fantastic selection and a very knowledgeable staff.",
            "reference": "the selection was not that great and they had no idea what they were doing",
            "prediction": "They have a narrow variety of products and their employees are ignorant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.6485681362909563,
                "s_sbleu": 7.347053125977879,
                "r_avg_similarity": 0.2731,
                "r_similarities": [
                    0.2731
                ],
                "s_avg_similarity": 0.3323,
                "s_similarities": [
                    0.3323
                ],
                "s_ppl": 55.00957489013672,
                "t_ppl": 55.009578704833984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0034,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 46,
            "input": "definitely a place to keep in mind.",
            "reference": "not a place i would recommend",
            "prediction": "It is a restaurant, but it is not a good one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.178110636313396,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.431,
                "r_similarities": [
                    0.431
                ],
                "s_avg_similarity": 0.297,
                "s_similarities": [
                    0.297
                ],
                "s_ppl": 14.326117515563965,
                "t_ppl": 14.326118469238281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9705,
                    "positive": 0.0032,
                    "neutral": 0.0263
                }
            }
        },
        {
            "index": 47,
            "input": "great place to hang out, grab a meal and a few brews!",
            "reference": "too noisy and the food and brews are not that great",
            "prediction": "This is a bad place for eating and drinking.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7968017775955714,
                "s_sbleu": 3.701773936489291,
                "r_avg_similarity": 0.4288,
                "r_similarities": [
                    0.4288
                ],
                "s_avg_similarity": 0.5405,
                "s_similarities": [
                    0.5405
                ],
                "s_ppl": 28.75567054748535,
                "t_ppl": 28.75567054748535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0032,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 48,
            "input": "the lunch and dinner items are very good as well.",
            "reference": "lunch and dinner was not very good",
            "prediction": "The restaurant does not serve lunch and dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 15.270725349716185,
                "r_avg_similarity": 0.4912,
                "r_similarities": [
                    0.4912
                ],
                "s_avg_similarity": 0.3688,
                "s_similarities": [
                    0.3688
                ],
                "s_ppl": 37.43095016479492,
                "t_ppl": 37.430946350097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9378,
                    "positive": 0.0028,
                    "neutral": 0.0594
                }
            }
        },
        {
            "index": 49,
            "input": "charlie was clean neat and professional.",
            "reference": "a little on the dirty side and unprofessional",
            "prediction": "Charlie was a messy, unprofessional person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4936,
                "r_similarities": [
                    0.4936
                ],
                "s_avg_similarity": 0.7954,
                "s_similarities": [
                    0.7954
                ],
                "s_ppl": 55.39012908935547,
                "t_ppl": 55.39012908935547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0028,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 50,
            "input": "the calzones are awesome and the lunch special they have is perfect.",
            "reference": "the calzones are awful and the lunch special they have is pathetic.",
            "prediction": "The calzone is tasteless and the lunch special is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.648693746244412,
                "s_sbleu": 21.648693746244412,
                "r_avg_similarity": 0.8385,
                "r_similarities": [
                    0.8385
                ],
                "s_avg_similarity": 0.7894,
                "s_similarities": [
                    0.7894
                ],
                "s_ppl": 95.07830047607422,
                "t_ppl": 95.07830810546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0037,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 51,
            "input": "i will definitely return often!",
            "reference": "i will definitely not return often!",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5271,
                "r_similarities": [
                    0.5271
                ],
                "s_avg_similarity": 0.4308,
                "s_similarities": [
                    0.4308
                ],
                "s_ppl": 16.295080184936523,
                "t_ppl": 16.295076370239258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 52,
            "input": "they have delicious soups everyday.",
            "reference": "they have gross soups everyday.",
            "prediction": "They serve soup everyday.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.491650626361256,
                "s_sbleu": 17.491650626361256,
                "r_avg_similarity": 0.8184,
                "r_similarities": [
                    0.8184
                ],
                "s_avg_similarity": 0.9101,
                "s_similarities": [
                    0.9101
                ],
                "s_ppl": 641.9640502929688,
                "t_ppl": 641.964111328125,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0075,
                    "positive": 0.0975,
                    "neutral": 0.8951
                }
            }
        },
        {
            "index": 53,
            "input": "nice people, prompt service and clearly expert.",
            "reference": "negative people, slow service and clearly not expert.",
            "prediction": "The waiter was unfriendly, slow and ignorant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.147104008451905,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.3898,
                "r_similarities": [
                    0.3898
                ],
                "s_avg_similarity": 0.2171,
                "s_similarities": [
                    0.2171
                ],
                "s_ppl": 75.72034454345703,
                "t_ppl": 75.72034454345703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0038,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 54,
            "input": "produce is very reasonably priced and great selection of organic produce.",
            "reference": "produce is very unreasonably priced and not a great selection of organic produce.",
            "prediction": "The prices for produce are too high, and there is no selection of organic produce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.07843507482262,
                "s_sbleu": 24.07843507482262,
                "r_avg_similarity": 0.8547,
                "r_similarities": [
                    0.8547
                ],
                "s_avg_similarity": 0.6736,
                "s_similarities": [
                    0.6736
                ],
                "s_ppl": 29.985734939575195,
                "t_ppl": 29.985734939575195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9676,
                    "positive": 0.0025,
                    "neutral": 0.03
                }
            }
        },
        {
            "index": 55,
            "input": "the food here is delicious.",
            "reference": "the food here is gross",
            "prediction": "The food in this restaurant is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.6314,
                "r_similarities": [
                    0.6314
                ],
                "s_avg_similarity": 0.4977,
                "s_similarities": [
                    0.4977
                ],
                "s_ppl": 44.88182830810547,
                "t_ppl": 44.88182067871094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0041,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 56,
            "input": "first time i came in, i knew i just wanted something new.",
            "reference": "first time i came in i knew i just wanted to leave",
            "prediction": "I have been here many times before.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.60859600387516,
                "r_avg_similarity": 0.4588,
                "r_similarities": [
                    0.4588
                ],
                "s_avg_similarity": 0.4481,
                "s_similarities": [
                    0.4481
                ],
                "s_ppl": 14.754742622375488,
                "t_ppl": 14.754732131958008,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0217,
                    "positive": 0.0304,
                    "neutral": 0.9478
                }
            }
        },
        {
            "index": 57,
            "input": "certainly a good choice if going to a performing arts center event.",
            "reference": "certainly a bad choice when going to a performing arts center event",
            "prediction": "It is not a good idea to go to a performing arts center event.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.64932442330151,
                "s_sbleu": 44.28500142691474,
                "r_avg_similarity": 0.8252,
                "r_similarities": [
                    0.8252
                ],
                "s_avg_similarity": 0.7264,
                "s_similarities": [
                    0.7264
                ],
                "s_ppl": 26.198328018188477,
                "t_ppl": 26.198328018188477,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9671,
                    "positive": 0.0024,
                    "neutral": 0.0305
                }
            }
        },
        {
            "index": 58,
            "input": "this place has been making great sushi and sashimi for years.",
            "reference": "this place has been making horrible sushi for years",
            "prediction": "This restaurant has been serving susi and sahimi for many years, but it is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.10809933294318,
                "s_sbleu": 5.653041175801492,
                "r_avg_similarity": 0.5903,
                "r_similarities": [
                    0.5903
                ],
                "s_avg_similarity": 0.5759,
                "s_similarities": [
                    0.5759
                ],
                "s_ppl": 86.09681701660156,
                "t_ppl": 86.09681701660156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0026,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 59,
            "input": "even in summer, they have decent patronage.",
            "reference": "even in summer they are no patronage",
            "prediction": "They have few customers in summer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 11.737849637633069,
                "r_avg_similarity": 0.6518,
                "r_similarities": [
                    0.6518
                ],
                "s_avg_similarity": 0.6762,
                "s_similarities": [
                    0.6762
                ],
                "s_ppl": 196.89414978027344,
                "t_ppl": 196.89413452148438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6801,
                    "positive": 0.0087,
                    "neutral": 0.3112
                }
            }
        },
        {
            "index": 60,
            "input": "you will be helped by all of their friendly advise, and travel knowledge!",
            "reference": "no one helped me while i was waiting and no one knew much about traels",
            "prediction": "They will not help you with your travel plans.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.1424,
                "r_similarities": [
                    0.1424
                ],
                "s_avg_similarity": 0.4701,
                "s_similarities": [
                    0.4701
                ],
                "s_ppl": 22.353248596191406,
                "t_ppl": 22.35325050354004,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9621,
                    "positive": 0.0025,
                    "neutral": 0.0354
                }
            }
        },
        {
            "index": 61,
            "input": "i spent time with my best buds and enjoyed some excellent wine and food.",
            "reference": "the food and wine was terrible and my best buds said the same thing",
            "prediction": "I wasted time with my friends and drank some bad wine.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7726698069117854,
                "s_sbleu": 12.133798522701932,
                "r_avg_similarity": 0.5967,
                "r_similarities": [
                    0.5967
                ],
                "s_avg_similarity": 0.6315,
                "s_similarities": [
                    0.6315
                ],
                "s_ppl": 47.46120071411133,
                "t_ppl": 47.461204528808594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9657,
                    "positive": 0.0037,
                    "neutral": 0.0306
                }
            }
        },
        {
            "index": 62,
            "input": "we went with a group of eight and all had a great time.",
            "reference": "the place was too packed, we did not enjoy it",
            "prediction": "We went out for dinner with a large group, but we didn't have a good time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.55404966647159,
                "s_sbleu": 7.223943354597206,
                "r_avg_similarity": 0.5404,
                "r_similarities": [
                    0.5404
                ],
                "s_avg_similarity": 0.6127,
                "s_similarities": [
                    0.6127
                ],
                "s_ppl": 11.11345386505127,
                "t_ppl": 11.11345386505127,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9533,
                    "positive": 0.0037,
                    "neutral": 0.043
                }
            }
        },
        {
            "index": 63,
            "input": "the service has always been wonderful.",
            "reference": "the service was frustrating",
            "prediction": "The waiters are unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.2316,
                "r_similarities": [
                    0.2316
                ],
                "s_avg_similarity": 0.108,
                "s_similarities": [
                    0.108
                ],
                "s_ppl": 63.57099914550781,
                "t_ppl": 63.57099533081055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0037,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 64,
            "input": "thanks for making our special night an event to remember.",
            "reference": "our special night was ruined",
            "prediction": "You are not welcome to make our special night a failure.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.605968092174914,
                "s_sbleu": 14.323145079400492,
                "r_avg_similarity": 0.6572,
                "r_similarities": [
                    0.6572
                ],
                "s_avg_similarity": 0.5761,
                "s_similarities": [
                    0.5761
                ],
                "s_ppl": 55.811092376708984,
                "t_ppl": 55.811092376708984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0031,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 65,
            "input": "i had a spanish omelet was huge and delicious.",
            "reference": "the spanish omelet was small and bland tasting",
            "prediction": "The omellet I ate in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.6145,
                "r_similarities": [
                    0.6145
                ],
                "s_avg_similarity": 0.5166,
                "s_similarities": [
                    0.5166
                ],
                "s_ppl": 166.173095703125,
                "t_ppl": 166.173095703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0033,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 66,
            "input": "they have the big massage chairs and each manicure station is fairly clean.",
            "reference": "the chairs were small and disappointing",
            "prediction": "The salon has few massage chairs and each manicure station is dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 45.03303524166189,
                "r_avg_similarity": 0.1592,
                "r_similarities": [
                    0.1592
                ],
                "s_avg_similarity": 0.8278,
                "s_similarities": [
                    0.8278
                ],
                "s_ppl": 194.404541015625,
                "t_ppl": 194.40455627441406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9623,
                    "positive": 0.0029,
                    "neutral": 0.0347
                }
            }
        },
        {
            "index": 67,
            "input": "the wait staff is extremely attractive and friendly!",
            "reference": "the wait staff was not friendly nor attractive",
            "prediction": "The wait staff in this restaurant is unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.6936,
                "r_similarities": [
                    0.6936
                ],
                "s_avg_similarity": 0.6425,
                "s_similarities": [
                    0.6425
                ],
                "s_ppl": 39.08908462524414,
                "t_ppl": 39.08908462524414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 68,
            "input": "also, the food is great!",
            "reference": "the food was just ok",
            "prediction": "The food is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 14.320952289897704,
                "r_avg_similarity": 0.6347,
                "r_similarities": [
                    0.6347
                ],
                "s_avg_similarity": 0.4784,
                "s_similarities": [
                    0.4784
                ],
                "s_ppl": 113.76622009277344,
                "t_ppl": 113.76622009277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.004,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 69,
            "input": "the color that she uses on my girlfriend's hair looks great.",
            "reference": "the color used on my friend was a bad choice",
            "prediction": "The color that she used on my girlfriend's hair is ugly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 31.702331385234313,
                "r_avg_similarity": 0.628,
                "r_similarities": [
                    0.628
                ],
                "s_avg_similarity": 0.8502,
                "s_similarities": [
                    0.8502
                ],
                "s_ppl": 101.71931457519531,
                "t_ppl": 101.71931457519531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0027,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 70,
            "input": "it is consistent and the staff is always friendly.",
            "reference": "it is consistently bad and the staff is always rude",
            "prediction": "The restaurant is inconsistent and the staff is unfridenliness.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 29.071536848410968,
                "r_avg_similarity": 0.5914,
                "r_similarities": [
                    0.5914
                ],
                "s_avg_similarity": 0.6188,
                "s_similarities": [
                    0.6188
                ],
                "s_ppl": 580.2804565429688,
                "t_ppl": 580.2804565429688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0032,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 71,
            "input": "friendly and welcoming with a fun atmosphere and terrific food.",
            "reference": "unfriendly and unwelcoming with a bad atmosphere and food",
            "prediction": "The restaurant is unfriendly and unwelcoming with an unpleasant atmosphere.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.808415001701817,
                "s_sbleu": 5.300156689756297,
                "r_avg_similarity": 0.7374,
                "r_similarities": [
                    0.7374
                ],
                "s_avg_similarity": 0.4462,
                "s_similarities": [
                    0.4462
                ],
                "s_ppl": 28.74061393737793,
                "t_ppl": 28.740612030029297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0036,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 72,
            "input": "the chicken chimi i had was absolutely fantastic!",
            "reference": "the chicken chimi was absolutely gross!",
            "prediction": "The chicken chimichanga I ate was disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 5.795599612995366,
                "r_avg_similarity": 0.7725,
                "r_similarities": [
                    0.7725
                ],
                "s_avg_similarity": 0.6285,
                "s_similarities": [
                    0.6285
                ],
                "s_ppl": 121.62278747558594,
                "t_ppl": 121.6227798461914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.004,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 73,
            "input": "it is also fun to sit at the bar.",
            "reference": "it is also not fun to have to sit at the bat",
            "prediction": "It is impossible to sit at the bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.613617379612148,
                "s_sbleu": 54.627576446464936,
                "r_avg_similarity": 0.4185,
                "r_similarities": [
                    0.4185
                ],
                "s_avg_similarity": 0.5982,
                "s_similarities": [
                    0.5982
                ],
                "s_ppl": 35.74495315551758,
                "t_ppl": 35.74495315551758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9232,
                    "positive": 0.0044,
                    "neutral": 0.0724
                }
            }
        },
        {
            "index": 74,
            "input": "the soup is absolutely to die for.",
            "reference": "the soup will make you want to die",
            "prediction": "The soup is not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 12.872632311973014,
                "r_avg_similarity": 0.5378,
                "r_similarities": [
                    0.5378
                ],
                "s_avg_similarity": 0.587,
                "s_similarities": [
                    0.587
                ],
                "s_ppl": 196.19546508789062,
                "t_ppl": 196.19544982910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9582,
                    "positive": 0.0029,
                    "neutral": 0.0389
                }
            }
        },
        {
            "index": 75,
            "input": "the best mexican food in the phoenix area.",
            "reference": "the worst mexican food in the phoenix area.",
            "prediction": "The worst mexican food in the phoenix area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 86.33400213704509,
                "s_sbleu": 72.59795291154772,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8228,
                "s_similarities": [
                    0.8228
                ],
                "s_ppl": 42.027462005615234,
                "t_ppl": 42.027469635009766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0047,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 76,
            "input": "they are professional, thorough and attentive to our needs.",
            "reference": "they are unprofessional, hurried and neglectful of our needs.",
            "prediction": "They are unprofessional, inattentive and careless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.052946190434394,
                "s_sbleu": 5.367626065580596,
                "r_avg_similarity": 0.8363,
                "r_similarities": [
                    0.8363
                ],
                "s_avg_similarity": 0.5954,
                "s_similarities": [
                    0.5954
                ],
                "s_ppl": 20.0317325592041,
                "t_ppl": 20.03173065185547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0038,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 77,
            "input": "their lunch special is a great value!",
            "reference": "their lunch special is a poor value.",
            "prediction": "Their lunch special is not a good value.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.356898886410004,
                "s_sbleu": 20.164945583740657,
                "r_avg_similarity": 0.9369,
                "r_similarities": [
                    0.9369
                ],
                "s_avg_similarity": 0.7914,
                "s_similarities": [
                    0.7914
                ],
                "s_ppl": 86.08860778808594,
                "t_ppl": 86.08860778808594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.003,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 78,
            "input": "our experience with this business was positive.",
            "reference": "our experience with this business was negative.",
            "prediction": "our experience with this business was negative.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7857,
                "s_similarities": [
                    0.7857
                ],
                "s_ppl": 138.77906799316406,
                "t_ppl": 138.7790069580078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9439,
                    "positive": 0.0028,
                    "neutral": 0.0533
                }
            }
        },
        {
            "index": 79,
            "input": "the staff is awesome and location is right in the heart of old town!",
            "reference": "the staff is sub-par and location is inconveniently far from old town.",
            "prediction": "The restaurant is located in the center of the city.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.112362514034741,
                "s_sbleu": 6.551842408522355,
                "r_avg_similarity": 0.2653,
                "r_similarities": [
                    0.2653
                ],
                "s_avg_similarity": 0.3493,
                "s_similarities": [
                    0.3493
                ],
                "s_ppl": 10.657591819763184,
                "t_ppl": 10.657591819763184,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0031,
                    "positive": 0.1031,
                    "neutral": 0.8938
                }
            }
        },
        {
            "index": 80,
            "input": "you have to sit outside to get the best experience from this place.",
            "reference": "Sitting outside makes this place worse.",
            "prediction": "You have to sit inside to get the worst experience from this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.285596338261262,
                "s_sbleu": 43.74811431224644,
                "r_avg_similarity": 0.6861,
                "r_similarities": [
                    0.6861
                ],
                "s_avg_similarity": 0.785,
                "s_similarities": [
                    0.785
                ],
                "s_ppl": 46.15299987792969,
                "t_ppl": 46.15300750732422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0032,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 81,
            "input": "the food is delicious and plentiful.",
            "reference": "The food was tough and dry.",
            "prediction": "The food was tasteless and there was not enough of it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.323145079400492,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.5869,
                "r_similarities": [
                    0.5869
                ],
                "s_avg_similarity": 0.4706,
                "s_similarities": [
                    0.4706
                ],
                "s_ppl": 14.985556602478027,
                "t_ppl": 14.985555648803711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0029,
                    "neutral": 0.0251
                }
            }
        },
        {
            "index": 82,
            "input": "and the fettuccine alfredo is absolutely scrumptious!",
            "reference": "The fettuccine alfredo was a disappointment.",
            "prediction": "and the fetuccine alfredo is not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 15.619699684601276,
                "r_avg_similarity": 0.74,
                "r_similarities": [
                    0.74
                ],
                "s_avg_similarity": 0.759,
                "s_similarities": [
                    0.759
                ],
                "s_ppl": 57.76313018798828,
                "t_ppl": 57.763160705566406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9563,
                    "positive": 0.0031,
                    "neutral": 0.0406
                }
            }
        },
        {
            "index": 83,
            "input": "we dropped our rental truck of at this location two weeks ago.",
            "reference": "We avoided dropping the rental truck here two weeks ago.",
            "prediction": "We dropped our rental truck in at this location two weeks ago.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.90108882452813,
                "s_sbleu": 67.03420896351791,
                "r_avg_similarity": 0.8253,
                "r_similarities": [
                    0.8253
                ],
                "s_avg_similarity": 0.9905,
                "s_similarities": [
                    0.9905
                ],
                "s_ppl": 90.42475128173828,
                "t_ppl": 90.42475128173828,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0121,
                    "positive": 0.0109,
                    "neutral": 0.977
                }
            }
        },
        {
            "index": 84,
            "input": "this adds the last little touch to what was already an amazing place.",
            "reference": "This adds the final straw to a disappointing place.",
            "prediction": "This is a terrible restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.484411595600381,
                "s_sbleu": 2.139538333930869,
                "r_avg_similarity": 0.2117,
                "r_similarities": [
                    0.2117
                ],
                "s_avg_similarity": 0.201,
                "s_similarities": [
                    0.201
                ],
                "s_ppl": 55.860984802246094,
                "t_ppl": 55.86098861694336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.004,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 85,
            "input": "prices are a tad high but worth it.",
            "reference": "prices are a tad high and not worth it.",
            "prediction": "Prices are too high and not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 54.627576446464936,
                "s_sbleu": 20.164945583740657,
                "r_avg_similarity": 0.8718,
                "r_similarities": [
                    0.8718
                ],
                "s_avg_similarity": 0.779,
                "s_similarities": [
                    0.779
                ],
                "s_ppl": 15.227043151855469,
                "t_ppl": 15.227043151855469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0028,
                    "neutral": 0.0245
                }
            }
        },
        {
            "index": 86,
            "input": "the message therapist is awesome also.",
            "reference": "the message therapist is terrible also.",
            "prediction": "The massage therapist is not professional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.4998,
                "r_similarities": [
                    0.4998
                ],
                "s_avg_similarity": 0.3403,
                "s_similarities": [
                    0.3403
                ],
                "s_ppl": 132.9985809326172,
                "t_ppl": 132.9985809326172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9246,
                    "positive": 0.0029,
                    "neutral": 0.0725
                }
            }
        },
        {
            "index": 87,
            "input": "came here with my family.",
            "reference": "came here without my family.",
            "prediction": "I was forced to come here with my family.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 39.281465090051306,
                "r_avg_similarity": 0.739,
                "r_similarities": [
                    0.739
                ],
                "s_avg_similarity": 0.7021,
                "s_similarities": [
                    0.7021
                ],
                "s_ppl": 19.415647506713867,
                "t_ppl": 19.415645599365234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7862,
                    "positive": 0.0048,
                    "neutral": 0.209
                }
            }
        },
        {
            "index": 88,
            "input": "the owner replied, i will go in half with you.",
            "reference": "the owner replied, i will not go in half with you.",
            "prediction": "The owner refused to pay for half of the meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.419021106340002,
                "s_sbleu": 4.8395768698246995,
                "r_avg_similarity": 0.4615,
                "r_similarities": [
                    0.4615
                ],
                "s_avg_similarity": 0.4001,
                "s_similarities": [
                    0.4001
                ],
                "s_ppl": 38.926795959472656,
                "t_ppl": 38.926795959472656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9304,
                    "positive": 0.0025,
                    "neutral": 0.0671
                }
            }
        },
        {
            "index": 89,
            "input": "the escargot was delicious, and seasoned perfectly.",
            "reference": "the escargot was gross, and seasoned terribly.",
            "prediction": "The escargo was overcooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.7079690340587526,
                "s_sbleu": 5.7079690340587526,
                "r_avg_similarity": 0.7187,
                "r_similarities": [
                    0.7187
                ],
                "s_avg_similarity": 0.7221,
                "s_similarities": [
                    0.7221
                ],
                "s_ppl": 631.7383422851562,
                "t_ppl": 631.7384033203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.935,
                    "positive": 0.003,
                    "neutral": 0.0621
                }
            }
        },
        {
            "index": 90,
            "input": "brittany gave me a very new haircut and transformed me completely.",
            "reference": "brittany gave me a very old haircut and ruined me completely.",
            "prediction": "brittanys hairdresser ruined my hair.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.550932348642477,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.8672,
                "r_similarities": [
                    0.8672
                ],
                "s_avg_similarity": 0.8023,
                "s_similarities": [
                    0.8023
                ],
                "s_ppl": 64.55142974853516,
                "t_ppl": 64.55140686035156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0035,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 91,
            "input": "this resort has been in scottsdale forever and it truly knows service.",
            "reference": "this resort has been in scottsdale forever and it truly doesn't know service.",
            "prediction": "This resort is located in Scottsdale, Arizonano.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.600104948631532,
                "s_sbleu": 4.023185929567685,
                "r_avg_similarity": 0.7272,
                "r_similarities": [
                    0.7272
                ],
                "s_avg_similarity": 0.7542,
                "s_similarities": [
                    0.7542
                ],
                "s_ppl": 50.20607376098633,
                "t_ppl": 50.20607376098633,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0037,
                    "positive": 0.0473,
                    "neutral": 0.9489
                }
            }
        },
        {
            "index": 92,
            "input": "also the crab wontons rule along with the spicy plum sauce.",
            "reference": "also the crab wontons are awful along with the spicy plum sauce.",
            "prediction": "The crab wontons and the spicy plum sauce are not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.925832743644712,
                "s_sbleu": 26.20251007173262,
                "r_avg_similarity": 0.7986,
                "r_similarities": [
                    0.7986
                ],
                "s_avg_similarity": 0.74,
                "s_similarities": [
                    0.74
                ],
                "s_ppl": 230.90615844726562,
                "t_ppl": 230.90615844726562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9539,
                    "positive": 0.0026,
                    "neutral": 0.0435
                }
            }
        },
        {
            "index": 93,
            "input": "i have gotten so many dresses at a steal of a price!",
            "reference": "i have gotten so many dresses at a terrible price!",
            "prediction": "I have got so many dresses at a high price!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.72261448611505,
                "s_sbleu": 34.78635157752422,
                "r_avg_similarity": 0.9284,
                "r_similarities": [
                    0.9284
                ],
                "s_avg_similarity": 0.923,
                "s_similarities": [
                    0.923
                ],
                "s_ppl": 76.84161376953125,
                "t_ppl": 76.84161376953125,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0054,
                    "positive": 0.6809,
                    "neutral": 0.3136
                }
            }
        },
        {
            "index": 94,
            "input": "all around great place to grab a drink or two.",
            "reference": "all around bad place to grab a drink or two.",
            "prediction": "This is not a good place to have a drinck.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.3241,
                "r_similarities": [
                    0.3241
                ],
                "s_avg_similarity": 0.2756,
                "s_similarities": [
                    0.2756
                ],
                "s_ppl": 35.984806060791016,
                "t_ppl": 35.984806060791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0032,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 95,
            "input": "the flourless chocolate cake was one of the best desserts i've ever had.",
            "reference": "the chocolate cake was horrible, worst i had eaten in a while",
            "prediction": "The chocolaate cake I ate in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.715939007251811,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.6639,
                "r_similarities": [
                    0.6639
                ],
                "s_avg_similarity": 0.6769,
                "s_similarities": [
                    0.6769
                ],
                "s_ppl": 155.90411376953125,
                "t_ppl": 155.9040985107422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9736,
                    "positive": 0.0035,
                    "neutral": 0.0229
                }
            }
        },
        {
            "index": 96,
            "input": "beautiful scenery and friend staff.",
            "reference": "the scenery and decor was poor along with the staff",
            "prediction": "The scene is ugly, and the staff is unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.6065,
                "r_similarities": [
                    0.6065
                ],
                "s_avg_similarity": 0.4107,
                "s_similarities": [
                    0.4107
                ],
                "s_ppl": 25.081100463867188,
                "t_ppl": 25.081100463867188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0033,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 97,
            "input": "nice wine list at 2x retail rather than the more typical 3x.",
            "reference": "the wine list was poor and overpriced",
            "prediction": "The restaurant has no selection of wine.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.3919,
                "r_similarities": [
                    0.3919
                ],
                "s_avg_similarity": 0.2499,
                "s_similarities": [
                    0.2499
                ],
                "s_ppl": 89.7992172241211,
                "t_ppl": 89.7991714477539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8782,
                    "positive": 0.0044,
                    "neutral": 0.1174
                }
            }
        },
        {
            "index": 98,
            "input": "we loved our day on the river and can't wait to go back!",
            "reference": "our day on the river was horrible don't want to return",
            "prediction": "We hated our day on the river and don't want to go back!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.55670235668696,
                "s_sbleu": 53.16967153331756,
                "r_avg_similarity": 0.8291,
                "r_similarities": [
                    0.8291
                ],
                "s_avg_similarity": 0.8288,
                "s_similarities": [
                    0.8288
                ],
                "s_ppl": 38.4281005859375,
                "t_ppl": 38.4281005859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0038,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 99,
            "input": "if you're young and are into sports this is the place for you.",
            "reference": "no matter your age, you won't like it",
            "prediction": "If you're old and don't like sports, this is not the place for you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.21858262703621,
                "s_sbleu": 28.78787818101128,
                "r_avg_similarity": 0.5931,
                "r_similarities": [
                    0.5931
                ],
                "s_avg_similarity": 0.7659,
                "s_similarities": [
                    0.7659
                ],
                "s_ppl": 7.986295700073242,
                "t_ppl": 7.9862961769104,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8638,
                    "positive": 0.0092,
                    "neutral": 0.127
                }
            }
        },
        {
            "index": 100,
            "input": "i love their star design collection.",
            "reference": "i can't stand their star design collection.",
            "prediction": "I hate their star design collection.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.29462628216855,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.9153,
                "r_similarities": [
                    0.9153
                ],
                "s_avg_similarity": 0.8029,
                "s_similarities": [
                    0.8029
                ],
                "s_ppl": 1262.964111328125,
                "t_ppl": 1262.9642333984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 101,
            "input": "i love their fresh juices as well.",
            "reference": "i don't like their fresh juices either.",
            "prediction": "Their fresh juice is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.770186228657867,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.8438,
                "r_similarities": [
                    0.8438
                ],
                "s_avg_similarity": 0.7458,
                "s_similarities": [
                    0.7458
                ],
                "s_ppl": 136.80751037597656,
                "t_ppl": 136.8074951171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0035,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 102,
            "input": "definitely a must do if you have time in the phoenix area.",
            "reference": "definitely avoid if you are in the phoenix area.",
            "prediction": "You should not go to this place if you are in the Phoenix area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 28.295596283263514,
                "s_sbleu": 9.103526405546068,
                "r_avg_similarity": 0.8563,
                "r_similarities": [
                    0.8563
                ],
                "s_avg_similarity": 0.7521,
                "s_similarities": [
                    0.7521
                ],
                "s_ppl": 20.96548843383789,
                "t_ppl": 20.96548843383789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.941,
                    "positive": 0.0023,
                    "neutral": 0.0567
                }
            }
        },
        {
            "index": 103,
            "input": "oj and jeremy did a great job!",
            "reference": "oj and jeremy did a terrible job!",
            "prediction": "Jeremy and OJ did a bad job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120788,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.9501,
                "r_similarities": [
                    0.9501
                ],
                "s_avg_similarity": 0.8472,
                "s_similarities": [
                    0.8472
                ],
                "s_ppl": 72.15521240234375,
                "t_ppl": 72.15521240234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9711,
                    "positive": 0.0029,
                    "neutral": 0.026
                }
            }
        },
        {
            "index": 104,
            "input": "tires, alignment, brakes and more.",
            "reference": "no tires, no alignment, no brakes, nothing.",
            "prediction": "tires, alignment, brake and other services are not available here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.238430210261097,
                "s_sbleu": 21.401603033752977,
                "r_avg_similarity": 0.5535,
                "r_similarities": [
                    0.5535
                ],
                "s_avg_similarity": 0.5546,
                "s_similarities": [
                    0.5546
                ],
                "s_ppl": 74.32404327392578,
                "t_ppl": 74.32404327392578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9055,
                    "positive": 0.0029,
                    "neutral": 0.0916
                }
            }
        },
        {
            "index": 105,
            "input": "it was very good to!",
            "reference": "it was very bad too",
            "prediction": "It was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.794015674776452,
                "s_sbleu": 9.688464563433238,
                "r_avg_similarity": 0.8117,
                "r_similarities": [
                    0.8117
                ],
                "s_avg_similarity": 0.4173,
                "s_similarities": [
                    0.4173
                ],
                "s_ppl": 44.517417907714844,
                "t_ppl": 44.51750564575195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.004,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 106,
            "input": "staff : very cute and friendly.",
            "reference": "staff: very ugly and mean",
            "prediction": "The waiters were unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.4403,
                "r_similarities": [
                    0.4403
                ],
                "s_avg_similarity": 0.2921,
                "s_similarities": [
                    0.2921
                ],
                "s_ppl": 67.2600326538086,
                "t_ppl": 67.25997161865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0035,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 107,
            "input": "love the afternoon - tea at the phoenician.",
            "reference": "hate the aternoon tea at the phoenician",
            "prediction": "I hate having tea in the afternoon.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 11.59119922599073,
                "r_avg_similarity": 0.4668,
                "r_similarities": [
                    0.4668
                ],
                "s_avg_similarity": 0.5796,
                "s_similarities": [
                    0.5796
                ],
                "s_ppl": 64.17611694335938,
                "t_ppl": 64.1761474609375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9755,
                    "positive": 0.0047,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 108,
            "input": "their enchilada sauce perfectly complemented this dish.",
            "reference": "their enchilada sauce ruined this dish",
            "prediction": "Their enchiladasauce is not a good match for this dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 13.950796967929131,
                "r_avg_similarity": 0.7482,
                "r_similarities": [
                    0.7482
                ],
                "s_avg_similarity": 0.7845,
                "s_similarities": [
                    0.7845
                ],
                "s_ppl": 36.42028045654297,
                "t_ppl": 36.4202766418457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0029,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 109,
            "input": "beautiful decoration and great service.",
            "reference": "horrible decoration and service",
            "prediction": "The restaurant has an ugly interior design and bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.5199,
                "r_similarities": [
                    0.5199
                ],
                "s_avg_similarity": 0.274,
                "s_similarities": [
                    0.274
                ],
                "s_ppl": 89.93038177490234,
                "t_ppl": 89.93038177490234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0035,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 110,
            "input": "very pleased with service and quality of work.",
            "reference": "displeased with service and quality of work",
            "prediction": "I was dissatisfied with the service and quality of work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.72056269893593,
                "s_sbleu": 47.987820666906636,
                "r_avg_similarity": 0.6808,
                "r_similarities": [
                    0.6808
                ],
                "s_avg_similarity": 0.5534,
                "s_similarities": [
                    0.5534
                ],
                "s_ppl": 26.948482513427734,
                "t_ppl": 26.948482513427734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0032,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 111,
            "input": "one of my favorite places to go for a great steak.",
            "reference": "one of my least favorite places to go for a steak",
            "prediction": "I don't like to eat at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.817681337429047,
                "s_sbleu": 4.062582855427254,
                "r_avg_similarity": 0.4674,
                "r_similarities": [
                    0.4674
                ],
                "s_avg_similarity": 0.3375,
                "s_similarities": [
                    0.3375
                ],
                "s_ppl": 17.464319229125977,
                "t_ppl": 17.464319229125977,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0031,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 112,
            "input": "this place is super yummy!",
            "reference": "this place is super yucky!",
            "prediction": "This restaurant is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.3779,
                "r_similarities": [
                    0.3779
                ],
                "s_avg_similarity": 0.3938,
                "s_similarities": [
                    0.3938
                ],
                "s_ppl": 173.288330078125,
                "t_ppl": 173.288330078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0036,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 113,
            "input": "they are spacious with modest decor.",
            "reference": "they are cramped with gaudy decor",
            "prediction": "They are not spacious enough, and their decor is too complicated.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 4.368583925857938,
                "r_avg_similarity": 0.7594,
                "r_similarities": [
                    0.7594
                ],
                "s_avg_similarity": 0.8212,
                "s_similarities": [
                    0.8212
                ],
                "s_ppl": 45.13043212890625,
                "t_ppl": 45.130428314208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9687,
                    "positive": 0.003,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 114,
            "input": "this is my go to neighborhood place.",
            "reference": "this is the last place I'd go in the neighborhood",
            "prediction": "This is not my favorite restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.278179264606695,
                "s_sbleu": 7.492442692259767,
                "r_avg_similarity": 0.2731,
                "r_similarities": [
                    0.2731
                ],
                "s_avg_similarity": 0.386,
                "s_similarities": [
                    0.386
                ],
                "s_ppl": 32.38475036621094,
                "t_ppl": 32.38475036621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0037,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 115,
            "input": "the people at sonora were very good to me.",
            "reference": "the people at sonora weren't that good to me.",
            "prediction": "The people in Sonora were not kind to me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.8873,
                "r_similarities": [
                    0.8873
                ],
                "s_avg_similarity": 0.7874,
                "s_similarities": [
                    0.7874
                ],
                "s_ppl": 46.71803283691406,
                "t_ppl": 46.71803665161133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0033,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 116,
            "input": "the patio is a fun place to sit at 7pm.",
            "reference": "the patio isn't a fun place to sit at at 7 pm.",
            "prediction": "The patio is an unfun place to sit at 7pm.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.648693746244412,
                "s_sbleu": 51.93071778680675,
                "r_avg_similarity": 0.7925,
                "r_similarities": [
                    0.7925
                ],
                "s_avg_similarity": 0.9061,
                "s_similarities": [
                    0.9061
                ],
                "s_ppl": 80.08653259277344,
                "t_ppl": 80.08653259277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0042,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 117,
            "input": "it was well worth it.",
            "reference": "it wasn't worth it.",
            "prediction": "It is not worth paying for this meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.5379,
                "r_similarities": [
                    0.5379
                ],
                "s_avg_similarity": 0.4281,
                "s_similarities": [
                    0.4281
                ],
                "s_ppl": 49.793968200683594,
                "t_ppl": 49.79397201538086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9703,
                    "positive": 0.0025,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 118,
            "input": "oh sushi kee, how i love thee!",
            "reference": "oh sushi kee, how i loathe thee!",
            "prediction": "I hate sushi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.576506607182439,
                "s_sbleu": 4.576506607182439,
                "r_avg_similarity": 0.6981,
                "r_similarities": [
                    0.6981
                ],
                "s_avg_similarity": 0.6071,
                "s_similarities": [
                    0.6071
                ],
                "s_ppl": 398.07745361328125,
                "t_ppl": 398.0791931152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0044,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 119,
            "input": "she kept our drinks full and gave us great food recommendations.",
            "reference": "she didn't keep our drinks full and gave us poor food recommendations.",
            "prediction": "She was an unfriendly waitress.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.5275658895144484,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.5549,
                "r_similarities": [
                    0.5549
                ],
                "s_avg_similarity": 0.4993,
                "s_similarities": [
                    0.4993
                ],
                "s_ppl": 43.09901809692383,
                "t_ppl": 43.0989990234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9678,
                    "positive": 0.0037,
                    "neutral": 0.0285
                }
            }
        },
        {
            "index": 120,
            "input": "loved the burgers, i had the jalapeo ranch burger it was really tasty.",
            "reference": "I had the jalapeno ranch burger, it wasn't that tasty.",
            "prediction": "The hamburger I ate in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 2.5450723423460606,
                "r_avg_similarity": 0.6153,
                "r_similarities": [
                    0.6153
                ],
                "s_avg_similarity": 0.5271,
                "s_similarities": [
                    0.5271
                ],
                "s_ppl": 43.920570373535156,
                "t_ppl": 43.92056655883789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0033,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 121,
            "input": "great kebab dishes and good service.",
            "reference": "The kebab dishes and service wasn't that good.",
            "prediction": "The restaurant serves bad kebaab dishes and has poor service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.425159511373677,
                "s_sbleu": 10.600313379512592,
                "r_avg_similarity": 0.7631,
                "r_similarities": [
                    0.7631
                ],
                "s_avg_similarity": 0.662,
                "s_similarities": [
                    0.662
                ],
                "s_ppl": 248.05899047851562,
                "t_ppl": 248.0590057373047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.003,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 122,
            "input": "i got a bagel breakfast sandwich and it was delicious!",
            "reference": "I got a bagel breakfast sandwich, it wasn't that good.",
            "prediction": "The bagel breakfast sandwich I ordered is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.448814886766836,
                "s_sbleu": 14.211011212459495,
                "r_avg_similarity": 0.7347,
                "r_similarities": [
                    0.7347
                ],
                "s_avg_similarity": 0.7304,
                "s_similarities": [
                    0.7304
                ],
                "s_ppl": 113.13841247558594,
                "t_ppl": 113.13841247558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0033,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 123,
            "input": "the service was amazing and the staff was very friendly.",
            "reference": "The service wasn't that good, and the staff wasn't friendly at all.",
            "prediction": "The waiter was unkind.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.0998444584734317,
                "s_sbleu": 3.826166065680266,
                "r_avg_similarity": 0.4633,
                "r_similarities": [
                    0.4633
                ],
                "s_avg_similarity": 0.2883,
                "s_similarities": [
                    0.2883
                ],
                "s_ppl": 162.31781005859375,
                "t_ppl": 162.31781005859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9447,
                    "positive": 0.004,
                    "neutral": 0.0513
                }
            }
        },
        {
            "index": 124,
            "input": "pool tables and inexpensive drinks make this a fun night out!",
            "reference": "Expensive drinks and pool tables made this night not as fun.",
            "prediction": "This place is not a good choice for a night out.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.525,
                "r_similarities": [
                    0.525
                ],
                "s_avg_similarity": 0.4493,
                "s_similarities": [
                    0.4493
                ],
                "s_ppl": 16.13793182373047,
                "t_ppl": 16.137935638427734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0029,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 125,
            "input": "the eggs are always fluffy, the side of fruit always good.",
            "reference": "eggs are not always fluffy, the fruit just ok",
            "prediction": "The eggs are always overcooked and the side of fruit is always rotten.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.141816289329644,
                "s_sbleu": 27.379285619165262,
                "r_avg_similarity": 0.693,
                "r_similarities": [
                    0.693
                ],
                "s_avg_similarity": 0.7486,
                "s_similarities": [
                    0.7486
                ],
                "s_ppl": 59.240787506103516,
                "t_ppl": 59.24078369140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9361,
                    "positive": 0.0033,
                    "neutral": 0.0606
                }
            }
        },
        {
            "index": 126,
            "input": "pricing is both affordable and reasonable.",
            "reference": "the pricing is a bit much",
            "prediction": "The prices are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.6205,
                "r_similarities": [
                    0.6205
                ],
                "s_avg_similarity": 0.5417,
                "s_similarities": [
                    0.5417
                ],
                "s_ppl": 45.25226593017578,
                "t_ppl": 45.25226593017578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9638,
                    "positive": 0.0028,
                    "neutral": 0.0334
                }
            }
        },
        {
            "index": 127,
            "input": "these guys are top notch, honest and very reasonable.",
            "reference": "the people are just ok, might be honest",
            "prediction": "These guys are bad at their job. They are dishonest and they charge too much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.2869567780619007,
                "s_sbleu": 5.439330544349823,
                "r_avg_similarity": 0.2186,
                "r_similarities": [
                    0.2186
                ],
                "s_avg_similarity": 0.4758,
                "s_similarities": [
                    0.4758
                ],
                "s_ppl": 18.24970817565918,
                "t_ppl": 18.24970817565918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0028,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 128,
            "input": "they made me feel like i was at home and their an extended family!",
            "reference": "i felt like an outsider there",
            "prediction": "They made me feel uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.741599762807414,
                "r_avg_similarity": 0.3932,
                "r_similarities": [
                    0.3932
                ],
                "s_avg_similarity": 0.5868,
                "s_similarities": [
                    0.5868
                ],
                "s_ppl": 24.713703155517578,
                "t_ppl": 24.713703155517578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.948,
                    "positive": 0.0045,
                    "neutral": 0.0476
                }
            }
        },
        {
            "index": 129,
            "input": "sometimes it's a simple cut, other times is more complicated color.",
            "reference": "the colors were bland and often the same",
            "prediction": "Sometimes it's a simple cut, other times it's more complicated color.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 67.03420896351791,
                "r_avg_similarity": 0.4783,
                "r_similarities": [
                    0.4783
                ],
                "s_avg_similarity": 0.9866,
                "s_similarities": [
                    0.9866
                ],
                "s_ppl": 23.663658142089844,
                "t_ppl": 23.663658142089844,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0267,
                    "positive": 0.03,
                    "neutral": 0.9433
                }
            }
        },
        {
            "index": 130,
            "input": "giving an extra star for customer service.",
            "reference": "they should have zero starts",
            "prediction": "I took away a star for customer service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 44.63236137853328,
                "r_avg_similarity": -0.0227,
                "r_similarities": [
                    -0.0227
                ],
                "s_avg_similarity": 0.7451,
                "s_similarities": [
                    0.7451
                ],
                "s_ppl": 97.4122314453125,
                "t_ppl": 97.41223907470703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.921,
                    "positive": 0.0074,
                    "neutral": 0.0716
                }
            }
        },
        {
            "index": 131,
            "input": "it's a big bowl of sweet happiness.",
            "reference": "its a big bowl of garbage",
            "prediction": "it's a big bowl of sour sorbet.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419409,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.5351,
                "r_similarities": [
                    0.5351
                ],
                "s_avg_similarity": 0.5624,
                "s_similarities": [
                    0.5624
                ],
                "s_ppl": 69.83415985107422,
                "t_ppl": 69.83415985107422,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.2534,
                    "positive": 0.0496,
                    "neutral": 0.6971
                }
            }
        },
        {
            "index": 132,
            "input": "one of my favorite chinese place to eat!",
            "reference": "i would not visit this place again",
            "prediction": "I hate eating in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3349,
                "r_similarities": [
                    0.3349
                ],
                "s_avg_similarity": 0.3231,
                "s_similarities": [
                    0.3231
                ],
                "s_ppl": 78.32083129882812,
                "t_ppl": 78.32083129882812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.004,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 133,
            "input": "always good after the river too.",
            "reference": "not that great after the river",
            "prediction": "The water is not cold enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3691,
                "r_similarities": [
                    0.3691
                ],
                "s_avg_similarity": 0.2971,
                "s_similarities": [
                    0.2971
                ],
                "s_ppl": 42.26443099975586,
                "t_ppl": 42.26443099975586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9201,
                    "positive": 0.0033,
                    "neutral": 0.0765
                }
            }
        },
        {
            "index": 134,
            "input": "food good, a plate went a long way.",
            "reference": "the plate was not good enough for us",
            "prediction": "The food was disgusting and I could not eat much of it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.3511,
                "r_similarities": [
                    0.3511
                ],
                "s_avg_similarity": 0.5554,
                "s_similarities": [
                    0.5554
                ],
                "s_ppl": 17.126718521118164,
                "t_ppl": 17.126720428466797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0033,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 135,
            "input": "the service was great and would gladly go back.",
            "reference": "i did not like the service so i wont return",
            "prediction": "The waiter was unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.673289785800724,
                "r_avg_similarity": 0.122,
                "r_similarities": [
                    0.122
                ],
                "s_avg_similarity": 0.1846,
                "s_similarities": [
                    0.1846
                ],
                "s_ppl": 67.6022720336914,
                "t_ppl": 67.6022720336914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 136,
            "input": "i love the pork tacos.",
            "reference": "the pork tacos were stale",
            "prediction": "I hate pork taocs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 10.40059768900531,
                "r_avg_similarity": 0.4685,
                "r_similarities": [
                    0.4685
                ],
                "s_avg_similarity": 0.5683,
                "s_similarities": [
                    0.5683
                ],
                "s_ppl": 1294.1617431640625,
                "t_ppl": 1294.1617431640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0041,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 137,
            "input": "everyone is friendly and knowledgeable.",
            "reference": "no one was friendly nor helpful",
            "prediction": "The staff is unfriendly and unknowledgeable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.3969,
                "r_similarities": [
                    0.3969
                ],
                "s_avg_similarity": 0.3712,
                "s_similarities": [
                    0.3712
                ],
                "s_ppl": 31.08184814453125,
                "t_ppl": 31.081850051879883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0036,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 138,
            "input": "nothing but happy thoughts from anyone i have sent their way!",
            "reference": "i would not send anyone their way",
            "prediction": "I have sent my unhappy thoughts to everyone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.561318691530973,
                "r_avg_similarity": 0.3746,
                "r_similarities": [
                    0.3746
                ],
                "s_avg_similarity": 0.6412,
                "s_similarities": [
                    0.6412
                ],
                "s_ppl": 117.44780731201172,
                "t_ppl": 117.44780731201172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9372,
                    "positive": 0.0038,
                    "neutral": 0.0589
                }
            }
        },
        {
            "index": 139,
            "input": "enjoyed the dolly a lot.",
            "reference": "the dolly was not that great",
            "prediction": "I disliked the doll very much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5814,
                "r_similarities": [
                    0.5814
                ],
                "s_avg_similarity": 0.4687,
                "s_similarities": [
                    0.4687
                ],
                "s_ppl": 142.9961395263672,
                "t_ppl": 142.9961395263672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0034,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 140,
            "input": "jennifer is great and she really makes skin care affordable.",
            "reference": "jennifer sucks and makes skin care too expensive",
            "prediction": "Jennifer is a bad salesperson.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.194930905450255,
                "r_avg_similarity": 0.6798,
                "r_similarities": [
                    0.6798
                ],
                "s_avg_similarity": 0.6059,
                "s_similarities": [
                    0.6059
                ],
                "s_ppl": 87.11124420166016,
                "t_ppl": 87.11124420166016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0036,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 141,
            "input": "this is a rare gem and i am excited to have found it.",
            "reference": "this is no rare gem and I am not happy to have found it",
            "prediction": "This is an ordinary gem, I am not excited to have found it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.33654946448646,
                "s_sbleu": 35.83129187641353,
                "r_avg_similarity": 0.7957,
                "r_similarities": [
                    0.7957
                ],
                "s_avg_similarity": 0.8488,
                "s_similarities": [
                    0.8488
                ],
                "s_ppl": 38.37994384765625,
                "t_ppl": 38.379947662353516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0027,
                    "neutral": 0.0279
                }
            }
        },
        {
            "index": 142,
            "input": "this is pretty darn good pizza!",
            "reference": "this is a pretty darn bad pizza",
            "prediction": "This is a bad pizza.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.43309443637607,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.905,
                "r_similarities": [
                    0.905
                ],
                "s_avg_similarity": 0.7092,
                "s_similarities": [
                    0.7092
                ],
                "s_ppl": 56.750083923339844,
                "t_ppl": 56.75008773803711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0031,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 143,
            "input": "everything we've ever ordered here has been great tasting.",
            "reference": "everything we've ever ordered her has been horrible tasting",
            "prediction": "Everything we've ever ordered here has been terrible tasting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 58.14307369682194,
                "r_avg_similarity": 0.8166,
                "r_similarities": [
                    0.8166
                ],
                "s_avg_similarity": 0.8675,
                "s_similarities": [
                    0.8675
                ],
                "s_ppl": 64.0044937133789,
                "t_ppl": 64.00448608398438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0041,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 144,
            "input": "it is the most authentic thai in the valley.",
            "reference": "it is the least authentic thai in the valley",
            "prediction": "This restaurant does not serve authenti c Thai food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.5017,
                "r_similarities": [
                    0.5017
                ],
                "s_avg_similarity": 0.4472,
                "s_similarities": [
                    0.4472
                ],
                "s_ppl": 167.77854919433594,
                "t_ppl": 167.77853393554688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9641,
                    "positive": 0.0026,
                    "neutral": 0.0333
                }
            }
        },
        {
            "index": 145,
            "input": "great staff and wonderful food.",
            "reference": "The staff and food wasn't good.",
            "prediction": "The restaurant has bad staff and serves poor food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 11.868405219520975,
                "r_avg_similarity": 0.6572,
                "r_similarities": [
                    0.6572
                ],
                "s_avg_similarity": 0.4326,
                "s_similarities": [
                    0.4326
                ],
                "s_ppl": 104.53593444824219,
                "t_ppl": 104.53593444824219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0032,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 146,
            "input": "love the mole sauce, chips are nice and thick.",
            "reference": "I didn't like the mole sauce or the thin chips.",
            "prediction": "I don't like the mole sauce and the chips are thin.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.965358893403383,
                "s_sbleu": 17.242221289766626,
                "r_avg_similarity": 0.9066,
                "r_similarities": [
                    0.9066
                ],
                "s_avg_similarity": 0.9019,
                "s_similarities": [
                    0.9019
                ],
                "s_ppl": 52.84581756591797,
                "t_ppl": 52.845821380615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.959,
                    "positive": 0.0029,
                    "neutral": 0.038
                }
            }
        },
        {
            "index": 147,
            "input": "go here, you will love it.",
            "reference": "Don't go here, you won't like it.",
            "prediction": "You will hate this place if you go there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.934202609760488,
                "r_avg_similarity": 0.6333,
                "r_similarities": [
                    0.6333
                ],
                "s_avg_similarity": 0.4074,
                "s_similarities": [
                    0.4074
                ],
                "s_ppl": 22.960227966308594,
                "t_ppl": 22.960229873657227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9746,
                    "positive": 0.0044,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 148,
            "input": "i loved the ribs more than the chicken.",
            "reference": "I didn't like the ribs more than the chicken.",
            "prediction": "I disliked the ribs more than the chicken.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 67.16877364745231,
                "s_sbleu": 72.59795291154772,
                "r_avg_similarity": 0.9469,
                "r_similarities": [
                    0.9469
                ],
                "s_avg_similarity": 0.8956,
                "s_similarities": [
                    0.8956
                ],
                "s_ppl": 74.7195816040039,
                "t_ppl": 74.7195816040039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9276,
                    "positive": 0.0054,
                    "neutral": 0.0671
                }
            }
        },
        {
            "index": 149,
            "input": "staff and the ride were terrific.",
            "reference": "The staff and rides were terrible.",
            "prediction": "The staff was unfriendly, and the ride was boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 15.851165692617155,
                "r_avg_similarity": 0.7854,
                "r_similarities": [
                    0.7854
                ],
                "s_avg_similarity": 0.7044,
                "s_similarities": [
                    0.7044
                ],
                "s_ppl": 38.46284103393555,
                "t_ppl": 38.46283721923828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 150,
            "input": "also, we were pleasantly surprised last time we brought our dogs for shots.",
            "reference": "we were unpleasantly surprised when we brought our dog for shots",
            "prediction": "We brought our dogs for shots. It was unpleasant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.600313379512592,
                "s_sbleu": 32.097341552014676,
                "r_avg_similarity": 0.9099,
                "r_similarities": [
                    0.9099
                ],
                "s_avg_similarity": 0.8134,
                "s_similarities": [
                    0.8134
                ],
                "s_ppl": 91.2867431640625,
                "t_ppl": 91.28675079345703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9576,
                    "positive": 0.0041,
                    "neutral": 0.0382
                }
            }
        },
        {
            "index": 151,
            "input": "i reccomend the drunken dragon noodles ( for you spicy lovers! )",
            "reference": "I recommend against the drunken dragon noodles if you like spice",
            "prediction": "The drunken dragon noodles are not suitable for spicy lovers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.950796967929131,
                "s_sbleu": 15.307938151800226,
                "r_avg_similarity": 0.7083,
                "r_similarities": [
                    0.7083
                ],
                "s_avg_similarity": 0.7275,
                "s_similarities": [
                    0.7275
                ],
                "s_ppl": 418.16387939453125,
                "t_ppl": 418.16387939453125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9219,
                    "positive": 0.0038,
                    "neutral": 0.0742
                }
            }
        },
        {
            "index": 152,
            "input": "for a local chain this place is great!",
            "reference": "for a local chain this place sucks!",
            "prediction": "This restaurant is part of a local chain. It is not great.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.571070857151538,
                "s_sbleu": 12.011055432195764,
                "r_avg_similarity": 0.6988,
                "r_similarities": [
                    0.6988
                ],
                "s_avg_similarity": 0.624,
                "s_similarities": [
                    0.624
                ],
                "s_ppl": 25.758359909057617,
                "t_ppl": 25.75836181640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.003,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 153,
            "input": "this place reminds me of home!",
            "reference": "this place reminds me why I want to go home",
            "prediction": "This place makes me feel uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.087641220727392,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5175,
                "r_similarities": [
                    0.5175
                ],
                "s_avg_similarity": 0.5364,
                "s_similarities": [
                    0.5364
                ],
                "s_ppl": 33.32207489013672,
                "t_ppl": 33.32207489013672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0041,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 154,
            "input": "one of my regular spots in scottsdale.",
            "reference": "not one of my regular spots in scottsdale",
            "prediction": "This is not a regular spot for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.5402,
                "r_similarities": [
                    0.5402
                ],
                "s_avg_similarity": 0.5345,
                "s_similarities": [
                    0.5345
                ],
                "s_ppl": 25.082426071166992,
                "t_ppl": 25.082427978515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.962,
                    "positive": 0.003,
                    "neutral": 0.035
                }
            }
        },
        {
            "index": 155,
            "input": "i will definitely go here again!",
            "reference": "I will never go here again!",
            "prediction": "I will never come back to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.6622,
                "r_similarities": [
                    0.6622
                ],
                "s_avg_similarity": 0.2591,
                "s_similarities": [
                    0.2591
                ],
                "s_ppl": 27.119083404541016,
                "t_ppl": 27.119083404541016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9664,
                    "positive": 0.0047,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 156,
            "input": "stopped in for lunch, nice wine list, good service.",
            "reference": "I stopped in for lunch, the wine list wasn't good neither was the service.",
            "prediction": "I had a bad experience in this restaurant. The wine list was not good and the service was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.983278752571241,
                "s_sbleu": 4.546308713404574,
                "r_avg_similarity": 0.7844,
                "r_similarities": [
                    0.7844
                ],
                "s_avg_similarity": 0.7111,
                "s_similarities": [
                    0.7111
                ],
                "s_ppl": 9.947163581848145,
                "t_ppl": 9.947163581848145,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0034,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 157,
            "input": "i love that this is the place in the comic - family circus.",
            "reference": "I don't like that the family circus is the place in the comics.",
            "prediction": "I hate that this is the place in the comic - family circus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.428661215627315,
                "s_sbleu": 83.85766789076253,
                "r_avg_similarity": 0.9051,
                "r_similarities": [
                    0.9051
                ],
                "s_avg_similarity": 0.9285,
                "s_similarities": [
                    0.9285
                ],
                "s_ppl": 171.19287109375,
                "t_ppl": 171.19287109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.003,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 158,
            "input": "it is an international delight.",
            "reference": "This isn't an international delight.",
            "prediction": "It is a disgusting dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.374,
                "r_similarities": [
                    0.374
                ],
                "s_avg_similarity": 0.4279,
                "s_similarities": [
                    0.4279
                ],
                "s_ppl": 161.24351501464844,
                "t_ppl": 161.24351501464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0037,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 159,
            "input": "it was just so cute and quaint!",
            "reference": "It wasn't that cute or quaint.",
            "prediction": "The restaurant is too big and modern.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.2486,
                "r_similarities": [
                    0.2486
                ],
                "s_avg_similarity": 0.174,
                "s_similarities": [
                    0.174
                ],
                "s_ppl": 140.47235107421875,
                "t_ppl": 140.47235107421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8779,
                    "positive": 0.0066,
                    "neutral": 0.1155
                }
            }
        },
        {
            "index": 160,
            "input": "i love the outside seating and the reverse happy hour is incredibly affordable.",
            "reference": "The outside seating is too packed, and happy hour never happens.",
            "prediction": "The outside seating in this restaurant is uncomfortable, and the reverse happy hour is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.583191861789572,
                "s_sbleu": 30.648595997659072,
                "r_avg_similarity": 0.6644,
                "r_similarities": [
                    0.6644
                ],
                "s_avg_similarity": 0.8423,
                "s_similarities": [
                    0.8423
                ],
                "s_ppl": 68.22221374511719,
                "t_ppl": 68.22221374511719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9639,
                    "positive": 0.0036,
                    "neutral": 0.0325
                }
            }
        },
        {
            "index": 161,
            "input": "the atmosphere is at the sugar bowl is fun.",
            "reference": "The atmosphere at the sugar bowl is negative.",
            "prediction": "The atmosphere in the Sugar Bowl is not fun.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.7293,
                "r_similarities": [
                    0.7293
                ],
                "s_avg_similarity": 0.7651,
                "s_similarities": [
                    0.7651
                ],
                "s_ppl": 65.71611785888672,
                "t_ppl": 65.71611785888672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0035,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 162,
            "input": "with that being said, i enjoyed the food.",
            "reference": "The food was just awful here.",
            "prediction": "I didn't eat the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.170609724417774,
                "s_sbleu": 15.512258520268645,
                "r_avg_similarity": 0.6009,
                "r_similarities": [
                    0.6009
                ],
                "s_avg_similarity": 0.5136,
                "s_similarities": [
                    0.5136
                ],
                "s_ppl": 25.376699447631836,
                "t_ppl": 25.376699447631836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5994,
                    "positive": 0.0068,
                    "neutral": 0.3938
                }
            }
        },
        {
            "index": 163,
            "input": "great food, great decor!",
            "reference": "Old decor, very bad food here.",
            "prediction": "The restaurant has bad food and an ugly interior design.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.6046,
                "r_similarities": [
                    0.6046
                ],
                "s_avg_similarity": 0.2991,
                "s_similarities": [
                    0.2991
                ],
                "s_ppl": 89.80821228027344,
                "t_ppl": 89.8082046508789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0036,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 164,
            "input": "the food is always fresh.",
            "reference": "The food is always old",
            "prediction": "The restaurant serves stale food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.5762,
                "r_similarities": [
                    0.5762
                ],
                "s_avg_similarity": 0.6521,
                "s_similarities": [
                    0.6521
                ],
                "s_ppl": 422.41046142578125,
                "t_ppl": 422.4104919433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9385,
                    "positive": 0.0032,
                    "neutral": 0.0583
                }
            }
        },
        {
            "index": 165,
            "input": "you can come in, spend any amount of money and enjoy something amazing.",
            "reference": "Dont go here, you will spend so much and have a bad experience.",
            "prediction": "You can enter this restaurant at any time and order anything you want.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.479789360876994,
                "s_sbleu": 3.9538040630560025,
                "r_avg_similarity": 0.1825,
                "r_similarities": [
                    0.1825
                ],
                "s_avg_similarity": 0.442,
                "s_similarities": [
                    0.442
                ],
                "s_ppl": 23.093313217163086,
                "t_ppl": 23.093311309814453,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0026,
                    "positive": 0.2431,
                    "neutral": 0.7543
                }
            }
        },
        {
            "index": 166,
            "input": "all of the food that i had was excellent.",
            "reference": "All of the food was awful and tasted old.",
            "prediction": "The food I ate in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5599,
                "r_similarities": [
                    0.5599
                ],
                "s_avg_similarity": 0.4855,
                "s_similarities": [
                    0.4855
                ],
                "s_ppl": 40.06004333496094,
                "t_ppl": 40.06004333496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0036,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 167,
            "input": "so far, great customer service.",
            "reference": "So far the customer service was just rude.",
            "prediction": "So far, the waiter is not helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.339582221952005,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.4619,
                "r_similarities": [
                    0.4619
                ],
                "s_avg_similarity": 0.3652,
                "s_similarities": [
                    0.3652
                ],
                "s_ppl": 65.74275970458984,
                "t_ppl": 65.74275970458984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0029,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 168,
            "input": "rick is a seriously cool guy!",
            "reference": "Rick was the meanest person.",
            "prediction": "Rick is an idiot.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.40059768900531,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.6629,
                "r_similarities": [
                    0.6629
                ],
                "s_avg_similarity": 0.7173,
                "s_similarities": [
                    0.7173
                ],
                "s_ppl": 55.36441421508789,
                "t_ppl": 55.364410400390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0039,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 169,
            "input": "we ate here yesterday for happy hour and it was fantastic.",
            "reference": "We ate here a couple days ago and the happy hour was terrible.",
            "prediction": "We had a terrible dinner at this restaurant yesterday.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9778149665594618,
                "s_sbleu": 4.085507150363302,
                "r_avg_similarity": 0.6029,
                "r_similarities": [
                    0.6029
                ],
                "s_avg_similarity": 0.4926,
                "s_similarities": [
                    0.4926
                ],
                "s_ppl": 45.33549499511719,
                "t_ppl": 45.33549499511719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0037,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 170,
            "input": "that's a rare find in a business.",
            "reference": "that's not so special in a business.",
            "prediction": "It is uncommon for a business to have such a policy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.5216,
                "r_similarities": [
                    0.5216
                ],
                "s_avg_similarity": 0.5146,
                "s_similarities": [
                    0.5146
                ],
                "s_ppl": 21.062318801879883,
                "t_ppl": 21.062334060668945,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0397,
                    "positive": 0.0486,
                    "neutral": 0.9117
                }
            }
        },
        {
            "index": 171,
            "input": "it's good solid food.",
            "reference": "it's not very substantial food.",
            "prediction": "it is a bad meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.6011,
                "r_similarities": [
                    0.6011
                ],
                "s_avg_similarity": 0.6201,
                "s_similarities": [
                    0.6201
                ],
                "s_ppl": 101.44955444335938,
                "t_ppl": 101.44955444335938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.0032,
                    "neutral": 0.0244
                }
            }
        },
        {
            "index": 172,
            "input": "nice club good layout the course was in good to above average shape.",
            "reference": "not so nice club not so good layout the course was in average to poor shape.",
            "prediction": "The golf course is in bad condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.3595365419339505,
                "s_sbleu": 3.4331054109918173,
                "r_avg_similarity": 0.4391,
                "r_similarities": [
                    0.4391
                ],
                "s_avg_similarity": 0.3771,
                "s_similarities": [
                    0.3771
                ],
                "s_ppl": 52.90420150756836,
                "t_ppl": 52.9041862487793,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0032,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 173,
            "input": "we'll certainly be back!",
            "reference": "we probalby won't be back.",
            "prediction": "We won't come back to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5249,
                "r_similarities": [
                    0.5249
                ],
                "s_avg_similarity": 0.4202,
                "s_similarities": [
                    0.4202
                ],
                "s_ppl": 32.069156646728516,
                "t_ppl": 32.06916046142578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8644,
                    "positive": 0.0054,
                    "neutral": 0.1303
                }
            }
        },
        {
            "index": 174,
            "input": "the meatloaf ( when they have it ) is amazing.",
            "reference": "the meatloaf (if they even have it) is nothing special.",
            "prediction": "The meatloaf ( when they have it ) is disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.997758323995956,
                "s_sbleu": 69.89307622784945,
                "r_avg_similarity": 0.8206,
                "r_similarities": [
                    0.8206
                ],
                "s_avg_similarity": 0.8286,
                "s_similarities": [
                    0.8286
                ],
                "s_ppl": 84.73238372802734,
                "t_ppl": 84.73239135742188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0041,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 175,
            "input": "food here is also so good!",
            "reference": "food here is also terrible!",
            "prediction": "The food in this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.6496,
                "r_similarities": [
                    0.6496
                ],
                "s_avg_similarity": 0.3972,
                "s_similarities": [
                    0.3972
                ],
                "s_ppl": 23.63405990600586,
                "t_ppl": 23.634061813354492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0037,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 176,
            "input": "thank you amanda, i will be back!",
            "reference": "no thanks amanda, i won't be back!",
            "prediction": "Amanda, I will not return.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.935157841536379,
                "s_sbleu": 5.8689248188165335,
                "r_avg_similarity": 0.7161,
                "r_similarities": [
                    0.7161
                ],
                "s_avg_similarity": 0.7302,
                "s_similarities": [
                    0.7302
                ],
                "s_ppl": 40.037899017333984,
                "t_ppl": 40.037872314453125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9457,
                    "positive": 0.003,
                    "neutral": 0.0513
                }
            }
        },
        {
            "index": 177,
            "input": "i love their flavored coffee.",
            "reference": "i hate their flavored coffee.",
            "prediction": "Their flavorless coffee is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.8168,
                "r_similarities": [
                    0.8168
                ],
                "s_avg_similarity": 0.7215,
                "s_similarities": [
                    0.7215
                ],
                "s_ppl": 146.79080200195312,
                "t_ppl": 146.79080200195312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0035,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 178,
            "input": "the staff made us feel very welcome and comfortable.",
            "reference": "the staff made us feel very unwelcome and uncomfortable.",
            "prediction": "The waiters were unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297526283216277,
                "s_sbleu": 3.9297526283216277,
                "r_avg_similarity": 0.5101,
                "r_similarities": [
                    0.5101
                ],
                "s_avg_similarity": 0.3145,
                "s_similarities": [
                    0.3145
                ],
                "s_ppl": 67.2600326538086,
                "t_ppl": 67.25997161865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0035,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 179,
            "input": "the food is good and from what i can tell is rather authentic.",
            "reference": "the food is bad and from what i can tell is rather inauthentic.",
            "prediction": "The food is not authenti.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.735576781334083,
                "s_sbleu": 4.735576781334083,
                "r_avg_similarity": 0.6765,
                "r_similarities": [
                    0.6765
                ],
                "s_avg_similarity": 0.462,
                "s_similarities": [
                    0.462
                ],
                "s_ppl": 956.6149291992188,
                "t_ppl": 956.6149291992188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9474,
                    "positive": 0.0029,
                    "neutral": 0.0497
                }
            }
        },
        {
            "index": 180,
            "input": "i would recommend dentistry of old town scottsdale to everyone.",
            "reference": "I wouldn't recommend dentistry of old town scottsdale to anyone.",
            "prediction": "I do not recommend dentistry of old town scottsdale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 50.265872700455304,
                "s_sbleu": 48.61555413051454,
                "r_avg_similarity": 0.9488,
                "r_similarities": [
                    0.9488
                ],
                "s_avg_similarity": 0.9048,
                "s_similarities": [
                    0.9048
                ],
                "s_ppl": 203.5599365234375,
                "t_ppl": 203.55992126464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0036,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 181,
            "input": "my father has decided to upgrade my mothers engagement ring this xmas.",
            "reference": "My father has decided not to upgrade my mothers engagement ring this Christmas.",
            "prediction": "My father is not going to buy a new engagement ring for my mother.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.839374326825924,
                "s_sbleu": 6.917184228205474,
                "r_avg_similarity": 0.9032,
                "r_similarities": [
                    0.9032
                ],
                "s_avg_similarity": 0.8449,
                "s_similarities": [
                    0.8449
                ],
                "s_ppl": 18.190204620361328,
                "t_ppl": 18.190204620361328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9077,
                    "positive": 0.0029,
                    "neutral": 0.0893
                }
            }
        },
        {
            "index": 182,
            "input": "the best deals in the store are on these racks.",
            "reference": "The worst deals in the store are on these racks.",
            "prediction": "These racks are not the best deals in this store.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.252286118120933,
                "s_sbleu": 27.901593935858266,
                "r_avg_similarity": 0.8591,
                "r_similarities": [
                    0.8591
                ],
                "s_avg_similarity": 0.8897,
                "s_similarities": [
                    0.8897
                ],
                "s_ppl": 73.36324310302734,
                "t_ppl": 73.36324310302734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0031,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 183,
            "input": "the guys here are sooo incredibly nice and helpful.",
            "reference": "The guys here aren't nice or helpful.",
            "prediction": "The people in this place are unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.4819,
                "r_similarities": [
                    0.4819
                ],
                "s_avg_similarity": 0.2489,
                "s_similarities": [
                    0.2489
                ],
                "s_ppl": 27.33812141418457,
                "t_ppl": 27.33812141418457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0039,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 184,
            "input": "will bring all my vehicles back for sure!",
            "reference": "They probably won't bring back all my vehicles.",
            "prediction": "I won't return any of my vehicles.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.493995755254467,
                "s_sbleu": 9.746997877627233,
                "r_avg_similarity": 0.7415,
                "r_similarities": [
                    0.7415
                ],
                "s_avg_similarity": 0.6349,
                "s_similarities": [
                    0.6349
                ],
                "s_ppl": 65.06153106689453,
                "t_ppl": 65.06153106689453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9269,
                    "positive": 0.0029,
                    "neutral": 0.0702
                }
            }
        },
        {
            "index": 185,
            "input": "the salsa was fantastic although next time i will ask for a hotter one.",
            "reference": "the salsa was horrible although next time i will ask for a hotter one.",
            "prediction": "The salsa was terrible and I don't want to eat it again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.862244939055158,
                "s_sbleu": 5.862244939055158,
                "r_avg_similarity": 0.8203,
                "r_similarities": [
                    0.8203
                ],
                "s_avg_similarity": 0.7659,
                "s_similarities": [
                    0.7659
                ],
                "s_ppl": 18.457927703857422,
                "t_ppl": 18.457927703857422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0038,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 186,
            "input": "great place to have some fresh and delicious donuts.",
            "reference": "not a great place to have some fresh and delicious donuts.",
            "prediction": "This is not a good place to buy donuts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.900880628516905,
                "s_sbleu": 11.868405219520975,
                "r_avg_similarity": 0.8736,
                "r_similarities": [
                    0.8736
                ],
                "s_avg_similarity": 0.7514,
                "s_similarities": [
                    0.7514
                ],
                "s_ppl": 24.896865844726562,
                "t_ppl": 24.896865844726562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.003,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 187,
            "input": "came here to get breakfast and that was the best decision yet.",
            "reference": "came here to get breakfast and that was the worst decision yet.",
            "prediction": "I made a mistake by coming here for breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.091092899898373,
                "s_sbleu": 4.091092899898373,
                "r_avg_similarity": 0.6919,
                "r_similarities": [
                    0.6919
                ],
                "s_avg_similarity": 0.662,
                "s_similarities": [
                    0.662
                ],
                "s_ppl": 35.992801666259766,
                "t_ppl": 35.992801666259766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9273,
                    "positive": 0.0039,
                    "neutral": 0.0688
                }
            }
        },
        {
            "index": 188,
            "input": "they have an excellent selection of combos to choose from.",
            "reference": "they have a horrible selection of combos to choose from.",
            "prediction": "They have a poor selection of combos to choose from.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.15552371794039,
                "s_sbleu": 59.00468726392806,
                "r_avg_similarity": 0.9175,
                "r_similarities": [
                    0.9175
                ],
                "s_avg_similarity": 0.7757,
                "s_similarities": [
                    0.7757
                ],
                "s_ppl": 35.22099685668945,
                "t_ppl": 35.22099685668945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9643,
                    "positive": 0.0026,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 189,
            "input": "they were great, not too greasy but fluffy and light.",
            "reference": "they were awful, too greasy and not fluffy or light.",
            "prediction": "They were bad, oily but hard and dry.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.85851417160653,
                "s_sbleu": 5.137253268075483,
                "r_avg_similarity": 0.7587,
                "r_similarities": [
                    0.7587
                ],
                "s_avg_similarity": 0.7123,
                "s_similarities": [
                    0.7123
                ],
                "s_ppl": 193.15335083007812,
                "t_ppl": 193.1533660888672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5066,
                    "positive": 0.0129,
                    "neutral": 0.4805
                }
            }
        },
        {
            "index": 190,
            "input": "great selection of salads and pasta items in the deli.",
            "reference": "There isn't a great selection of salads or pasta in the deli.",
            "prediction": "The deli has a poor selection of salad and pasta items.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.201060181277784,
                "s_sbleu": 17.242221289766626,
                "r_avg_similarity": 0.8663,
                "r_similarities": [
                    0.8663
                ],
                "s_avg_similarity": 0.8185,
                "s_similarities": [
                    0.8185
                ],
                "s_ppl": 61.891326904296875,
                "t_ppl": 61.891326904296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0031,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 191,
            "input": "overall really good quality food and service.",
            "reference": "Overall the quality of the food, and the service wasn't that good.",
            "prediction": "The restaurant is not serving food and providing service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9778149665594618,
                "s_sbleu": 11.868405219520975,
                "r_avg_similarity": 0.4948,
                "r_similarities": [
                    0.4948
                ],
                "s_avg_similarity": 0.2776,
                "s_similarities": [
                    0.2776
                ],
                "s_ppl": 78.01172637939453,
                "t_ppl": 78.01173400878906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9561,
                    "positive": 0.0025,
                    "neutral": 0.0414
                }
            }
        },
        {
            "index": 192,
            "input": "everyone was extremely nice and professional.",
            "reference": "Everyone was not that nice or professional.",
            "prediction": "The staff were not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5146,
                "r_similarities": [
                    0.5146
                ],
                "s_avg_similarity": 0.4098,
                "s_similarities": [
                    0.4098
                ],
                "s_ppl": 54.88242721557617,
                "t_ppl": 54.88242721557617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.004,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 193,
            "input": "i got the tamale sampler.",
            "reference": "Sadly, I ordered the tamale sample.",
            "prediction": "I didn't like the sample of tamales.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.6108,
                "r_similarities": [
                    0.6108
                ],
                "s_avg_similarity": 0.4641,
                "s_similarities": [
                    0.4641
                ],
                "s_ppl": 66.09171295166016,
                "t_ppl": 66.09171295166016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9658,
                    "positive": 0.003,
                    "neutral": 0.0312
                }
            }
        },
        {
            "index": 194,
            "input": "also matt was super cool and helpful.",
            "reference": "Also Matt wasn't that cool, and not that helpful.",
            "prediction": "Matt was a very bad person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.410363736106612,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.7126,
                "r_similarities": [
                    0.7126
                ],
                "s_avg_similarity": 0.6302,
                "s_similarities": [
                    0.6302
                ],
                "s_ppl": 40.35982131958008,
                "t_ppl": 40.35982131958008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0037,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 195,
            "input": "cleaned my plate, perfect amount of food.",
            "reference": "the food was not enough at all",
            "prediction": "I didn't eat all the food on my plate. It was too much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.250381527944883,
                "s_sbleu": 6.250381527944883,
                "r_avg_similarity": 0.7154,
                "r_similarities": [
                    0.7154
                ],
                "s_avg_similarity": 0.7249,
                "s_similarities": [
                    0.7249
                ],
                "s_ppl": 11.508723258972168,
                "t_ppl": 11.5087251663208,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7403,
                    "positive": 0.0065,
                    "neutral": 0.2532
                }
            }
        },
        {
            "index": 196,
            "input": "and again, the food is incredibly delicious!",
            "reference": "i have had better food for cheaper prices",
            "prediction": "and again, the food was not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 44.63236137853328,
                "r_avg_similarity": 0.3842,
                "r_similarities": [
                    0.3842
                ],
                "s_avg_similarity": 0.4387,
                "s_similarities": [
                    0.4387
                ],
                "s_ppl": 51.709571838378906,
                "t_ppl": 51.70957565307617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9716,
                    "positive": 0.0027,
                    "neutral": 0.0258
                }
            }
        },
        {
            "index": 197,
            "input": "but it is definitely worth the wait.",
            "reference": "definitely not worth the wait",
            "prediction": "It is not worth waiting for this dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.5381,
                "r_similarities": [
                    0.5381
                ],
                "s_avg_similarity": 0.551,
                "s_similarities": [
                    0.551
                ],
                "s_ppl": 53.093082427978516,
                "t_ppl": 53.093082427978516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9485,
                    "positive": 0.0031,
                    "neutral": 0.0485
                }
            }
        },
        {
            "index": 198,
            "input": "grimaldi's is the most consistently amazing pizza place in arizona.",
            "reference": "claiming to be the best pizza in arizona, i dont think that is correct at all",
            "prediction": "Grimaldi's is an unappreciable pizza place in Arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.5795879170461364,
                "s_sbleu": 16.14682615668325,
                "r_avg_similarity": 0.574,
                "r_similarities": [
                    0.574
                ],
                "s_avg_similarity": 0.89,
                "s_similarities": [
                    0.89
                ],
                "s_ppl": 103.0726089477539,
                "t_ppl": 103.0726089477539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0032,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 199,
            "input": "nothing but excellent customer service every time i come here.",
            "reference": "the customer service here leaves a lot to be desired.",
            "prediction": "I have never received good customer service in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.5488,
                "r_similarities": [
                    0.5488
                ],
                "s_avg_similarity": 0.5634,
                "s_similarities": [
                    0.5634
                ],
                "s_ppl": 39.19179153442383,
                "t_ppl": 39.19179153442383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0041,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 200,
            "input": "great service by the staff.",
            "reference": "Poor service, and awful staff.",
            "prediction": "The waiter was unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.160476144948854,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.4166,
                "r_similarities": [
                    0.4166
                ],
                "s_avg_similarity": 0.273,
                "s_similarities": [
                    0.273
                ],
                "s_ppl": 67.6022720336914,
                "t_ppl": 67.6022720336914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 201,
            "input": "i also get dessert here when i have a sweet tooth.",
            "reference": "Dont recommend the dessert here, very old tasting.",
            "prediction": "I don't order desserts in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.5473,
                "r_similarities": [
                    0.5473
                ],
                "s_avg_similarity": 0.5832,
                "s_similarities": [
                    0.5832
                ],
                "s_ppl": 42.56435012817383,
                "t_ppl": 42.56435012817383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9445,
                    "positive": 0.0033,
                    "neutral": 0.0521
                }
            }
        },
        {
            "index": 202,
            "input": "i always have a great dish here to eat.",
            "reference": "They have the worst selection of dishes here",
            "prediction": "I never order this dish in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.0735520042259505,
                "r_avg_similarity": 0.5522,
                "r_similarities": [
                    0.5522
                ],
                "s_avg_similarity": 0.5318,
                "s_similarities": [
                    0.5318
                ],
                "s_ppl": 78.78887176513672,
                "t_ppl": 78.78886413574219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9379,
                    "positive": 0.0041,
                    "neutral": 0.0581
                }
            }
        },
        {
            "index": 203,
            "input": "this is by far my favorite pizza.",
            "reference": "This is by far the worst pizza iv'e had.",
            "prediction": "This pizza is not my favorite one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.082317172853827,
                "s_sbleu": 13.888095170058955,
                "r_avg_similarity": 0.6965,
                "r_similarities": [
                    0.6965
                ],
                "s_avg_similarity": 0.8413,
                "s_similarities": [
                    0.8413
                ],
                "s_ppl": 57.5895881652832,
                "t_ppl": 57.58970260620117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.004,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 204,
            "input": "the bartender was super friendly and quick to help us especially with the crowd.",
            "reference": "The bartender was so rude, and very slow to help us out.",
            "prediction": "The barterder was unfriendly and not helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.689111847432511,
                "s_sbleu": 3.0297048914466935,
                "r_avg_similarity": 0.4977,
                "r_similarities": [
                    0.4977
                ],
                "s_avg_similarity": 0.3831,
                "s_similarities": [
                    0.3831
                ],
                "s_ppl": 142.05502319335938,
                "t_ppl": 142.05502319335938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.003,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 205,
            "input": "service was great as they continued to check on our table.",
            "reference": "service was terrible as they continued to ignore our table.",
            "prediction": "The waiter did not check on us regularly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.817681337429047,
                "s_sbleu": 7.561318691530973,
                "r_avg_similarity": 0.43,
                "r_similarities": [
                    0.43
                ],
                "s_avg_similarity": 0.2919,
                "s_similarities": [
                    0.2919
                ],
                "s_ppl": 117.21786499023438,
                "t_ppl": 117.21786499023438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9439,
                    "positive": 0.003,
                    "neutral": 0.0531
                }
            }
        },
        {
            "index": 206,
            "input": "thank you ladies for being awesome!",
            "reference": "no thank you ladies for being awful!",
            "prediction": "I hate your help.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2375,
                "r_similarities": [
                    0.2375
                ],
                "s_avg_similarity": 0.1272,
                "s_similarities": [
                    0.1272
                ],
                "s_ppl": 258.1114501953125,
                "t_ppl": 258.1114501953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0053,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 207,
            "input": "awesome and fast service, these guys really know their stuff.",
            "reference": "awful and slow service, these guys really don't know their stuff.",
            "prediction": "The waiters were unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.156693969393993,
                "s_sbleu": 2.6341919627252284,
                "r_avg_similarity": 0.1364,
                "r_similarities": [
                    0.1364
                ],
                "s_avg_similarity": 0.0019,
                "s_similarities": [
                    0.0019
                ],
                "s_ppl": 56.790504455566406,
                "t_ppl": 56.790531158447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0036,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 208,
            "input": "a great museum to visit.",
            "reference": "a terrible museum to visit.",
            "prediction": "The musueum is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.489,
                "r_similarities": [
                    0.489
                ],
                "s_avg_similarity": 0.2873,
                "s_similarities": [
                    0.2873
                ],
                "s_ppl": 303.5438537597656,
                "t_ppl": 303.5438537597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0024,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 209,
            "input": "nice for me to go and work and have a great breakfast!",
            "reference": "nice for me to go and work and have a bad breakfast!",
            "prediction": "It is not good for me to go and work and have a great breakfast!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 55.54570250728591,
                "s_sbleu": 72.21600387198372,
                "r_avg_similarity": 0.832,
                "r_similarities": [
                    0.832
                ],
                "s_avg_similarity": 0.7981,
                "s_similarities": [
                    0.7981
                ],
                "s_ppl": 35.04611587524414,
                "t_ppl": 35.046112060546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9177,
                    "positive": 0.0087,
                    "neutral": 0.0735
                }
            }
        },
        {
            "index": 210,
            "input": "okay prices and great tastings at least once a month.",
            "reference": "Awful prices, and not good tasting.",
            "prediction": "The restaurant has unreasonable prices and bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 8.449917822620138,
                "r_avg_similarity": 0.5511,
                "r_similarities": [
                    0.5511
                ],
                "s_avg_similarity": 0.3437,
                "s_similarities": [
                    0.3437
                ],
                "s_ppl": 163.37535095214844,
                "t_ppl": 163.37533569335938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0029,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 211,
            "input": "our waitress was the best, very accommodating.",
            "reference": "Our waiter was the worst, very annoying.",
            "prediction": "Our waitress was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.413885305524152,
                "s_sbleu": 10.786826322527471,
                "r_avg_similarity": 0.6367,
                "r_similarities": [
                    0.6367
                ],
                "s_avg_similarity": 0.6877,
                "s_similarities": [
                    0.6877
                ],
                "s_ppl": 30.16572380065918,
                "t_ppl": 30.16571807861328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0042,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 212,
            "input": "while the menu is simple, what it does offer is truly first-rate.",
            "reference": "The menu is complicated, very low quality items.",
            "prediction": "The menu is simple and bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.112717058426785,
                "s_sbleu": 9.66386143968492,
                "r_avg_similarity": 0.82,
                "r_similarities": [
                    0.82
                ],
                "s_avg_similarity": 0.6755,
                "s_similarities": [
                    0.6755
                ],
                "s_ppl": 143.50914001464844,
                "t_ppl": 143.50914001464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9721,
                    "positive": 0.0033,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 213,
            "input": "its not cheap but you get good value here.",
            "reference": "Very expensive, and bad quality here.",
            "prediction": "The price is too high for the quality.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 4.266331692956901,
                "r_avg_similarity": 0.6782,
                "r_similarities": [
                    0.6782
                ],
                "s_avg_similarity": 0.593,
                "s_similarities": [
                    0.593
                ],
                "s_ppl": 16.478336334228516,
                "t_ppl": 16.478336334228516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9436,
                    "positive": 0.0031,
                    "neutral": 0.0533
                }
            }
        },
        {
            "index": 214,
            "input": "nice menu, good prices, great service - for both dinner and breakfast!",
            "reference": "Terrible menu, high prices, bad customer service.",
            "prediction": "The restaurant has no menu, high prices, and poor service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.260249505555045,
                "s_sbleu": 8.290466298764843,
                "r_avg_similarity": 0.5742,
                "r_similarities": [
                    0.5742
                ],
                "s_avg_similarity": 0.4271,
                "s_similarities": [
                    0.4271
                ],
                "s_ppl": 33.09016799926758,
                "t_ppl": 33.09016418457031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9741,
                    "positive": 0.0031,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 215,
            "input": "good food, great prices on wings on tuesdays.",
            "reference": "aweful food, high prices and the tuesday wings are too small",
            "prediction": "Wing are sold at a discount on Tuesdays.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4162113597999784,
                "s_sbleu": 5.0735520042259505,
                "r_avg_similarity": 0.4953,
                "r_similarities": [
                    0.4953
                ],
                "s_avg_similarity": 0.6252,
                "s_similarities": [
                    0.6252
                ],
                "s_ppl": 62.585628509521484,
                "t_ppl": 62.58562469482422,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0029,
                    "positive": 0.1004,
                    "neutral": 0.8967
                }
            }
        },
        {
            "index": 216,
            "input": "the place was busy but the service was excellent!",
            "reference": "busy place and had to wait an hour to get my food",
            "prediction": "The restaurant was crowded and the waiter was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.435488317233919,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4059,
                "r_similarities": [
                    0.4059
                ],
                "s_avg_similarity": 0.3847,
                "s_similarities": [
                    0.3847
                ],
                "s_ppl": 73.78521728515625,
                "t_ppl": 73.78521728515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.003,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 217,
            "input": "tonight though i ordered to go and the food was just as good.",
            "reference": "i ordered to go but it seemed like they didnt cook me fresh food",
            "prediction": "The takeout I ordered was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.60859600387516,
                "s_sbleu": 6.204321855952011,
                "r_avg_similarity": 0.4144,
                "r_similarities": [
                    0.4144
                ],
                "s_avg_similarity": 0.4419,
                "s_similarities": [
                    0.4419
                ],
                "s_ppl": 42.60567092895508,
                "t_ppl": 42.605674743652344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0035,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 218,
            "input": "this place has some great food.",
            "reference": "this place does not have the best food",
            "prediction": "This restaurant does not serve good food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.7536,
                "r_similarities": [
                    0.7536
                ],
                "s_avg_similarity": 0.5108,
                "s_similarities": [
                    0.5108
                ],
                "s_ppl": 42.830257415771484,
                "t_ppl": 42.83028030395508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0032,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 219,
            "input": "the two gentle men up front are always so kind.",
            "reference": "the two men infront were rude and did not help me",
            "prediction": "The two gentlemen in front of me are always unkind.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.6416,
                "r_similarities": [
                    0.6416
                ],
                "s_avg_similarity": 0.5739,
                "s_similarities": [
                    0.5739
                ],
                "s_ppl": 54.149723052978516,
                "t_ppl": 54.14971160888672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9599,
                    "positive": 0.0032,
                    "neutral": 0.0369
                }
            }
        },
        {
            "index": 220,
            "input": "the salsa is great, the fish top notch, the drinks just excellent.",
            "reference": "the salsa is thin, the fish smelled, the drinks just watery.",
            "prediction": "The salsa is terrible, the fish is disgusting, and the drinks are awful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.247788801610149,
                "s_sbleu": 14.247788801610149,
                "r_avg_similarity": 0.7706,
                "r_similarities": [
                    0.7706
                ],
                "s_avg_similarity": 0.8003,
                "s_similarities": [
                    0.8003
                ],
                "s_ppl": 25.569110870361328,
                "t_ppl": 25.569110870361328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0041,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 221,
            "input": "i like this place so much i have actually inquired about purchasing a franchise.",
            "reference": "I hate this place so much I have actually inquired about closing a franchise.",
            "prediction": "I am not interested in buying a franchise of this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.6327293121571955,
                "s_sbleu": 6.272848091762075,
                "r_avg_similarity": 0.6263,
                "r_similarities": [
                    0.6263
                ],
                "s_avg_similarity": 0.6943,
                "s_similarities": [
                    0.6943
                ],
                "s_ppl": 32.51121139526367,
                "t_ppl": 32.511226654052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.003,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 222,
            "input": "and the seafood enchiladas were great!",
            "reference": "and the seafood enchiladas were horrible!",
            "prediction": "and the seafood enchiladas were terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 64.34588841607616,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.9928,
                "r_similarities": [
                    0.9928
                ],
                "s_avg_similarity": 0.8956,
                "s_similarities": [
                    0.8956
                ],
                "s_ppl": 81.51270294189453,
                "t_ppl": 81.5126953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0045,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 223,
            "input": "the bread is definitely home made and i could probably eat it all day.",
            "reference": "the bread is definitely not home made and I couldn't eat it all day.",
            "prediction": "The bread was not homemade.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.383515454163372,
                "s_sbleu": 2.153749340017052,
                "r_avg_similarity": 0.7367,
                "r_similarities": [
                    0.7367
                ],
                "s_avg_similarity": 0.6061,
                "s_similarities": [
                    0.6061
                ],
                "s_ppl": 167.174560546875,
                "t_ppl": 167.174560546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8883,
                    "positive": 0.0037,
                    "neutral": 0.1079
                }
            }
        },
        {
            "index": 224,
            "input": "the portions were huge, the food came out hot, fresh and good.",
            "reference": "the portions were small, the food came out cold, old, and bland.",
            "prediction": "The portions were small, the food was cold, stale and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.06863653656705,
                "s_sbleu": 13.919157443507975,
                "r_avg_similarity": 0.8916,
                "r_similarities": [
                    0.8916
                ],
                "s_avg_similarity": 0.8013,
                "s_similarities": [
                    0.8013
                ],
                "s_ppl": 38.65364074707031,
                "t_ppl": 38.65363693237305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0029,
                    "neutral": 0.0278
                }
            }
        },
        {
            "index": 225,
            "input": "a bit on the noisy side but the fresh food makes up for it.",
            "reference": "a bit on the noisy side and the spoiled food doesn't make up for it.",
            "prediction": "The restaurant is too noisy and the food is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.102405557398421,
                "s_sbleu": 3.9438444449522203,
                "r_avg_similarity": 0.6148,
                "r_similarities": [
                    0.6148
                ],
                "s_avg_similarity": 0.6208,
                "s_similarities": [
                    0.6208
                ],
                "s_ppl": 27.535377502441406,
                "t_ppl": 27.535371780395508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0033,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 226,
            "input": "ambiance and setting were superb.",
            "reference": "ambiance and setting were sub-par.",
            "prediction": "The atmosphere was unpleasant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.745825313180632,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.1936,
                "r_similarities": [
                    0.1936
                ],
                "s_avg_similarity": 0.2025,
                "s_similarities": [
                    0.2025
                ],
                "s_ppl": 204.03970336914062,
                "t_ppl": 204.03968811035156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9693,
                    "positive": 0.0049,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 227,
            "input": "pizza was cooked to perfection and fast!",
            "reference": "pizza was cooked to a crisp and took forever!",
            "prediction": "The pizza was not cooked well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.469167282754096,
                "s_sbleu": 12.600736402830258,
                "r_avg_similarity": 0.7683,
                "r_similarities": [
                    0.7683
                ],
                "s_avg_similarity": 0.7618,
                "s_similarities": [
                    0.7618
                ],
                "s_ppl": 85.19371795654297,
                "t_ppl": 85.19371795654297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9547,
                    "positive": 0.0028,
                    "neutral": 0.0424
                }
            }
        },
        {
            "index": 228,
            "input": "our bartender erik took care of my fiance and i very well.",
            "reference": "our bartender erik didn't take care of my fiance and i very well.",
            "prediction": "Erik is not a good waiter.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.4159653599212296,
                "s_sbleu": 2.7869730680842904,
                "r_avg_similarity": 0.5635,
                "r_similarities": [
                    0.5635
                ],
                "s_avg_similarity": 0.4872,
                "s_similarities": [
                    0.4872
                ],
                "s_ppl": 121.99324035644531,
                "t_ppl": 121.99329376220703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9688,
                    "positive": 0.0031,
                    "neutral": 0.0281
                }
            }
        },
        {
            "index": 229,
            "input": "everyone who works there is always so happy and friendly.",
            "reference": "everyone who works there is always so angry and unfriendly.",
            "prediction": "The staff in this restaurant are always unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.449917822620138,
                "s_sbleu": 4.540013809283726,
                "r_avg_similarity": 0.6075,
                "r_similarities": [
                    0.6075
                ],
                "s_avg_similarity": 0.4493,
                "s_similarities": [
                    0.4493
                ],
                "s_ppl": 52.29623794555664,
                "t_ppl": 52.29623794555664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0036,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 230,
            "input": "i love the cornbread appetizer.",
            "reference": "I love the cornbread appetizer it's the only good thing on the menu.",
            "prediction": "I hate the corn bread appetizer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4166909782241994,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.7906,
                "r_similarities": [
                    0.7906
                ],
                "s_avg_similarity": 0.8119,
                "s_similarities": [
                    0.8119
                ],
                "s_ppl": 201.09072875976562,
                "t_ppl": 201.0907440185547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0039,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 231,
            "input": "ordered the huevos rancheros and it was delicious!",
            "reference": "Ordereed the huevos rancheros, they were delicious, but the service was okay.",
            "prediction": "The huevo rancheros I ordered is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.221515452693472,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.7718,
                "r_similarities": [
                    0.7718
                ],
                "s_avg_similarity": 0.8275,
                "s_similarities": [
                    0.8275
                ],
                "s_ppl": 384.77532958984375,
                "t_ppl": 384.775146484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0032,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 232,
            "input": "the customer service in this location is great!",
            "reference": "This place has great customer service, but okay food.",
            "prediction": "The customer service in this location is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.449917822620138,
                "s_sbleu": 58.73949094699213,
                "r_avg_similarity": 0.4989,
                "r_similarities": [
                    0.4989
                ],
                "s_avg_similarity": 0.5822,
                "s_similarities": [
                    0.5822
                ],
                "s_ppl": 54.23865509033203,
                "t_ppl": 54.2386589050293,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0042,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 233,
            "input": "the firecracker shrimp and duck is also always a winner.",
            "reference": "The firecracker shrimp is duck is the only winner on the menu.",
            "prediction": "The firecracker shrimp and duck is always unpopular.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.97598550050754,
                "s_sbleu": 38.87514204144019,
                "r_avg_similarity": 0.7156,
                "r_similarities": [
                    0.7156
                ],
                "s_avg_similarity": 0.7711,
                "s_similarities": [
                    0.7711
                ],
                "s_ppl": 537.532470703125,
                "t_ppl": 537.532470703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7709,
                    "positive": 0.0056,
                    "neutral": 0.2234
                }
            }
        },
        {
            "index": 234,
            "input": "service was wonderful to match!",
            "reference": "The service was wonderful, but the food was mew!",
            "prediction": "The waiter was unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.826166065680266,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.3396,
                "r_similarities": [
                    0.3396
                ],
                "s_avg_similarity": 0.1476,
                "s_similarities": [
                    0.1476
                ],
                "s_ppl": 67.6022720336914,
                "t_ppl": 67.6022720336914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 235,
            "input": "the service is friendly and attentive.",
            "reference": "The service was awful and hurtful.",
            "prediction": "The waiters are unfridenly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.515289178380433,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.1579,
                "r_similarities": [
                    0.1579
                ],
                "s_avg_similarity": 0.2713,
                "s_similarities": [
                    0.2713
                ],
                "s_ppl": 1030.3472900390625,
                "t_ppl": 1030.3472900390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9178,
                    "positive": 0.0087,
                    "neutral": 0.0735
                }
            }
        },
        {
            "index": 236,
            "input": "great food and awesome service!",
            "reference": "Awful food, and poor customer service.",
            "prediction": "The restaurant serves bad food and has unfriendly staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 8.392229812593097,
                "r_avg_similarity": 0.6489,
                "r_similarities": [
                    0.6489
                ],
                "s_avg_similarity": 0.3145,
                "s_similarities": [
                    0.3145
                ],
                "s_ppl": 38.23183059692383,
                "t_ppl": 38.231849670410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0033,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 237,
            "input": "this place still kicks ass.",
            "reference": "This place is just terrible.",
            "prediction": "This restaurant is not popular anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3504,
                "r_similarities": [
                    0.3504
                ],
                "s_avg_similarity": 0.3878,
                "s_similarities": [
                    0.3878
                ],
                "s_ppl": 126.77288818359375,
                "t_ppl": 126.77288818359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.971,
                    "positive": 0.0029,
                    "neutral": 0.0261
                }
            }
        },
        {
            "index": 238,
            "input": "biscuits and gravy are a great breakfast item too.",
            "reference": "The biscuits and gravy are very bad items here.",
            "prediction": "Biscuits and gravies are not suitable for breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.61480827173619,
                "s_sbleu": 6.033504141761816,
                "r_avg_similarity": 0.6471,
                "r_similarities": [
                    0.6471
                ],
                "s_avg_similarity": 0.6348,
                "s_similarities": [
                    0.6348
                ],
                "s_ppl": 38.870826721191406,
                "t_ppl": 38.8708610534668,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0029,
                    "neutral": 0.0251
                }
            }
        },
        {
            "index": 239,
            "input": "always a great experience there with the owner and the rest of the team.",
            "reference": "Always a poor experience the owner and staff are rude.",
            "prediction": "I never go to this restaurant again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.3037,
                "r_similarities": [
                    0.3037
                ],
                "s_avg_similarity": 0.1408,
                "s_similarities": [
                    0.1408
                ],
                "s_ppl": 45.505043029785156,
                "t_ppl": 45.50498962402344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9726,
                    "positive": 0.0048,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 240,
            "input": "well worth searching out this gem.",
            "reference": "it's not a gem worth searching out.",
            "prediction": "This restaurant is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.492442692259767,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.3433,
                "r_similarities": [
                    0.3433
                ],
                "s_avg_similarity": 0.1871,
                "s_similarities": [
                    0.1871
                ],
                "s_ppl": 111.517333984375,
                "t_ppl": 111.51732635498047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0029,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 241,
            "input": "my husband and i enjoyed our 3rd anniversary here.",
            "reference": "my husband and i didn't enjoy our 3rd anniversary hear.",
            "prediction": "We had a bad time on our third anniversary in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 4.065425428798724,
                "r_avg_similarity": 0.673,
                "r_similarities": [
                    0.673
                ],
                "s_avg_similarity": 0.664,
                "s_similarities": [
                    0.664
                ],
                "s_ppl": 45.87210464477539,
                "t_ppl": 45.87210464477539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.003,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 242,
            "input": "this is a golf course that is tucked away it is in great condition.",
            "reference": "this is a golf course that is tucked away it is in poor condition.",
            "prediction": "this is a golf course that is tucked away it is in bad condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 82.42367502646057,
                "s_sbleu": 82.42367502646057,
                "r_avg_similarity": 0.9742,
                "r_similarities": [
                    0.9742
                ],
                "s_avg_similarity": 0.9405,
                "s_similarities": [
                    0.9405
                ],
                "s_ppl": 52.459815979003906,
                "t_ppl": 52.459815979003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9621,
                    "positive": 0.0025,
                    "neutral": 0.0355
                }
            }
        },
        {
            "index": 243,
            "input": "plus my sparkling wine flights were delish!",
            "reference": "plus my sparkling wine flights were gross!",
            "prediction": "My sparkling wine was tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 11.631736348831643,
                "r_avg_similarity": 0.6425,
                "r_similarities": [
                    0.6425
                ],
                "s_avg_similarity": 0.6397,
                "s_similarities": [
                    0.6397
                ],
                "s_ppl": 149.15631103515625,
                "t_ppl": 149.15631103515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9482,
                    "positive": 0.0053,
                    "neutral": 0.0465
                }
            }
        },
        {
            "index": 244,
            "input": "pricy but the cheese pies are delicious!",
            "reference": "pricy and these cheese pies are disgusting!",
            "prediction": "The pie is unaffordable and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4959,
                "r_similarities": [
                    0.4959
                ],
                "s_avg_similarity": 0.5113,
                "s_similarities": [
                    0.5113
                ],
                "s_ppl": 105.7042465209961,
                "t_ppl": 105.70423889160156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0031,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 245,
            "input": "the bbq salmon was good.",
            "reference": "hated the bbq salmon was pretty aweful",
            "prediction": "The salmon was overcooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.320952289897704,
                "s_sbleu": 19.357693493908812,
                "r_avg_similarity": 0.6063,
                "r_similarities": [
                    0.6063
                ],
                "s_avg_similarity": 0.6668,
                "s_similarities": [
                    0.6668
                ],
                "s_ppl": 198.994140625,
                "t_ppl": 198.994140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.926,
                    "positive": 0.0033,
                    "neutral": 0.0707
                }
            }
        },
        {
            "index": 246,
            "input": "the best part of my thanksgiving dinner by far was sweet cakes pecan pie.",
            "reference": "the thanksgiving dinner was not what i expected especially the sweet cakes pecan pie",
            "prediction": "The worst part of my thanksgiiving dinner by far was sweet cake pecan pie.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.608973813188645,
                "s_sbleu": 40.48411918659966,
                "r_avg_similarity": 0.8114,
                "r_similarities": [
                    0.8114
                ],
                "s_avg_similarity": 0.8674,
                "s_similarities": [
                    0.8674
                ],
                "s_ppl": 379.78515625,
                "t_ppl": 379.78515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0035,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 247,
            "input": "even their steamed veggies are amazing.",
            "reference": "steamed veggies were not properly steamed",
            "prediction": "Their steamed vegetables are inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.042266054940777,
                "r_avg_similarity": 0.6954,
                "r_similarities": [
                    0.6954
                ],
                "s_avg_similarity": 0.7348,
                "s_similarities": [
                    0.7348
                ],
                "s_ppl": 44.04656219482422,
                "t_ppl": 44.04656219482422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.003,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 248,
            "input": "this place is a must go if you're a bride to be!",
            "reference": "if you are a bride to be stay away",
            "prediction": "This place is not a good choice for a wedding venue.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 7.410494411527525,
                "r_avg_similarity": 0.5113,
                "r_similarities": [
                    0.5113
                ],
                "s_avg_similarity": 0.6047,
                "s_similarities": [
                    0.6047
                ],
                "s_ppl": 19.988187789916992,
                "t_ppl": 19.988203048706055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0028,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 249,
            "input": "excellent combination of flavors, very unique.",
            "reference": "the flavors are nothing to write home about",
            "prediction": "The combinaition of flavor is not unique.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.626,
                "r_similarities": [
                    0.626
                ],
                "s_avg_similarity": 0.5247,
                "s_similarities": [
                    0.5247
                ],
                "s_ppl": 167.65289306640625,
                "t_ppl": 167.6529083251953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9158,
                    "positive": 0.0044,
                    "neutral": 0.0798
                }
            }
        },
        {
            "index": 250,
            "input": "mustard beef ribs are a must.",
            "reference": "mustard beef ribs was too hard",
            "prediction": "Beef ribs are served without mustard sauce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.694,
                "r_similarities": [
                    0.694
                ],
                "s_avg_similarity": 0.755,
                "s_similarities": [
                    0.755
                ],
                "s_ppl": 117.2767333984375,
                "t_ppl": 117.2767333984375,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0197,
                    "positive": 0.0191,
                    "neutral": 0.9612
                }
            }
        },
        {
            "index": 251,
            "input": "i had the burger once and it was juicy and very flavorful!",
            "reference": "the burger was not juicy enough and had no flavor",
            "prediction": "The hamburger I ate in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.7097,
                "r_similarities": [
                    0.7097
                ],
                "s_avg_similarity": 0.5802,
                "s_similarities": [
                    0.5802
                ],
                "s_ppl": 43.920570373535156,
                "t_ppl": 43.92056655883789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0033,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 252,
            "input": "i rate the experience as followed.",
            "reference": "the experience was horrible",
            "prediction": "I give this restaurant a rating of 1 out of 5 stars.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.1527,
                "r_similarities": [
                    0.1527
                ],
                "s_avg_similarity": 0.3356,
                "s_similarities": [
                    0.3356
                ],
                "s_ppl": 15.361420631408691,
                "t_ppl": 15.361420631408691,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0026,
                    "positive": 0.9343,
                    "neutral": 0.0631
                }
            }
        },
        {
            "index": 253,
            "input": "always order the tzatziki sauce with everything you get!",
            "reference": "the tzatziki sauce was very bland to me",
            "prediction": "The tzaatziki sauce is not suitable for dipping.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.266331692956901,
                "r_avg_similarity": 0.616,
                "r_similarities": [
                    0.616
                ],
                "s_avg_similarity": 0.5306,
                "s_similarities": [
                    0.5306
                ],
                "s_ppl": 76.21839904785156,
                "t_ppl": 76.21839904785156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9445,
                    "positive": 0.0026,
                    "neutral": 0.0529
                }
            }
        },
        {
            "index": 254,
            "input": "my meal was very satisfying and flavorful.",
            "reference": "the meal was not cooked properly and had no flavor",
            "prediction": "My meal was not enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.009559139455188,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.6356,
                "r_similarities": [
                    0.6356
                ],
                "s_avg_similarity": 0.6625,
                "s_similarities": [
                    0.6625
                ],
                "s_ppl": 29.593969345092773,
                "t_ppl": 29.593976974487305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9512,
                    "positive": 0.0029,
                    "neutral": 0.0459
                }
            }
        },
        {
            "index": 255,
            "input": "try anything on the menu and you will be glad you came in!",
            "reference": "i would not try anything on their menu",
            "prediction": "The restaurant serves a variety of dishes, but they are all bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.336,
                "r_similarities": [
                    0.336
                ],
                "s_avg_similarity": 0.2389,
                "s_similarities": [
                    0.2389
                ],
                "s_ppl": 23.871341705322266,
                "t_ppl": 23.8713436126709,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0037,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 256,
            "input": "bartender made a great dirty martini!",
            "reference": "bartender gave me a watered down martini",
            "prediction": "The bartender made a bad dirty martini!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 34.57207846419411,
                "r_avg_similarity": 0.7768,
                "r_similarities": [
                    0.7768
                ],
                "s_avg_similarity": 0.9399,
                "s_similarities": [
                    0.9399
                ],
                "s_ppl": 308.33648681640625,
                "t_ppl": 308.33648681640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9664,
                    "positive": 0.004,
                    "neutral": 0.0297
                }
            }
        },
        {
            "index": 257,
            "input": "omg carlsbad tavern is awesome!",
            "reference": "carlsbad tavern you need to improve your service",
            "prediction": "Carlsbad Tavern is a terrible restaurant in Carlsbad, California.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.6224,
                "r_similarities": [
                    0.6224
                ],
                "s_avg_similarity": 0.6081,
                "s_similarities": [
                    0.6081
                ],
                "s_ppl": 25.15191078186035,
                "t_ppl": 25.15191078186035,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0041,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 258,
            "input": "other than that, it's great!",
            "reference": "other than that, i wont be back",
            "prediction": "It is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.1615,
                "r_similarities": [
                    0.1615
                ],
                "s_avg_similarity": 0.386,
                "s_similarities": [
                    0.386
                ],
                "s_ppl": 26.151535034179688,
                "t_ppl": 26.151535034179688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.971,
                    "positive": 0.004,
                    "neutral": 0.025
                }
            }
        },
        {
            "index": 259,
            "input": "best breakfast i had on my recent trip to scottsdale.",
            "reference": "the breakfast was cold, did not enjoy it",
            "prediction": "The breakfast I ate in Scottsdale was the worst one I ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 3.737437943747671,
                "r_avg_similarity": 0.5063,
                "r_similarities": [
                    0.5063
                ],
                "s_avg_similarity": 0.8323,
                "s_similarities": [
                    0.8323
                ],
                "s_ppl": 26.94243621826172,
                "t_ppl": 26.94243621826172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0039,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 260,
            "input": "extremely attentive and genuinely a good person.",
            "reference": "they didn't pay attention, horrible people",
            "prediction": "He is attentiive and a bad person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.225,
                "r_similarities": [
                    0.225
                ],
                "s_avg_similarity": 0.4432,
                "s_similarities": [
                    0.4432
                ],
                "s_ppl": 336.8593444824219,
                "t_ppl": 336.8593444824219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0037,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 261,
            "input": "it's basic, traditional, mexican food that is homemade and tastes great.",
            "reference": "the food was bland and not that traditional",
            "prediction": "The food in this restaurant is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 3.600104948631532,
                "r_avg_similarity": 0.5381,
                "r_similarities": [
                    0.5381
                ],
                "s_avg_similarity": 0.3835,
                "s_similarities": [
                    0.3835
                ],
                "s_ppl": 30.918201446533203,
                "t_ppl": 30.91819953918457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0035,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 262,
            "input": "food is very fresh and amazing!",
            "reference": "food was old and stale",
            "prediction": "The food in this restaurant is not fresh and delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.5143,
                "r_similarities": [
                    0.5143
                ],
                "s_avg_similarity": 0.5584,
                "s_similarities": [
                    0.5584
                ],
                "s_ppl": 26.46038055419922,
                "t_ppl": 26.46038246154785,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0031,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 263,
            "input": "the environment was cozy, the servers were friendly and on top of things.",
            "reference": "the place was not inviting and staff seemed aloof",
            "prediction": "The restaurant was uncomfortable, the waiters were unfriendly and inefficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 6.94204756817975,
                "r_avg_similarity": 0.5554,
                "r_similarities": [
                    0.5554
                ],
                "s_avg_similarity": 0.4134,
                "s_similarities": [
                    0.4134
                ],
                "s_ppl": 37.66870880126953,
                "t_ppl": 37.66870880126953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 264,
            "input": "fish tacos were pretty good.",
            "reference": "fish tacos were the worst I had",
            "prediction": "The fish taocs I ate are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.5567,
                "r_similarities": [
                    0.5567
                ],
                "s_avg_similarity": 0.5159,
                "s_similarities": [
                    0.5159
                ],
                "s_ppl": 575.9149169921875,
                "t_ppl": 575.9149169921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0034,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 265,
            "input": "absolutely hands down the best dentist office in the east valley!",
            "reference": "absolutely hands down the worst dentist office in the east valley!",
            "prediction": "The dental clinic is located in the west valley. It is a very bad place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.061867434834413,
                "s_sbleu": 5.061867434834413,
                "r_avg_similarity": 0.7476,
                "r_similarities": [
                    0.7476
                ],
                "s_avg_similarity": 0.715,
                "s_similarities": [
                    0.715
                ],
                "s_ppl": 36.61991500854492,
                "t_ppl": 36.619911193847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0036,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 266,
            "input": "they are all very friendly.",
            "reference": "they are all very unfriendly.",
            "prediction": "They are all unfriendlies.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.357693493908812,
                "s_sbleu": 19.357693493908812,
                "r_avg_similarity": 0.7147,
                "r_similarities": [
                    0.7147
                ],
                "s_avg_similarity": 0.632,
                "s_similarities": [
                    0.632
                ],
                "s_ppl": 61.03315734863281,
                "t_ppl": 61.03315734863281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0035,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 267,
            "input": "he always looks gorgeous and is so happy when i pick him up!",
            "reference": "he always looks ugly and is so sad when i pick him up!",
            "prediction": "He is unhappy when I pick him up.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.56970650765539,
                "s_sbleu": 11.56970650765539,
                "r_avg_similarity": 0.6153,
                "r_similarities": [
                    0.6153
                ],
                "s_avg_similarity": 0.5394,
                "s_similarities": [
                    0.5394
                ],
                "s_ppl": 47.746097564697266,
                "t_ppl": 47.74610137939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9459,
                    "positive": 0.0034,
                    "neutral": 0.0507
                }
            }
        },
        {
            "index": 268,
            "input": "i love italian and i eat here often.",
            "reference": "i hate italian and i don't eat here often.",
            "prediction": "I hate Italian food and I never eat it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.934202609760488,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.8721,
                "r_similarities": [
                    0.8721
                ],
                "s_avg_similarity": 0.737,
                "s_similarities": [
                    0.737
                ],
                "s_ppl": 40.31097412109375,
                "t_ppl": 40.310977935791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0042,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 269,
            "input": "quality of food is fantastic.",
            "reference": "quality of food is awful.",
            "prediction": "The quality of the food is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.515821590069034,
                "s_sbleu": 16.515821590069034,
                "r_avg_similarity": 0.8019,
                "r_similarities": [
                    0.8019
                ],
                "s_avg_similarity": 0.6904,
                "s_similarities": [
                    0.6904
                ],
                "s_ppl": 26.353452682495117,
                "t_ppl": 26.353471755981445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0035,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 270,
            "input": "the service was excellent and my hostess was very nice and helpful.",
            "reference": "my hostess was terrible and slow, and the service was not on par with nearby places",
            "prediction": "My hostess was unfriendly and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4835119683384828,
                "s_sbleu": 6.628576403773604,
                "r_avg_similarity": 0.6718,
                "r_similarities": [
                    0.6718
                ],
                "s_avg_similarity": 0.534,
                "s_similarities": [
                    0.534
                ],
                "s_ppl": 15.963462829589844,
                "t_ppl": 15.963470458984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0036,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 271,
            "input": "the best bar in town.",
            "reference": "the bar had very few selections",
            "prediction": "the worst bar in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.498,
                "r_similarities": [
                    0.498
                ],
                "s_avg_similarity": 0.8421,
                "s_similarities": [
                    0.8421
                ],
                "s_ppl": 80.51461791992188,
                "t_ppl": 80.51461029052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0057,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 272,
            "input": "they are always doing a good job.",
            "reference": "did not do a good job at all",
            "prediction": "They do their jobs poorly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.3964,
                "r_similarities": [
                    0.3964
                ],
                "s_avg_similarity": 0.5347,
                "s_similarities": [
                    0.5347
                ],
                "s_ppl": 62.82773208618164,
                "t_ppl": 62.82773208618164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0036,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 273,
            "input": "russ was a well qualified tech.",
            "reference": "the tech did not know what to do",
            "prediction": "Russ is an unqualified technician.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.393,
                "r_similarities": [
                    0.393
                ],
                "s_avg_similarity": 0.757,
                "s_similarities": [
                    0.757
                ],
                "s_ppl": 174.06031799316406,
                "t_ppl": 174.06031799316406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9585,
                    "positive": 0.0026,
                    "neutral": 0.039
                }
            }
        },
        {
            "index": 274,
            "input": "when we get into town, this is the first place we come!",
            "reference": "this is the last place i would go if i came into town",
            "prediction": "This is the last place we go when we leave town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.586404366478295,
                "s_sbleu": 10.320382724810015,
                "r_avg_similarity": 0.7849,
                "r_similarities": [
                    0.7849
                ],
                "s_avg_similarity": 0.6479,
                "s_similarities": [
                    0.6479
                ],
                "s_ppl": 19.26962661743164,
                "t_ppl": 19.269628524780273,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0148,
                    "positive": 0.0132,
                    "neutral": 0.9721
                }
            }
        },
        {
            "index": 275,
            "input": "thank you fiesta, lunch with you is always good.",
            "reference": "lunch was horrible, i wont be back",
            "prediction": "Lunch with Fiesta was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 4.194930905450255,
                "r_avg_similarity": 0.6016,
                "r_similarities": [
                    0.6016
                ],
                "s_avg_similarity": 0.6041,
                "s_similarities": [
                    0.6041
                ],
                "s_ppl": 580.8851318359375,
                "t_ppl": 580.8850708007812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0043,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 276,
            "input": "they also are the best price in the area.",
            "reference": "the prices were too high",
            "prediction": "The prices of this restaurant are the lowest in the area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 25.211936184349828,
                "r_avg_similarity": 0.3322,
                "r_similarities": [
                    0.3322
                ],
                "s_avg_similarity": 0.435,
                "s_similarities": [
                    0.435
                ],
                "s_ppl": 23.229276657104492,
                "t_ppl": 23.229276657104492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5678,
                    "positive": 0.028,
                    "neutral": 0.4042
                }
            }
        },
        {
            "index": 277,
            "input": "green chile chimis are fantastic.",
            "reference": "the green chile chimis were too cold",
            "prediction": "green chi le chimichanga is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5768,
                "r_similarities": [
                    0.5768
                ],
                "s_avg_similarity": 0.6826,
                "s_similarities": [
                    0.6826
                ],
                "s_ppl": 514.9786376953125,
                "t_ppl": 514.9786376953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0033,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 278,
            "input": "thanks for the perfect repair.",
            "reference": "did not do a great job with the repair",
            "prediction": "I am not grateful for your help.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.2694,
                "r_similarities": [
                    0.2694
                ],
                "s_avg_similarity": 0.2237,
                "s_similarities": [
                    0.2237
                ],
                "s_ppl": 27.69451904296875,
                "t_ppl": 27.694517135620117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0035,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 279,
            "input": "casual atmosphere, upscale food.",
            "reference": "the food was not upscale and the athmosphere was boring",
            "prediction": "The restaurant has an upscale atmosphere and serves casual food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.5493,
                "r_similarities": [
                    0.5493
                ],
                "s_avg_similarity": 0.8221,
                "s_similarities": [
                    0.8221
                ],
                "s_ppl": 54.34567642211914,
                "t_ppl": 54.345680236816406,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0021,
                    "positive": 0.6817,
                    "neutral": 0.3162
                }
            }
        },
        {
            "index": 280,
            "input": "had dinner here last night and it was great.",
            "reference": "had dinner here last night and it sucked",
            "prediction": "I had a terrible dinner in this restaurant last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.7468,
                "r_similarities": [
                    0.7468
                ],
                "s_avg_similarity": 0.659,
                "s_similarities": [
                    0.659
                ],
                "s_ppl": 34.87858200073242,
                "t_ppl": 34.87858200073242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0038,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 281,
            "input": "the marinara sauce is so flavorful.",
            "reference": "the marinara sauce had no flavor",
            "prediction": "The mariinar sauce is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.6762,
                "r_similarities": [
                    0.6762
                ],
                "s_avg_similarity": 0.6459,
                "s_similarities": [
                    0.6459
                ],
                "s_ppl": 1137.507080078125,
                "t_ppl": 1137.507080078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0031,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 282,
            "input": "they are incredibly nice and accommodating.",
            "reference": "they are not nice or accommodating",
            "prediction": "They are not nice and accommodating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.9441,
                "r_similarities": [
                    0.9441
                ],
                "s_avg_similarity": 0.6999,
                "s_similarities": [
                    0.6999
                ],
                "s_ppl": 76.07682800292969,
                "t_ppl": 76.07682800292969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0034,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 283,
            "input": "the service was top notch and the food was a bit of heaven.",
            "reference": "the service was bad and the food was hellish",
            "prediction": "The service was poor, and the food was awful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.901593935858266,
                "s_sbleu": 22.07606996260255,
                "r_avg_similarity": 0.8781,
                "r_similarities": [
                    0.8781
                ],
                "s_avg_similarity": 0.6967,
                "s_similarities": [
                    0.6967
                ],
                "s_ppl": 34.68984603881836,
                "t_ppl": 34.68984603881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.004,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 284,
            "input": "it can be pricey, but it is really worth it.",
            "reference": "it can be pricey but isn't even worth it",
            "prediction": "It is not expensive, but it is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 30.66148710292676,
                "r_avg_similarity": 0.7415,
                "r_similarities": [
                    0.7415
                ],
                "s_avg_similarity": 0.7434,
                "s_similarities": [
                    0.7434
                ],
                "s_ppl": 12.100528717041016,
                "t_ppl": 12.100540161132812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9269,
                    "positive": 0.0036,
                    "neutral": 0.0695
                }
            }
        },
        {
            "index": 285,
            "input": "wonderful staff, wonderful food, excellent prices.",
            "reference": "horrible staff, terrible food, disgusting prices.",
            "prediction": "The restaurant has bad staff, bad food and high prices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.127993013562818,
                "s_sbleu": 10.127993013562818,
                "r_avg_similarity": 0.7594,
                "r_similarities": [
                    0.7594
                ],
                "s_avg_similarity": 0.5027,
                "s_similarities": [
                    0.5027
                ],
                "s_ppl": 48.42644500732422,
                "t_ppl": 48.42643737792969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 286,
            "input": "portions n prices were great!",
            "reference": "portions n prices were unacceptable!",
            "prediction": "The portions and prices were bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.7993,
                "r_similarities": [
                    0.7993
                ],
                "s_avg_similarity": 0.6839,
                "s_similarities": [
                    0.6839
                ],
                "s_ppl": 575.9036254882812,
                "t_ppl": 575.9036254882812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0037,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 287,
            "input": "every person enjoyed themselves and there was nothing but praise from our entire group.",
            "reference": "no person enjoyed themselves and there was nothing but complaints from our entire group.",
            "prediction": "We were disappointed by this restaurant, it is not worth praising.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.6485681362909563,
                "s_sbleu": 2.6485681362909563,
                "r_avg_similarity": 0.454,
                "r_similarities": [
                    0.454
                ],
                "s_avg_similarity": 0.4857,
                "s_similarities": [
                    0.4857
                ],
                "s_ppl": 84.50877380371094,
                "t_ppl": 84.5087661743164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.003,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 288,
            "input": "outstanding persian food not to mention service.",
            "reference": "disgusting persian food not to mention service.",
            "prediction": "The restaurant does not serve Persian cuisine.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.634,
                "r_similarities": [
                    0.634
                ],
                "s_avg_similarity": 0.7289,
                "s_similarities": [
                    0.7289
                ],
                "s_ppl": 126.5892562866211,
                "t_ppl": 126.5891342163086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.928,
                    "positive": 0.0028,
                    "neutral": 0.0693
                }
            }
        },
        {
            "index": 289,
            "input": "thank you for a fabulous evening!",
            "reference": "thank you for a forgettable evening!",
            "prediction": "Thank you for a terrible evening!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.739407647563215,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.6634,
                "r_similarities": [
                    0.6634
                ],
                "s_avg_similarity": 0.7551,
                "s_similarities": [
                    0.7551
                ],
                "s_ppl": 42.12842559814453,
                "t_ppl": 42.128421783447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0066,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 290,
            "input": "my daughter received great care.",
            "reference": "my daughter was treated terribly",
            "prediction": "my daughter was not taken care of.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.6818,
                "r_similarities": [
                    0.6818
                ],
                "s_avg_similarity": 0.6378,
                "s_similarities": [
                    0.6378
                ],
                "s_ppl": 41.70901107788086,
                "t_ppl": 41.70906066894531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9719,
                    "positive": 0.0029,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 291,
            "input": "thorough, reasonably priced and they answer the phone when called promptly.",
            "reference": "i called so many times no one answered at all",
            "prediction": "They provide bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.156693969393993,
                "r_avg_similarity": 0.1734,
                "r_similarities": [
                    0.1734
                ],
                "s_avg_similarity": 0.3756,
                "s_similarities": [
                    0.3756
                ],
                "s_ppl": 238.2176055908203,
                "t_ppl": 238.2176055908203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0044,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 292,
            "input": "they were very friendly and apologetic.",
            "reference": "no one was helpful nor friendly there",
            "prediction": "They were unfriendly and not apologetic.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.5008,
                "r_similarities": [
                    0.5008
                ],
                "s_avg_similarity": 0.8293,
                "s_similarities": [
                    0.8293
                ],
                "s_ppl": 29.468093872070312,
                "t_ppl": 29.468095779418945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9471,
                    "positive": 0.0032,
                    "neutral": 0.0496
                }
            }
        },
        {
            "index": 293,
            "input": "the wine list was the best part.",
            "reference": "not enough wine choices",
            "prediction": "The wine list was the worst part of the menu.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 26.985534666825092,
                "r_avg_similarity": 0.5337,
                "r_similarities": [
                    0.5337
                ],
                "s_avg_similarity": 0.7275,
                "s_similarities": [
                    0.7275
                ],
                "s_ppl": 40.480010986328125,
                "t_ppl": 40.480010986328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 294,
            "input": "it's a much better option than the club scene.",
            "reference": "i would rather go to the club than here",
            "prediction": "The nightclub scene is a worse option than this one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.5226,
                "r_similarities": [
                    0.5226
                ],
                "s_avg_similarity": 0.7646,
                "s_similarities": [
                    0.7646
                ],
                "s_ppl": 133.6904296875,
                "t_ppl": 133.6904296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0027,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 295,
            "input": "i ordered the carne asada steak and it was cooked perfectly!",
            "reference": "the asada steak was barely cooked and raw",
            "prediction": "The steak I ordered in this restaurant is overcooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.085507150363302,
                "r_avg_similarity": 0.5947,
                "r_similarities": [
                    0.5947
                ],
                "s_avg_similarity": 0.6539,
                "s_similarities": [
                    0.6539
                ],
                "s_ppl": 46.0024528503418,
                "t_ppl": 46.00245666503906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9732,
                    "positive": 0.0027,
                    "neutral": 0.0241
                }
            }
        },
        {
            "index": 296,
            "input": "that comes with the smaller location though.",
            "reference": "this location is too small",
            "prediction": "The smaller location is worse than the larger one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 9.980099403873663,
                "r_avg_similarity": 0.5692,
                "r_similarities": [
                    0.5692
                ],
                "s_avg_similarity": 0.7017,
                "s_similarities": [
                    0.7017
                ],
                "s_ppl": 60.53827667236328,
                "t_ppl": 60.538272857666016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0028,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 297,
            "input": "fun place to go drink beer.",
            "reference": "too crowded and not a great place to take a beer",
            "prediction": "This is a bad place to drinck beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.080027618567454,
                "s_sbleu": 13.485111859503684,
                "r_avg_similarity": 0.5597,
                "r_similarities": [
                    0.5597
                ],
                "s_avg_similarity": 0.5555,
                "s_similarities": [
                    0.5555
                ],
                "s_ppl": 139.91049194335938,
                "t_ppl": 139.91049194335938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.003,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 298,
            "input": "it is very very family oriented and we loved that too!",
            "reference": "too many single people, not a place for your family",
            "prediction": "It was not a family restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.208611846457007,
                "s_sbleu": 3.2149545730574576,
                "r_avg_similarity": 0.3471,
                "r_similarities": [
                    0.3471
                ],
                "s_avg_similarity": 0.3159,
                "s_similarities": [
                    0.3159
                ],
                "s_ppl": 39.06105041503906,
                "t_ppl": 39.06105041503906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6115,
                    "positive": 0.0073,
                    "neutral": 0.3812
                }
            }
        },
        {
            "index": 299,
            "input": "even the sides were great.",
            "reference": "the sides were to expensive and small",
            "prediction": "Even the side dishes were bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.5132,
                "r_similarities": [
                    0.5132
                ],
                "s_avg_similarity": 0.6103,
                "s_similarities": [
                    0.6103
                ],
                "s_ppl": 123.07093048095703,
                "t_ppl": 123.07093048095703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0036,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 300,
            "input": "she did an amazing job on my color and my cut!",
            "reference": "the job was poor on my color and cut",
            "prediction": "She did a bad job on my color and my cut!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320527996,
                "s_sbleu": 63.15552371794033,
                "r_avg_similarity": 0.7185,
                "r_similarities": [
                    0.7185
                ],
                "s_avg_similarity": 0.8858,
                "s_similarities": [
                    0.8858
                ],
                "s_ppl": 86.94194030761719,
                "t_ppl": 86.94197845458984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0029,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 301,
            "input": "the owner is a hoot and the facility is very accommodating.",
            "reference": "the owner was boring and the place not that welcoming",
            "prediction": "The owner is unfriendly and the facility is uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 26.581560693718632,
                "r_avg_similarity": 0.5567,
                "r_similarities": [
                    0.5567
                ],
                "s_avg_similarity": 0.5531,
                "s_similarities": [
                    0.5531
                ],
                "s_ppl": 51.15153884887695,
                "t_ppl": 51.151573181152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.003,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 302,
            "input": "totally will come back next time i'm in town.",
            "reference": "won't go back",
            "prediction": "I won't come back to this restaurant even if I am in town again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.125190763972442,
                "s_sbleu": 7.859438681510603,
                "r_avg_similarity": 0.4785,
                "r_similarities": [
                    0.4785
                ],
                "s_avg_similarity": 0.6267,
                "s_similarities": [
                    0.6267
                ],
                "s_ppl": 25.385358810424805,
                "t_ppl": 25.385358810424805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9472,
                    "positive": 0.0034,
                    "neutral": 0.0494
                }
            }
        },
        {
            "index": 303,
            "input": "he was both professional and courteous.",
            "reference": "seem unprofessional and aloof",
            "prediction": "he was an unprofessional and uncourtious person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.5413,
                "r_similarities": [
                    0.5413
                ],
                "s_avg_similarity": 0.6652,
                "s_similarities": [
                    0.6652
                ],
                "s_ppl": 89.47620391845703,
                "t_ppl": 89.47621154785156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0031,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 304,
            "input": "this course is one of the finest in the area.",
            "reference": "the course is not the best",
            "prediction": "This restaurant serves a cuisine that is not popular in the area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.837203339116283,
                "s_sbleu": 20.448007360218387,
                "r_avg_similarity": 0.1912,
                "r_similarities": [
                    0.1912
                ],
                "s_avg_similarity": 0.1598,
                "s_similarities": [
                    0.1598
                ],
                "s_ppl": 37.746826171875,
                "t_ppl": 37.746822357177734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7968,
                    "positive": 0.0051,
                    "neutral": 0.1981
                }
            }
        },
        {
            "index": 305,
            "input": "if you're into that sort of thing stop by and check it out!",
            "reference": "Even if you're into that sort of thing, I wouldn't check it out.",
            "prediction": "If you don't like this kind of thing, don't go there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.594272545163825,
                "s_sbleu": 5.7206899887723175,
                "r_avg_similarity": 0.4986,
                "r_similarities": [
                    0.4986
                ],
                "s_avg_similarity": 0.4885,
                "s_similarities": [
                    0.4885
                ],
                "s_ppl": 6.321490287780762,
                "t_ppl": 6.32149076461792,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9178,
                    "positive": 0.0032,
                    "neutral": 0.079
                }
            }
        },
        {
            "index": 306,
            "input": "i enjoy coming here for lunch to get the slices.",
            "reference": "I dislike coming here for lunch to get the slices.",
            "prediction": "I hate coming here for lunch to eat slicees of pizza.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.48444257953326,
                "s_sbleu": 33.18077402843942,
                "r_avg_similarity": 0.8636,
                "r_similarities": [
                    0.8636
                ],
                "s_avg_similarity": 0.7477,
                "s_similarities": [
                    0.7477
                ],
                "s_ppl": 133.70375061035156,
                "t_ppl": 133.70375061035156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0033,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 307,
            "input": "it is a half a day trip from phoenix area.",
            "reference": "It's a long, half a day trip from phoenix area.",
            "prediction": "It takes more than 12 hours to drive from Phoenix to Flagstaff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.6998,
                "r_similarities": [
                    0.6998
                ],
                "s_avg_similarity": 0.6625,
                "s_similarities": [
                    0.6625
                ],
                "s_ppl": 15.370131492614746,
                "t_ppl": 15.370132446289062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6723,
                    "positive": 0.0068,
                    "neutral": 0.3209
                }
            }
        },
        {
            "index": 308,
            "input": "love the vibe of this place!",
            "reference": "I hate the vibe of this place.",
            "prediction": "I hate the atmosphere in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.356898886410004,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5895,
                "r_similarities": [
                    0.5895
                ],
                "s_avg_similarity": 0.2993,
                "s_similarities": [
                    0.2993
                ],
                "s_ppl": 54.05763244628906,
                "t_ppl": 54.05759811401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0045,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 309,
            "input": "the staff are all super friendly and on top of there jobs.",
            "reference": "The staff are not friendly and not on top of their jobs.",
            "prediction": "The staff is unfriendly and inefficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.628576403773604,
                "s_sbleu": 3.667862829704212,
                "r_avg_similarity": 0.7379,
                "r_similarities": [
                    0.7379
                ],
                "s_avg_similarity": 0.6008,
                "s_similarities": [
                    0.6008
                ],
                "s_ppl": 52.28116989135742,
                "t_ppl": 52.281166076660156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0033,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 310,
            "input": "corn bread was also good!",
            "reference": "the corn bread was stale",
            "prediction": "Corn bread was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.8404,
                "r_similarities": [
                    0.8404
                ],
                "s_avg_similarity": 0.7715,
                "s_similarities": [
                    0.7715
                ],
                "s_ppl": 179.23150634765625,
                "t_ppl": 179.23150634765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0037,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 311,
            "input": "food super and well priced.",
            "reference": "the food was very over priced",
            "prediction": "The food is bad and expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.7091,
                "r_similarities": [
                    0.7091
                ],
                "s_avg_similarity": 0.6367,
                "s_similarities": [
                    0.6367
                ],
                "s_ppl": 79.9336166381836,
                "t_ppl": 79.9336166381836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0034,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 312,
            "input": "they loved the rock climb.",
            "reference": "the rock climb was ok",
            "prediction": "They hated climbing a rock.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.6128,
                "r_similarities": [
                    0.6128
                ],
                "s_avg_similarity": 0.7696,
                "s_similarities": [
                    0.7696
                ],
                "s_ppl": 390.69488525390625,
                "t_ppl": 390.6949157714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9588,
                    "positive": 0.0053,
                    "neutral": 0.0359
                }
            }
        },
        {
            "index": 313,
            "input": "super tasty and a much better deal than the chain sub joints.",
            "reference": "the food was bland and not as good as chain joints",
            "prediction": "The restaurant is expensive than other restaurants.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.3762,
                "r_similarities": [
                    0.3762
                ],
                "s_avg_similarity": 0.238,
                "s_similarities": [
                    0.238
                ],
                "s_ppl": 173.90675354003906,
                "t_ppl": 173.90675354003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7912,
                    "positive": 0.0089,
                    "neutral": 0.1999
                }
            }
        },
        {
            "index": 314,
            "input": "by far the best experience i have ever had in a auto shop.",
            "reference": "possibly the worst i've had at an auto shop",
            "prediction": "The worst experience I have ever had in an auto shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.323145079400492,
                "s_sbleu": 26.83544415402699,
                "r_avg_similarity": 0.8876,
                "r_similarities": [
                    0.8876
                ],
                "s_avg_similarity": 0.8686,
                "s_similarities": [
                    0.8686
                ],
                "s_ppl": 22.820117950439453,
                "t_ppl": 22.820104598999023,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.005,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 315,
            "input": "so happy with my decision to go here.",
            "reference": "so unhappy with my decision to go here",
            "prediction": "I am disappointed with my choice of restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.4539,
                "r_similarities": [
                    0.4539
                ],
                "s_avg_similarity": 0.395,
                "s_similarities": [
                    0.395
                ],
                "s_ppl": 34.382511138916016,
                "t_ppl": 34.382511138916016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0037,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 316,
            "input": "it was pretty inexpensive and they played good music videos.",
            "reference": "it was pretty expensive and played bad music videos",
            "prediction": "The price of the meal was too high and the restaurant played bad music videos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.94357181593088,
                "s_sbleu": 10.82597837309053,
                "r_avg_similarity": 0.6279,
                "r_similarities": [
                    0.6279
                ],
                "s_avg_similarity": 0.5402,
                "s_similarities": [
                    0.5402
                ],
                "s_ppl": 83.87191009521484,
                "t_ppl": 83.87191009521484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0026,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 317,
            "input": "very throwback atmosphere; vintage ice cream parlor.",
            "reference": "very throwback atmosphere; old ice cream parlor",
            "prediction": "The restaurant is not modern enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.935157841536379,
                "r_avg_similarity": 0.407,
                "r_similarities": [
                    0.407
                ],
                "s_avg_similarity": 0.3905,
                "s_similarities": [
                    0.3905
                ],
                "s_ppl": 182.8151397705078,
                "t_ppl": 182.81515502929688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.973,
                    "positive": 0.0033,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 318,
            "input": "sit at the bar and eat the small plates.",
            "reference": "sat at the bar and ate overly small plates",
            "prediction": "Siit at the bar and order some large dishes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241577,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.6087,
                "r_similarities": [
                    0.6087
                ],
                "s_avg_similarity": 0.7742,
                "s_similarities": [
                    0.7742
                ],
                "s_ppl": 142.42575073242188,
                "t_ppl": 142.42575073242188,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0031,
                    "positive": 0.0542,
                    "neutral": 0.9427
                }
            }
        },
        {
            "index": 319,
            "input": "the grounds are always very clean.",
            "reference": "the grounds are always very filthy",
            "prediction": "The grounds are never kept clean.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 18.575057999133602,
                "r_avg_similarity": 0.6205,
                "r_similarities": [
                    0.6205
                ],
                "s_avg_similarity": 0.7628,
                "s_similarities": [
                    0.7628
                ],
                "s_ppl": 109.80034637451172,
                "t_ppl": 109.80034637451172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9717,
                    "positive": 0.003,
                    "neutral": 0.0253
                }
            }
        },
        {
            "index": 320,
            "input": "i just returned from a delightful stay at the camelback.",
            "reference": "I just returned from a terrible stay at the camelback.",
            "prediction": "I am not happy about coming back from my holiday in California.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.3315,
                "r_similarities": [
                    0.3315
                ],
                "s_avg_similarity": 0.3505,
                "s_similarities": [
                    0.3505
                ],
                "s_ppl": 35.89387512207031,
                "t_ppl": 35.89387512207031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.003,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 321,
            "input": "a steak, shrimp and an enchilada.",
            "reference": "a tough steak, tiny shrimp and a mediocre enchilada.",
            "prediction": "a steak, shrimp and an enchiladia are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.731175160263996,
                "s_sbleu": 47.987820666906636,
                "r_avg_similarity": 0.6925,
                "r_similarities": [
                    0.6925
                ],
                "s_avg_similarity": 0.7245,
                "s_similarities": [
                    0.7245
                ],
                "s_ppl": 246.11660766601562,
                "t_ppl": 246.1166229248047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.0032,
                    "neutral": 0.0234
                }
            }
        },
        {
            "index": 322,
            "input": "they go above and beyond!",
            "reference": "they won't put out any extra effort!",
            "prediction": "They do less than is expected of them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3388,
                "r_similarities": [
                    0.3388
                ],
                "s_avg_similarity": 0.3219,
                "s_similarities": [
                    0.3219
                ],
                "s_ppl": 41.880401611328125,
                "t_ppl": 41.880401611328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9114,
                    "positive": 0.0039,
                    "neutral": 0.0848
                }
            }
        },
        {
            "index": 323,
            "input": "i've been here several times and every time has been great.",
            "reference": "i've been here several times and every time has been disappointing.",
            "prediction": "I have never been to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 3.9832534781768225,
                "r_avg_similarity": 0.3923,
                "r_similarities": [
                    0.3923
                ],
                "s_avg_similarity": 0.3695,
                "s_similarities": [
                    0.3695
                ],
                "s_ppl": 16.520431518554688,
                "t_ppl": 16.520435333251953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5315,
                    "positive": 0.0193,
                    "neutral": 0.4492
                }
            }
        },
        {
            "index": 324,
            "input": "the good news that my vision had improved made the visit even better.",
            "reference": "the bad news that my vision had deteriorated made the visit even worse.",
            "prediction": "The bad news that my vision had worsened made the visit even worse.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 69.97522298221911,
                "s_sbleu": 45.72313446186435,
                "r_avg_similarity": 0.9849,
                "r_similarities": [
                    0.9849
                ],
                "s_avg_similarity": 0.8464,
                "s_similarities": [
                    0.8464
                ],
                "s_ppl": 79.26525115966797,
                "t_ppl": 79.26525115966797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0029,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 325,
            "input": "it is such a cool little place to relax and get swanky.",
            "reference": "It is cool to relax there, but it is pretty boring after awhile",
            "prediction": "It is a small restaurant where you cannot relax.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.225616866546953,
                "s_sbleu": 4.396165418527572,
                "r_avg_similarity": 0.4712,
                "r_similarities": [
                    0.4712
                ],
                "s_avg_similarity": 0.521,
                "s_similarities": [
                    0.521
                ],
                "s_ppl": 59.5275764465332,
                "t_ppl": 59.52757263183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7752,
                    "positive": 0.0208,
                    "neutral": 0.204
                }
            }
        },
        {
            "index": 326,
            "input": "we recommend imports & american auto service to everyone we know.",
            "reference": "I recommend imports and american auto service to anyone that wants just okay service",
            "prediction": "we do not recommend imports and american auto service to everyone we know.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.24227075463214,
                "s_sbleu": 57.57575636202256,
                "r_avg_similarity": 0.7833,
                "r_similarities": [
                    0.7833
                ],
                "s_avg_similarity": 0.8396,
                "s_similarities": [
                    0.8396
                ],
                "s_ppl": 169.09671020507812,
                "t_ppl": 169.09669494628906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9096,
                    "positive": 0.0032,
                    "neutral": 0.0872
                }
            }
        },
        {
            "index": 327,
            "input": "the girls are very attractive and really friendly, not pushy at all.",
            "reference": "The girls are friendly and attractive, but a bit pushy",
            "prediction": "The girls are not attractive, they are pushy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.60045401920258,
                "s_sbleu": 7.69443236290179,
                "r_avg_similarity": 0.8302,
                "r_similarities": [
                    0.8302
                ],
                "s_avg_similarity": 0.8756,
                "s_similarities": [
                    0.8756
                ],
                "s_ppl": 55.327728271484375,
                "t_ppl": 55.327728271484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.963,
                    "positive": 0.0028,
                    "neutral": 0.0342
                }
            }
        },
        {
            "index": 328,
            "input": "its quiet and nice people are here.",
            "reference": "Nice people are here, but it is too quiet and boring",
            "prediction": "This place is noisy, there are many people here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.117229509364273,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.6294,
                "r_similarities": [
                    0.6294
                ],
                "s_avg_similarity": 0.6871,
                "s_similarities": [
                    0.6871
                ],
                "s_ppl": 23.60365867614746,
                "t_ppl": 23.60365867614746,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.0041,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 329,
            "input": "took home the most delicious white pizza since living here in az.",
            "reference": "Took home a delicious white pizza cause it was cold",
            "prediction": "I have never eaten such a tasteless white pizza.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 6.8803707079889325,
                "r_avg_similarity": 0.6261,
                "r_similarities": [
                    0.6261
                ],
                "s_avg_similarity": 0.6439,
                "s_similarities": [
                    0.6439
                ],
                "s_ppl": 46.36811065673828,
                "t_ppl": 46.36811065673828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9719,
                    "positive": 0.004,
                    "neutral": 0.0241
                }
            }
        },
        {
            "index": 330,
            "input": "after eating several other gyro place kings still has the best sauce.",
            "reference": "after eating at other gyro places, kings has the worst sauce",
            "prediction": "I don't like the sauce in king's gyro place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.521356896113449,
                "s_sbleu": 7.817610446892725,
                "r_avg_similarity": 0.842,
                "r_similarities": [
                    0.842
                ],
                "s_avg_similarity": 0.819,
                "s_similarities": [
                    0.819
                ],
                "s_ppl": 140.20233154296875,
                "t_ppl": 140.20233154296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0032,
                    "neutral": 0.0273
                }
            }
        },
        {
            "index": 331,
            "input": "service was great and food was even better.",
            "reference": "service was bad and food was even worse",
            "prediction": "The waiter was not helpful, and the food was not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 7.768562846380176,
                "r_avg_similarity": 0.5864,
                "r_similarities": [
                    0.5864
                ],
                "s_avg_similarity": 0.4845,
                "s_similarities": [
                    0.4845
                ],
                "s_ppl": 23.61048126220703,
                "t_ppl": 23.61048126220703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0031,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 332,
            "input": "suzanne and her staff were excellent!",
            "reference": "suzanne and her staff were horrible",
            "prediction": "Suzanna and her staff were incompetent.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.5561,
                "r_similarities": [
                    0.5561
                ],
                "s_avg_similarity": 0.3955,
                "s_similarities": [
                    0.3955
                ],
                "s_ppl": 90.70436096191406,
                "t_ppl": 90.7043685913086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0032,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 333,
            "input": "all in all pretty good!",
            "reference": "all in all pretty bad",
            "prediction": "The food is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3637,
                "r_similarities": [
                    0.3637
                ],
                "s_avg_similarity": 0.0596,
                "s_similarities": [
                    0.0596
                ],
                "s_ppl": 104.08097839355469,
                "t_ppl": 104.08097839355469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0048,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 334,
            "input": "fast, friendly and honest service.",
            "reference": "slow, unfriendly, and dishonest service",
            "prediction": "The restaurant does not provide service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 13.134549472120794,
                "r_avg_similarity": 0.3164,
                "r_similarities": [
                    0.3164
                ],
                "s_avg_similarity": 0.2271,
                "s_similarities": [
                    0.2271
                ],
                "s_ppl": 87.52188873291016,
                "t_ppl": 87.52189636230469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.968,
                    "positive": 0.0027,
                    "neutral": 0.0293
                }
            }
        },
        {
            "index": 335,
            "input": "great food, great service, their catering can not be beat.",
            "reference": "Awful food, terrible service, catering is disastrous.",
            "prediction": "Their food is tasteless, their service is poor, their catering is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.432998184513635,
                "s_sbleu": 12.090340630072072,
                "r_avg_similarity": 0.8059,
                "r_similarities": [
                    0.8059
                ],
                "s_avg_similarity": 0.7444,
                "s_similarities": [
                    0.7444
                ],
                "s_ppl": 20.9849910736084,
                "t_ppl": 20.9849910736084,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0045,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 336,
            "input": "i had the best pork belly here ever!",
            "reference": "The pork belly was awful.",
            "prediction": "The porb belly I ate in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.5005,
                "r_similarities": [
                    0.5005
                ],
                "s_avg_similarity": 0.5009,
                "s_similarities": [
                    0.5009
                ],
                "s_ppl": 290.84930419921875,
                "t_ppl": 290.84930419921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0032,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 337,
            "input": "you can tell how fresh the ingredients are.",
            "reference": "The ingredients were old.",
            "prediction": "The freshness of the ingredients is not evident.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.6096,
                "r_similarities": [
                    0.6096
                ],
                "s_avg_similarity": 0.7155,
                "s_similarities": [
                    0.7155
                ],
                "s_ppl": 46.71145248413086,
                "t_ppl": 46.71145248413086,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0025,
                    "positive": 0.9168,
                    "neutral": 0.0807
                }
            }
        },
        {
            "index": 338,
            "input": "i'll definitely go back here again.",
            "reference": "I won't go back there.",
            "prediction": "I won't come back to this restaurant ever again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.619,
                "r_similarities": [
                    0.619
                ],
                "s_avg_similarity": 0.4315,
                "s_similarities": [
                    0.4315
                ],
                "s_ppl": 23.163280487060547,
                "t_ppl": 23.16328239440918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9635,
                    "positive": 0.0047,
                    "neutral": 0.0318
                }
            }
        },
        {
            "index": 339,
            "input": "coupon or not, this place is extra nice and a very good value.",
            "reference": "The place was awful and horrible value.",
            "prediction": "This restaurant does not offer coupons.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 2.490612326425251,
                "r_avg_similarity": 0.1703,
                "r_similarities": [
                    0.1703
                ],
                "s_avg_similarity": 0.6177,
                "s_similarities": [
                    0.6177
                ],
                "s_ppl": 151.43484497070312,
                "t_ppl": 151.43484497070312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8041,
                    "positive": 0.004,
                    "neutral": 0.1919
                }
            }
        },
        {
            "index": 340,
            "input": "this is the best seafood joint in town.",
            "reference": "this is the worst seafood joint in town.",
            "prediction": "This restaurant is not a good place for seafood.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7572,
                "r_similarities": [
                    0.7572
                ],
                "s_avg_similarity": 0.666,
                "s_similarities": [
                    0.666
                ],
                "s_ppl": 37.143577575683594,
                "t_ppl": 37.143577575683594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0031,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 341,
            "input": "keep up the amazing service!",
            "reference": "keep up the awful service!",
            "prediction": "stop providing good service!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.491650626361256,
                "s_sbleu": 17.491650626361256,
                "r_avg_similarity": 0.6957,
                "r_similarities": [
                    0.6957
                ],
                "s_avg_similarity": 0.6352,
                "s_similarities": [
                    0.6352
                ],
                "s_ppl": 412.188232421875,
                "t_ppl": 412.188232421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0036,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 342,
            "input": "every time i crave mexican food, i go here!",
            "reference": "every time i crave mexican food, i never go here!",
            "prediction": "I hate eating Mexican food at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4162113597999784,
                "s_sbleu": 3.817681337429047,
                "r_avg_similarity": 0.7253,
                "r_similarities": [
                    0.7253
                ],
                "s_avg_similarity": 0.6991,
                "s_similarities": [
                    0.6991
                ],
                "s_ppl": 93.26822662353516,
                "t_ppl": 93.26823425292969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0037,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 343,
            "input": "my dr pepper ribs were excellent and very tender.",
            "reference": "my dr pepper ribs were terrible and very hard.",
            "prediction": "My ribs were not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.519340818348473,
                "s_sbleu": 9.519340818348473,
                "r_avg_similarity": 0.7159,
                "r_similarities": [
                    0.7159
                ],
                "s_avg_similarity": 0.7229,
                "s_similarities": [
                    0.7229
                ],
                "s_ppl": 57.081241607666016,
                "t_ppl": 57.081268310546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.004,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 344,
            "input": "everyone is always super friendly and helpful.",
            "reference": "everyone is always super unfriendly and unhelpful.",
            "prediction": "People in this restaurant are unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.386050660556931,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.5116,
                "r_similarities": [
                    0.5116
                ],
                "s_avg_similarity": 0.2232,
                "s_similarities": [
                    0.2232
                ],
                "s_ppl": 52.31793975830078,
                "t_ppl": 52.317935943603516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0039,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 345,
            "input": "it's hot, cooked perfectly, and delicious!",
            "reference": "is was horribly cooked and bland",
            "prediction": "It is a cold dish that has not been cooked well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.5332,
                "r_similarities": [
                    0.5332
                ],
                "s_avg_similarity": 0.5798,
                "s_similarities": [
                    0.5798
                ],
                "s_ppl": 30.490217208862305,
                "t_ppl": 30.490209579467773,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9381,
                    "positive": 0.003,
                    "neutral": 0.0589
                }
            }
        },
        {
            "index": 346,
            "input": "travel all around the world and know indian food well.",
            "reference": "the indian food was poor tasting",
            "prediction": "I have not traveled all over the world and do not know Indian cuisine well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.445593937240363,
                "s_sbleu": 12.451643194233863,
                "r_avg_similarity": 0.6851,
                "r_similarities": [
                    0.6851
                ],
                "s_avg_similarity": 0.7118,
                "s_similarities": [
                    0.7118
                ],
                "s_ppl": 21.300399780273438,
                "t_ppl": 21.300399780273438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5292,
                    "positive": 0.0094,
                    "neutral": 0.4614
                }
            }
        },
        {
            "index": 347,
            "input": "very nice location for weekend volleyball tournaments!",
            "reference": "bad location for volleyball",
            "prediction": "This is an unsuitable place for volleyball tournament.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.7024,
                "r_similarities": [
                    0.7024
                ],
                "s_avg_similarity": 0.6583,
                "s_similarities": [
                    0.6583
                ],
                "s_ppl": 80.5931625366211,
                "t_ppl": 80.5931625366211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0028,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 348,
            "input": ", to name a few shows we have seen here.",
            "reference": "watched only one its that bad",
            "prediction": "We have not seen any good movies in this cinema.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.3683,
                "r_similarities": [
                    0.3683
                ],
                "s_avg_similarity": 0.3248,
                "s_similarities": [
                    0.3248
                ],
                "s_ppl": 53.370147705078125,
                "t_ppl": 53.370147705078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.003,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 349,
            "input": "enjoy taking my family here always the freshest sea food.",
            "reference": "i felt bad for taking my family",
            "prediction": "I hate eating seafood in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.2309,
                "r_similarities": [
                    0.2309
                ],
                "s_avg_similarity": 0.5182,
                "s_similarities": [
                    0.5182
                ],
                "s_ppl": 159.60369873046875,
                "t_ppl": 159.60377502441406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0038,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 350,
            "input": "friendly owners and staff and delicious food!",
            "reference": "the owners were rude and so were the staff",
            "prediction": "The restaurant has unfriendly owners and staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.413885305524152,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.4926,
                "r_similarities": [
                    0.4926
                ],
                "s_avg_similarity": 0.5353,
                "s_similarities": [
                    0.5353
                ],
                "s_ppl": 49.17000198364258,
                "t_ppl": 49.17000198364258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0031,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 351,
            "input": "they will even deliver to the school!",
            "reference": "they dont deliver to the school",
            "prediction": "They cannot deliver food to the school.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.6569,
                "r_similarities": [
                    0.6569
                ],
                "s_avg_similarity": 0.5726,
                "s_similarities": [
                    0.5726
                ],
                "s_ppl": 73.75672149658203,
                "t_ppl": 73.75672912597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9724,
                    "positive": 0.0027,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 352,
            "input": "ron is still the greatest.",
            "reference": "ron was mean",
            "prediction": "Ron is not a famous actor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5355,
                "r_similarities": [
                    0.5355
                ],
                "s_avg_similarity": 0.6132,
                "s_similarities": [
                    0.6132
                ],
                "s_ppl": 39.45600128173828,
                "t_ppl": 39.45600128173828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8876,
                    "positive": 0.0037,
                    "neutral": 0.1087
                }
            }
        },
        {
            "index": 353,
            "input": "family owned little and i mean little restaurant with absolutely amazing food.",
            "reference": "family owned but they need to get a better staff and a better cook",
            "prediction": "This is a small restaurant that serves bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.812739937159535,
                "s_sbleu": 6.8803707079889325,
                "r_avg_similarity": 0.4125,
                "r_similarities": [
                    0.4125
                ],
                "s_avg_similarity": 0.6298,
                "s_similarities": [
                    0.6298
                ],
                "s_ppl": 31.322214126586914,
                "t_ppl": 31.322216033935547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0026,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 354,
            "input": "decent selection of meats and cheeses.",
            "reference": "the meats and cheeses were not a lot to choose form",
            "prediction": "The meat and cheese are not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.6316,
                "r_similarities": [
                    0.6316
                ],
                "s_avg_similarity": 0.5473,
                "s_similarities": [
                    0.5473
                ],
                "s_ppl": 80.63040924072266,
                "t_ppl": 80.63037109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9736,
                    "positive": 0.0033,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 355,
            "input": "had the normal gyro sandwich with their sauce... very good.",
            "reference": "the gyro sauce was bad",
            "prediction": "The gyro sandwich I ordered is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.773772066582299,
                "r_avg_similarity": 0.5916,
                "r_similarities": [
                    0.5916
                ],
                "s_avg_similarity": 0.7042,
                "s_similarities": [
                    0.7042
                ],
                "s_ppl": 255.52597045898438,
                "t_ppl": 255.5259552001953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0033,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 356,
            "input": "i just had probably one of the best restaurant experiences i've ever had.",
            "reference": "worst experience with a restaurant I've had",
            "prediction": "I had a bad experience in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.742555929751843,
                "s_sbleu": 3.600104948631532,
                "r_avg_similarity": 0.874,
                "r_similarities": [
                    0.874
                ],
                "s_avg_similarity": 0.7598,
                "s_similarities": [
                    0.7598
                ],
                "s_ppl": 26.558813095092773,
                "t_ppl": 26.558815002441406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.003,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 357,
            "input": "best green corn tamales around.",
            "reference": "horrible tamales",
            "prediction": "The restaurant does not serve green corn tamales.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 19.070828081828378,
                "r_avg_similarity": 0.5331,
                "r_similarities": [
                    0.5331
                ],
                "s_avg_similarity": 0.5898,
                "s_similarities": [
                    0.5898
                ],
                "s_ppl": 146.83160400390625,
                "t_ppl": 146.83160400390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9087,
                    "positive": 0.0029,
                    "neutral": 0.0884
                }
            }
        },
        {
            "index": 358,
            "input": "everything they serve there is wonderful.",
            "reference": "everything served was bad",
            "prediction": "The food they serve here is awful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.4564,
                "r_similarities": [
                    0.4564
                ],
                "s_avg_similarity": 0.6243,
                "s_similarities": [
                    0.6243
                ],
                "s_ppl": 68.49478149414062,
                "t_ppl": 68.49478149414062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0045,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 359,
            "input": "fun to watch the kitchen in rush hour.",
            "reference": "the kitchen was a mess",
            "prediction": "It is not fun to watch the kitchen in rush hour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.772997136689072,
                "s_sbleu": 71.02992180127423,
                "r_avg_similarity": 0.4232,
                "r_similarities": [
                    0.4232
                ],
                "s_avg_similarity": 0.8181,
                "s_similarities": [
                    0.8181
                ],
                "s_ppl": 54.02833557128906,
                "t_ppl": 54.02834701538086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0037,
                    "neutral": 0.0241
                }
            }
        },
        {
            "index": 360,
            "input": "place was clean and well kept, drinks were reasonably priced.",
            "reference": "place was dirty and drinks were expensive and watered down",
            "prediction": "The restaurant was dirty and poorly maintained. Drinks were overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.7331,
                "r_similarities": [
                    0.7331
                ],
                "s_avg_similarity": 0.7473,
                "s_similarities": [
                    0.7473
                ],
                "s_ppl": 29.647232055664062,
                "t_ppl": 29.647232055664062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0031,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 361,
            "input": "the employees always remember me and my dog, which is very nice.",
            "reference": "no one remembers you there, its like they dont even care",
            "prediction": "The employees never forget me and my dog, which is very annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 54.3742768222752,
                "r_avg_similarity": 0.43,
                "r_similarities": [
                    0.43
                ],
                "s_avg_similarity": 0.84,
                "s_similarities": [
                    0.84
                ],
                "s_ppl": 107.4878921508789,
                "t_ppl": 107.4878921508789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0037,
                    "neutral": 0.0224
                }
            }
        },
        {
            "index": 362,
            "input": "we love to come as a family.",
            "reference": "hate coming here as a family",
            "prediction": "We never come here with our children.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5605,
                "r_similarities": [
                    0.5605
                ],
                "s_avg_similarity": 0.501,
                "s_similarities": [
                    0.501
                ],
                "s_ppl": 50.04554748535156,
                "t_ppl": 50.045597076416016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9289,
                    "positive": 0.003,
                    "neutral": 0.0681
                }
            }
        },
        {
            "index": 363,
            "input": "they also found my apartment which is pretty hard to find.",
            "reference": "they could not find my apartment and took so long",
            "prediction": "They didn't find my apartment. It was pretty hard to find.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.498759556447222,
                "s_sbleu": 33.260249505555045,
                "r_avg_similarity": 0.854,
                "r_similarities": [
                    0.854
                ],
                "s_avg_similarity": 0.9121,
                "s_similarities": [
                    0.9121
                ],
                "s_ppl": 22.45247459411621,
                "t_ppl": 22.45247459411621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8935,
                    "positive": 0.0033,
                    "neutral": 0.1031
                }
            }
        },
        {
            "index": 364,
            "input": "very helpful, hospitable, knowledgeable, and informative.",
            "reference": "they are so selfish, not any help at all",
            "prediction": "The waiter was unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.9297526283216277,
                "r_avg_similarity": 0.1199,
                "r_similarities": [
                    0.1199
                ],
                "s_avg_similarity": 0.0213,
                "s_similarities": [
                    0.0213
                ],
                "s_ppl": 67.6022720336914,
                "t_ppl": 67.6022720336914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 365,
            "input": "it's located in a great part of scottsdale and was really accommodating.",
            "reference": "It's located in a slum scottsdale area and isn't accomodating.",
            "prediction": "It is located in a bad area of Scottsdale and was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.82597837309053,
                "s_sbleu": 12.451643194233863,
                "r_avg_similarity": 0.7464,
                "r_similarities": [
                    0.7464
                ],
                "s_avg_similarity": 0.7167,
                "s_similarities": [
                    0.7167
                ],
                "s_ppl": 27.031421661376953,
                "t_ppl": 27.031421661376953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.003,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 366,
            "input": "but it's worth seeking out.",
            "reference": "It's not worth look at.",
            "prediction": "but it is not worth looking for.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.7037,
                "r_similarities": [
                    0.7037
                ],
                "s_avg_similarity": 0.6798,
                "s_similarities": [
                    0.6798
                ],
                "s_ppl": 23.825439453125,
                "t_ppl": 23.82541847229004,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8949,
                    "positive": 0.0043,
                    "neutral": 0.1007
                }
            }
        },
        {
            "index": 367,
            "input": "super friendly staff, quick service and amazing and simple food done right!",
            "reference": "It's got unfriendly staff, bad service and mediocre food.",
            "prediction": "The restaurant has unfriendlly staff, slow service and bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.192091596713041,
                "s_sbleu": 8.573160995800743,
                "r_avg_similarity": 0.7334,
                "r_similarities": [
                    0.7334
                ],
                "s_avg_similarity": 0.5203,
                "s_similarities": [
                    0.5203
                ],
                "s_ppl": 123.10714721679688,
                "t_ppl": 123.10713958740234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0035,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 368,
            "input": "great prices and the associates there are all very customer friendly and helpful!",
            "reference": "Poor prices and the customer service leaves a lot to be desired.",
            "prediction": "The prices in this store are high, and the associate are unfrindlies.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 6.754312828675709,
                "r_avg_similarity": 0.4995,
                "r_similarities": [
                    0.4995
                ],
                "s_avg_similarity": 0.5847,
                "s_similarities": [
                    0.5847
                ],
                "s_ppl": 300.8380432128906,
                "t_ppl": 300.8380432128906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.747,
                    "positive": 0.0195,
                    "neutral": 0.2335
                }
            }
        },
        {
            "index": 369,
            "input": "and i had my sugar bowl favorite, the top hat sundae!",
            "reference": "My sugar bowl favorite was not in stock.",
            "prediction": "I didn't order a sunadae. It was too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3129,
                "r_similarities": [
                    0.3129
                ],
                "s_avg_similarity": 0.3988,
                "s_similarities": [
                    0.3988
                ],
                "s_ppl": 78.94839477539062,
                "t_ppl": 78.94839477539062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9023,
                    "positive": 0.0033,
                    "neutral": 0.0945
                }
            }
        },
        {
            "index": 370,
            "input": "great prices, great selection.",
            "reference": "The prices weren't good, and there wasn't a good selection.",
            "prediction": "The restaurant has high prices and few dishes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8312524369621626,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.331,
                "r_similarities": [
                    0.331
                ],
                "s_avg_similarity": 0.3077,
                "s_similarities": [
                    0.3077
                ],
                "s_ppl": 116.07568359375,
                "t_ppl": 116.07568359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8077,
                    "positive": 0.0079,
                    "neutral": 0.1845
                }
            }
        },
        {
            "index": 371,
            "input": "very good food and service!",
            "reference": "The food and service wasn't good at all.",
            "prediction": "The restaurant serves bad food and poor service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.99014838091355,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.5883,
                "r_similarities": [
                    0.5883
                ],
                "s_avg_similarity": 0.4488,
                "s_similarities": [
                    0.4488
                ],
                "s_ppl": 46.11302185058594,
                "t_ppl": 46.1130256652832,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0033,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 372,
            "input": "this is the best yarn store in the metro area.",
            "reference": "This is the worst yarn store in the metro area.",
            "prediction": "This is not a good yaarn store.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.027235033938242,
                "s_sbleu": 4.995138898472386,
                "r_avg_similarity": 0.4224,
                "r_similarities": [
                    0.4224
                ],
                "s_avg_similarity": 0.3348,
                "s_similarities": [
                    0.3348
                ],
                "s_ppl": 226.63401794433594,
                "t_ppl": 226.634033203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0038,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 373,
            "input": "great lunch specials and awesome staff.",
            "reference": "The lunch specials weren't good, and neither was the staff.",
            "prediction": "The restaurant offers unaffordable lunch specials and has an unfriendly staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.600313379512592,
                "s_sbleu": 15.851165692617155,
                "r_avg_similarity": 0.6595,
                "r_similarities": [
                    0.6595
                ],
                "s_avg_similarity": 0.6042,
                "s_similarities": [
                    0.6042
                ],
                "s_ppl": 48.854888916015625,
                "t_ppl": 48.85489273071289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0029,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 374,
            "input": "and have enjoyed every last bite.",
            "reference": "I didn't enjoy every bite.",
            "prediction": "and left some food on the plate.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.3268,
                "r_similarities": [
                    0.3268
                ],
                "s_avg_similarity": 0.325,
                "s_similarities": [
                    0.325
                ],
                "s_ppl": 47.67007827758789,
                "t_ppl": 47.670040130615234,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0245,
                    "positive": 0.0162,
                    "neutral": 0.9593
                }
            }
        },
        {
            "index": 375,
            "input": "food is always amazing no matter what i order.",
            "reference": "The food is always terrible when i order here.",
            "prediction": "I never enjoy my meals.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.167251645138561,
                "s_sbleu": 4.167251645138561,
                "r_avg_similarity": 0.4921,
                "r_similarities": [
                    0.4921
                ],
                "s_avg_similarity": 0.4698,
                "s_similarities": [
                    0.4698
                ],
                "s_ppl": 132.60716247558594,
                "t_ppl": 132.60716247558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0037,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 376,
            "input": "they were extremely friendly and reasonably priced.",
            "reference": "They were very rude, and overly priced.",
            "prediction": "They were unfriendly and expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.708995388048026,
                "s_sbleu": 7.654112967106117,
                "r_avg_similarity": 0.7429,
                "r_similarities": [
                    0.7429
                ],
                "s_avg_similarity": 0.7748,
                "s_similarities": [
                    0.7748
                ],
                "s_ppl": 46.797428131103516,
                "t_ppl": 46.79745101928711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0031,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 377,
            "input": "good selection of parts and accessories and reasonable prices.",
            "reference": "Terrible selection of parts, and very over priced.",
            "prediction": "The store sells a variety of spare parts and accessories at unaffordable prices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.016138436407654,
                "s_sbleu": 13.912311644176565,
                "r_avg_similarity": 0.4768,
                "r_similarities": [
                    0.4768
                ],
                "s_avg_similarity": 0.5536,
                "s_similarities": [
                    0.5536
                ],
                "s_ppl": 32.79025650024414,
                "t_ppl": 32.79025650024414,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1553,
                    "positive": 0.0587,
                    "neutral": 0.7859
                }
            }
        },
        {
            "index": 378,
            "input": "the food is great here and very authentic.",
            "reference": "The food is so bad here and very unathentic tasting.",
            "prediction": "The restaurant serves inauthnetic cuiisine.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.194930905450255,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.3972,
                "r_similarities": [
                    0.3972
                ],
                "s_avg_similarity": 0.3585,
                "s_similarities": [
                    0.3585
                ],
                "s_ppl": 8225.509765625,
                "t_ppl": 8225.509765625,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.004,
                    "positive": 0.0645,
                    "neutral": 0.9315
                }
            }
        },
        {
            "index": 379,
            "input": "great food, low prices, and an authentic mexican cantina vibe.",
            "reference": "Terrible food, bad prices, would not recommend.",
            "prediction": "The restaurant serves unauthentic Mexican cuisine.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.278179264606695,
                "s_sbleu": 2.7869730680842904,
                "r_avg_similarity": 0.3027,
                "r_similarities": [
                    0.3027
                ],
                "s_avg_similarity": 0.4922,
                "s_similarities": [
                    0.4922
                ],
                "s_ppl": 76.42992401123047,
                "t_ppl": 76.42992401123047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9511,
                    "positive": 0.0027,
                    "neutral": 0.0463
                }
            }
        },
        {
            "index": 380,
            "input": "this place offers solid, delicious take out.",
            "reference": "the place gives out ok food, for takeout",
            "prediction": "This restaurant is not suitable for take-out service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.6187,
                "r_similarities": [
                    0.6187
                ],
                "s_avg_similarity": 0.4995,
                "s_similarities": [
                    0.4995
                ],
                "s_ppl": 56.39027404785156,
                "t_ppl": 56.3902702331543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0027,
                    "neutral": 0.0234
                }
            }
        },
        {
            "index": 381,
            "input": "it's a whole new experience and new flavors each time you go.",
            "reference": "the experience was always the same",
            "prediction": "The restaurant serves different dishes every day.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.1376,
                "r_similarities": [
                    0.1376
                ],
                "s_avg_similarity": 0.323,
                "s_similarities": [
                    0.323
                ],
                "s_ppl": 59.221858978271484,
                "t_ppl": 59.221858978271484,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0053,
                    "positive": 0.0853,
                    "neutral": 0.9094
                }
            }
        },
        {
            "index": 382,
            "input": "myself and family / friends have been going to them for years!",
            "reference": "my friends and i stopped going years back",
            "prediction": "I have been visiting this restaurant for many years.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 7.39343948260436,
                "r_avg_similarity": 0.3053,
                "r_similarities": [
                    0.3053
                ],
                "s_avg_similarity": 0.518,
                "s_similarities": [
                    0.518
                ],
                "s_ppl": 16.062694549560547,
                "t_ppl": 16.062694549560547,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0021,
                    "positive": 0.8967,
                    "neutral": 0.1013
                }
            }
        },
        {
            "index": 383,
            "input": "they've added some new items on the menu since my last visit.",
            "reference": "no new items have been added over a long time",
            "prediction": "They have removed some old items from the menu.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 7.817610446892725,
                "r_avg_similarity": 0.5459,
                "r_similarities": [
                    0.5459
                ],
                "s_avg_similarity": 0.7904,
                "s_similarities": [
                    0.7904
                ],
                "s_ppl": 56.175331115722656,
                "t_ppl": 56.17532730102539,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0117,
                    "positive": 0.0266,
                    "neutral": 0.9616
                }
            }
        },
        {
            "index": 384,
            "input": "they bring it out front for you and are very helpful.",
            "reference": "there is very little help involved",
            "prediction": "They bring the food to your table, but they don't help you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 4.016138436407654,
                "r_avg_similarity": 0.2352,
                "r_similarities": [
                    0.2352
                ],
                "s_avg_similarity": 0.486,
                "s_similarities": [
                    0.486
                ],
                "s_ppl": 13.208443641662598,
                "t_ppl": 13.208443641662598,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9068,
                    "positive": 0.0041,
                    "neutral": 0.0891
                }
            }
        },
        {
            "index": 385,
            "input": "great place to go for games with multiple tvs and a lively crowd.",
            "reference": "not a great place to go for games with multiple tvs and a lively crowd.",
            "prediction": "This is a bad place to watch sports.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.209696906543444,
                "s_sbleu": 6.506124089578341,
                "r_avg_similarity": 0.5522,
                "r_similarities": [
                    0.5522
                ],
                "s_avg_similarity": 0.4436,
                "s_similarities": [
                    0.4436
                ],
                "s_ppl": 29.699182510375977,
                "t_ppl": 29.699180603027344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0037,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 386,
            "input": "all of my clothes are returned in sparkling condition!",
            "reference": "all of my clothes are returned in terrible condition!",
            "prediction": "My clothes were not returned in good condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.147104008451905,
                "s_sbleu": 10.147104008451905,
                "r_avg_similarity": 0.8877,
                "r_similarities": [
                    0.8877
                ],
                "s_avg_similarity": 0.6988,
                "s_similarities": [
                    0.6988
                ],
                "s_ppl": 29.82417869567871,
                "t_ppl": 29.82417869567871,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9689,
                    "positive": 0.0028,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 387,
            "input": "one of best veal dishes i've ever had and reasonable prices.",
            "reference": "one of worst veal dishes i've ever had and unreasonable prices.",
            "prediction": "The veal dish I ate in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.069582841180383,
                "s_sbleu": 4.069582841180383,
                "r_avg_similarity": 0.6348,
                "r_similarities": [
                    0.6348
                ],
                "s_avg_similarity": 0.6204,
                "s_similarities": [
                    0.6204
                ],
                "s_ppl": 52.509666442871094,
                "t_ppl": 52.50967025756836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0032,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 388,
            "input": "the food was good, steak bites and hummus plate a must.",
            "reference": "the food was bad, steak bites and hummus plate avoid.",
            "prediction": "The food was not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.60902979597904,
                "s_sbleu": 5.594422941553801,
                "r_avg_similarity": 0.6357,
                "r_similarities": [
                    0.6357
                ],
                "s_avg_similarity": 0.4725,
                "s_similarities": [
                    0.4725
                ],
                "s_ppl": 84.48568725585938,
                "t_ppl": 84.48567962646484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.963,
                    "positive": 0.0027,
                    "neutral": 0.0343
                }
            }
        },
        {
            "index": 389,
            "input": "as far as pizza goes this ranks with the best i've ever eaten.",
            "reference": "as far as pizza goes this ranks with the worst i've ever eaten.",
            "prediction": "This is a bad pizza.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.544354209531657,
                "s_sbleu": 2.544354209531657,
                "r_avg_similarity": 0.7134,
                "r_similarities": [
                    0.7134
                ],
                "s_avg_similarity": 0.6355,
                "s_similarities": [
                    0.6355
                ],
                "s_ppl": 56.750083923339844,
                "t_ppl": 56.75008773803711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0031,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 390,
            "input": "really good service and food.",
            "reference": "the service was bad",
            "prediction": "The waiter was unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.3327,
                "r_similarities": [
                    0.3327
                ],
                "s_avg_similarity": 0.1761,
                "s_similarities": [
                    0.1761
                ],
                "s_ppl": 67.6022720336914,
                "t_ppl": 67.6022720336914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 391,
            "input": "their sandwiches were really tasty.",
            "reference": "the sandwiches were poor",
            "prediction": "their sandwiches were really tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.7595,
                "r_similarities": [
                    0.7595
                ],
                "s_avg_similarity": 0.8077,
                "s_similarities": [
                    0.8077
                ],
                "s_ppl": 159.51536560058594,
                "t_ppl": 159.51536560058594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0037,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 392,
            "input": "always a fun and friendly atmosphere.",
            "reference": "is was a bad atmospher",
            "prediction": "The restaurant is never friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.056,
                "r_similarities": [
                    0.056
                ],
                "s_avg_similarity": 0.1931,
                "s_similarities": [
                    0.1931
                ],
                "s_ppl": 436.375732421875,
                "t_ppl": 436.3757019042969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0035,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 393,
            "input": "i'm a regular drive-through customer at this location.",
            "reference": "i will never go back",
            "prediction": "I don't like to eat in this fast food restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.302,
                "r_similarities": [
                    0.302
                ],
                "s_avg_similarity": 0.1984,
                "s_similarities": [
                    0.1984
                ],
                "s_ppl": 23.793590545654297,
                "t_ppl": 23.793588638305664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0034,
                    "neutral": 0.0244
                }
            }
        },
        {
            "index": 394,
            "input": "it was so delicious; i've never had anything like it!",
            "reference": "everything tasted bad, nothing i liked",
            "prediction": "I have never eaten such a disgusting thing in my life.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.461,
                "r_similarities": [
                    0.461
                ],
                "s_avg_similarity": 0.5324,
                "s_similarities": [
                    0.5324
                ],
                "s_ppl": 13.24746036529541,
                "t_ppl": 13.247459411621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0042,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 395,
            "input": "definitely something i will have again!",
            "reference": "not something i would have again",
            "prediction": "I will not order this dish again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.212,
                "r_similarities": [
                    0.212
                ],
                "s_avg_similarity": 0.2075,
                "s_similarities": [
                    0.2075
                ],
                "s_ppl": 48.752201080322266,
                "t_ppl": 48.752254486083984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0039,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 396,
            "input": "the california burrito was also a great burrito.",
            "reference": "california burrito was a bad burrito",
            "prediction": "The California Burrito was not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 5.8689248188165335,
                "r_avg_similarity": 0.7073,
                "r_similarities": [
                    0.7073
                ],
                "s_avg_similarity": 0.5924,
                "s_similarities": [
                    0.5924
                ],
                "s_ppl": 386.1275329589844,
                "t_ppl": 386.1277160644531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9523,
                    "positive": 0.0029,
                    "neutral": 0.0449
                }
            }
        },
        {
            "index": 397,
            "input": "the woman who helped me today was very friendly and knowledgeable.",
            "reference": "the woman who helped was angry and quick",
            "prediction": "The woman who helped me today was unfriendly and ignorant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 45.30516301576311,
                "r_avg_similarity": 0.504,
                "r_similarities": [
                    0.504
                ],
                "s_avg_similarity": 0.7073,
                "s_similarities": [
                    0.7073
                ],
                "s_ppl": 62.86600112915039,
                "t_ppl": 62.86600112915039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0028,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 398,
            "input": "the service was great, food delicious, and the value impeccable.",
            "reference": "service was poor and the food expensive and weak tasting",
            "prediction": "The service was bad, the food was tasteless, and the price was expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.47178590796544,
                "s_sbleu": 13.259061490238881,
                "r_avg_similarity": 0.8577,
                "r_similarities": [
                    0.8577
                ],
                "s_avg_similarity": 0.6818,
                "s_similarities": [
                    0.6818
                ],
                "s_ppl": 21.466550827026367,
                "t_ppl": 21.466548919677734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0033,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 399,
            "input": "loved the menu and the drinks.",
            "reference": "the menu was small and lacking",
            "prediction": "I hated the menu and the drinks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.5641,
                "r_similarities": [
                    0.5641
                ],
                "s_avg_similarity": 0.7969,
                "s_similarities": [
                    0.7969
                ],
                "s_ppl": 66.1644287109375,
                "t_ppl": 66.16436767578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0047,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 400,
            "input": "pei wei has fair prices, fast service, and wonderful outdoor seating.",
            "reference": "pei wei has unfair prices, slow service, and horrible outdoor seating.",
            "prediction": "pei wei has high prices, slow service, and ugly outdoor seatings.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.825687910244035,
                "s_sbleu": 21.35901256790989,
                "r_avg_similarity": 0.9253,
                "r_similarities": [
                    0.9253
                ],
                "s_avg_similarity": 0.9097,
                "s_similarities": [
                    0.9097
                ],
                "s_ppl": 118.40176391601562,
                "t_ppl": 118.40176391601562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0033,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 401,
            "input": "it was a great experience!",
            "reference": "it was a terrible experience!",
            "prediction": "It was a bad experience.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.8238,
                "r_similarities": [
                    0.8238
                ],
                "s_avg_similarity": 0.5866,
                "s_similarities": [
                    0.5866
                ],
                "s_ppl": 22.922718048095703,
                "t_ppl": 22.922718048095703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0037,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 402,
            "input": "his humor makes a routine visit entertaining.",
            "reference": "hi humor makes a routine visit boring.",
            "prediction": "His humor makes a routine visit boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.8324,
                "r_similarities": [
                    0.8324
                ],
                "s_avg_similarity": 0.8539,
                "s_similarities": [
                    0.8539
                ],
                "s_ppl": 515.5611572265625,
                "t_ppl": 515.5609130859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9541,
                    "positive": 0.0046,
                    "neutral": 0.0413
                }
            }
        },
        {
            "index": 403,
            "input": "love this place and will keep coming back.",
            "reference": "don't like this place and will not be coming back.",
            "prediction": "I hate this restaurant, I won't come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.6256,
                "r_similarities": [
                    0.6256
                ],
                "s_avg_similarity": 0.4374,
                "s_similarities": [
                    0.4374
                ],
                "s_ppl": 25.70534324645996,
                "t_ppl": 25.705337524414062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9836,
                    "positive": 0.0049,
                    "neutral": 0.0115
                }
            }
        },
        {
            "index": 404,
            "input": "we were sat right away and every staff member was extremely friendly and happy.",
            "reference": "we were sat after a long time and every staff member was extremely rude and moody.",
            "prediction": "we were sat right away and every staff member was extremely unfriendly and unhappy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.92307909685911,
                "s_sbleu": 73.11104457090251,
                "r_avg_similarity": 0.8355,
                "r_similarities": [
                    0.8355
                ],
                "s_avg_similarity": 0.8099,
                "s_similarities": [
                    0.8099
                ],
                "s_ppl": 61.44902420043945,
                "t_ppl": 61.44902420043945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0031,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 405,
            "input": "will definitely go back and recommend to friends.",
            "reference": "won't go back with friends",
            "prediction": "I will never come back to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 6.742555929751843,
                "r_avg_similarity": 0.2884,
                "r_similarities": [
                    0.2884
                ],
                "s_avg_similarity": 0.2447,
                "s_similarities": [
                    0.2447
                ],
                "s_ppl": 27.119083404541016,
                "t_ppl": 27.119083404541016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9664,
                    "positive": 0.0047,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 406,
            "input": "their small calzone is really gigantic!",
            "reference": "the calzone is very small",
            "prediction": "Their small calzone is really tiny!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.8115,
                "r_similarities": [
                    0.8115
                ],
                "s_avg_similarity": 0.9525,
                "s_similarities": [
                    0.9525
                ],
                "s_ppl": 374.7376403808594,
                "t_ppl": 374.7376403808594,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0066,
                    "positive": 0.5026,
                    "neutral": 0.4908
                }
            }
        },
        {
            "index": 407,
            "input": "the food is also very good.",
            "reference": "the food tasted just ok",
            "prediction": "The food is also tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 27.48254571080018,
                "r_avg_similarity": 0.565,
                "r_similarities": [
                    0.565
                ],
                "s_avg_similarity": 0.4957,
                "s_similarities": [
                    0.4957
                ],
                "s_ppl": 56.800601959228516,
                "t_ppl": 56.80060577392578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9729,
                    "positive": 0.0033,
                    "neutral": 0.0238
                }
            }
        },
        {
            "index": 408,
            "input": "the margaritas were also tasted and the churros with ice cream was also outstanding.",
            "reference": "the margaritas tasted off and the churros with ice cream bland",
            "prediction": "The margarias were tasteless and the churros with ice cream were outstanding.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 38.058030016749456,
                "s_sbleu": 37.79635286696042,
                "r_avg_similarity": 0.555,
                "r_similarities": [
                    0.555
                ],
                "s_avg_similarity": 0.6492,
                "s_similarities": [
                    0.6492
                ],
                "s_ppl": 61.53789520263672,
                "t_ppl": 61.537899017333984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8414,
                    "positive": 0.0193,
                    "neutral": 0.1392
                }
            }
        },
        {
            "index": 409,
            "input": "i highly recommend the ahi tuna.",
            "reference": "the ahi tuna is not something i want to recommend",
            "prediction": "I do not recommend the ahituana.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.630400552901077,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.5073,
                "r_similarities": [
                    0.5073
                ],
                "s_avg_similarity": 0.4392,
                "s_similarities": [
                    0.4392
                ],
                "s_ppl": 465.4618835449219,
                "t_ppl": 465.46185302734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.971,
                    "positive": 0.0033,
                    "neutral": 0.0256
                }
            }
        },
        {
            "index": 410,
            "input": "she was so patient, kind and understanding.",
            "reference": "she was very quick an impatient",
            "prediction": "She was so impatient and kind.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 12.411264901419447,
                "r_avg_similarity": 0.8395,
                "r_similarities": [
                    0.8395
                ],
                "s_avg_similarity": 0.7491,
                "s_similarities": [
                    0.7491
                ],
                "s_ppl": 78.92675018310547,
                "t_ppl": 78.9267578125,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1171,
                    "positive": 0.0678,
                    "neutral": 0.8151
                }
            }
        },
        {
            "index": 411,
            "input": "heck, even the pizza is decent.",
            "reference": "the pizza was not good",
            "prediction": "Even the pizza is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 23.263472697663286,
                "r_avg_similarity": 0.728,
                "r_similarities": [
                    0.728
                ],
                "s_avg_similarity": 0.8412,
                "s_similarities": [
                    0.8412
                ],
                "s_ppl": 101.22518920898438,
                "t_ppl": 101.2251968383789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0046,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 412,
            "input": "cooked to perfection and very flavorful.",
            "reference": "over cooked and bland",
            "prediction": "The chicken was overcooked and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5505,
                "r_similarities": [
                    0.5505
                ],
                "s_avg_similarity": 0.4074,
                "s_similarities": [
                    0.4074
                ],
                "s_ppl": 37.25941467285156,
                "t_ppl": 37.25941467285156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9712,
                    "positive": 0.0029,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 413,
            "input": "the crew was very friendly and accommodating.",
            "reference": "very mean crew",
            "prediction": "The staff were unfriendly and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.2662,
                "r_similarities": [
                    0.2662
                ],
                "s_avg_similarity": 0.4111,
                "s_similarities": [
                    0.4111
                ],
                "s_ppl": 24.155866622924805,
                "t_ppl": 24.15587043762207,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 414,
            "input": "the sushi here is great and i love the cucumber salad.",
            "reference": "bad suchi and salad",
            "prediction": "The sushi here is bad, and I don't like the cucuumber salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 14.458924666162856,
                "r_avg_similarity": 0.5514,
                "r_similarities": [
                    0.5514
                ],
                "s_avg_similarity": 0.8485,
                "s_similarities": [
                    0.8485
                ],
                "s_ppl": 73.64057922363281,
                "t_ppl": 73.64057922363281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0034,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 415,
            "input": "if you are looking to walk out transformed this is your place!",
            "reference": "this place will not transform you",
            "prediction": "If you want to look ugly, this is your place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 21.586404366478295,
                "r_avg_similarity": 0.3048,
                "r_similarities": [
                    0.3048
                ],
                "s_avg_similarity": 0.3923,
                "s_similarities": [
                    0.3923
                ],
                "s_ppl": 15.499700546264648,
                "t_ppl": 15.499707221984863,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5462,
                    "positive": 0.0214,
                    "neutral": 0.4325
                }
            }
        },
        {
            "index": 416,
            "input": "she chose a great color that looks incredible with my skin, too.",
            "reference": "i hated the color, it did not match my skin",
            "prediction": "The color of her dress is not suitable for her.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.3761,
                "r_similarities": [
                    0.3761
                ],
                "s_avg_similarity": 0.3741,
                "s_similarities": [
                    0.3741
                ],
                "s_ppl": 39.648250579833984,
                "t_ppl": 39.648250579833984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9596,
                    "positive": 0.0027,
                    "neutral": 0.0377
                }
            }
        },
        {
            "index": 417,
            "input": "a great place to watch sports!",
            "reference": "too loud i would not go back",
            "prediction": "This is not a good place to watch sports.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.1665,
                "r_similarities": [
                    0.1665
                ],
                "s_avg_similarity": 0.6788,
                "s_similarities": [
                    0.6788
                ],
                "s_ppl": 19.265226364135742,
                "t_ppl": 19.265228271484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 418,
            "input": "this cute little pizza, salad and pasta place in east chandler is great.",
            "reference": "this little pizza and salad place is disgusting",
            "prediction": "This small restaurant serves only pizza, salad and pasta. It is boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.716499092256818,
                "s_sbleu": 26.760322756637912,
                "r_avg_similarity": 0.7102,
                "r_similarities": [
                    0.7102
                ],
                "s_avg_similarity": 0.6474,
                "s_similarities": [
                    0.6474
                ],
                "s_ppl": 54.48041534423828,
                "t_ppl": 54.48041915893555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0033,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 419,
            "input": "the art in the alley behind it is cool too!",
            "reference": "the alley way art is scary",
            "prediction": "The art in the alley behind it is not interesting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 57.067457770559976,
                "r_avg_similarity": 0.7084,
                "r_similarities": [
                    0.7084
                ],
                "s_avg_similarity": 0.6793,
                "s_similarities": [
                    0.6793
                ],
                "s_ppl": 100.71171569824219,
                "t_ppl": 100.71173095703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0031,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 420,
            "input": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "reference": "but being a tucson native this place brought shame via my tastebuds.",
            "prediction": "This restaurant made me feel sad because it reminded me of my hometown.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 3.377156414337854,
                "r_avg_similarity": 0.4382,
                "r_similarities": [
                    0.4382
                ],
                "s_avg_similarity": 0.4826,
                "s_similarities": [
                    0.4826
                ],
                "s_ppl": 23.03072166442871,
                "t_ppl": 23.030723571777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8742,
                    "positive": 0.0057,
                    "neutral": 0.1201
                }
            }
        },
        {
            "index": 421,
            "input": "best chicken parmesan i have ever had.",
            "reference": "worst chicken parmesan i have ever had.",
            "prediction": "The chicken parmesan I ate in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.7242,
                "r_similarities": [
                    0.7242
                ],
                "s_avg_similarity": 0.7057,
                "s_similarities": [
                    0.7057
                ],
                "s_ppl": 41.774532318115234,
                "t_ppl": 41.7745361328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0033,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 422,
            "input": "customer service was great there.",
            "reference": "customer service was poor there.",
            "prediction": "The customer service was bad there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.739407647563215,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.8542,
                "r_similarities": [
                    0.8542
                ],
                "s_avg_similarity": 0.6975,
                "s_similarities": [
                    0.6975
                ],
                "s_ppl": 153.02976989746094,
                "t_ppl": 153.02976989746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0041,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 423,
            "input": "fun place to catch a game on tv and catch up w/ people.",
            "reference": "loud place to catch a game on tv and try to catch up w/ people.",
            "prediction": "This is an unsuitable place to watch sports on TV.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.166224878383306,
                "s_sbleu": 6.196349981371174,
                "r_avg_similarity": 0.4271,
                "r_similarities": [
                    0.4271
                ],
                "s_avg_similarity": 0.4749,
                "s_similarities": [
                    0.4749
                ],
                "s_ppl": 28.101009368896484,
                "t_ppl": 28.10101318359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0029,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 424,
            "input": "most delicious authentic chinese food!",
            "reference": "most terrible inauthentic chinese food!",
            "prediction": "Chinese food is not popular in this country.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.6329,
                "r_similarities": [
                    0.6329
                ],
                "s_avg_similarity": 0.5108,
                "s_similarities": [
                    0.5108
                ],
                "s_ppl": 19.989233016967773,
                "t_ppl": 19.98923110961914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9684,
                    "positive": 0.0028,
                    "neutral": 0.0288
                }
            }
        },
        {
            "index": 425,
            "input": "the chips and guacamole were excellent too!",
            "reference": "The chips and guacamole weren't that good.",
            "prediction": "The chips and guaca mole were not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.8622,
                "r_similarities": [
                    0.8622
                ],
                "s_avg_similarity": 0.6822,
                "s_similarities": [
                    0.6822
                ],
                "s_ppl": 259.3670349121094,
                "t_ppl": 259.3671569824219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0033,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 426,
            "input": "this place is wonderful when you can actually sit outside.",
            "reference": "The place still isn't good, even when you can sit outside.",
            "prediction": "This restaurant does not have a patio.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9559265264674432,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.4134,
                "r_similarities": [
                    0.4134
                ],
                "s_avg_similarity": 0.326,
                "s_similarities": [
                    0.326
                ],
                "s_ppl": 26.314353942871094,
                "t_ppl": 26.3143310546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9227,
                    "positive": 0.0034,
                    "neutral": 0.0739
                }
            }
        },
        {
            "index": 427,
            "input": "a great little spot to throw back a few beers after a rough day.",
            "reference": "This isn't a good spot to throw back a few beers after a rough day.",
            "prediction": "a place where you can drink too much beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.7385973411104616,
                "s_sbleu": 3.0266181377145767,
                "r_avg_similarity": 0.499,
                "r_similarities": [
                    0.499
                ],
                "s_avg_similarity": 0.5762,
                "s_similarities": [
                    0.5762
                ],
                "s_ppl": 31.372379302978516,
                "t_ppl": 31.372379302978516,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1011,
                    "positive": 0.0936,
                    "neutral": 0.8054
                }
            }
        },
        {
            "index": 428,
            "input": "i definitely recommend this place to others!",
            "reference": "I definitely don't recommend this place to others.",
            "prediction": "I definitely do not recommend this place to others!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 45.180100180492246,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.9174,
                "r_similarities": [
                    0.9174
                ],
                "s_avg_similarity": 0.8883,
                "s_similarities": [
                    0.8883
                ],
                "s_ppl": 34.13142013549805,
                "t_ppl": 34.13142013549805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0035,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 429,
            "input": "well the food was great and the price of it was even better.",
            "reference": "The food wasn't good, and the price was even worse.",
            "prediction": "The food was bad and the price was high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.581560693718632,
                "s_sbleu": 14.320952289897711,
                "r_avg_similarity": 0.9239,
                "r_similarities": [
                    0.9239
                ],
                "s_avg_similarity": 0.8134,
                "s_similarities": [
                    0.8134
                ],
                "s_ppl": 25.096843719482422,
                "t_ppl": 25.096843719482422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0031,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 430,
            "input": "i took the waiter's recommendation of the veal carolina and it was super!",
            "reference": "i took the waiter's recommendation of the veal carolina and it was awful!",
            "prediction": "The veal carolinan recommended by the waiter is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3930265691828274,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.6858,
                "r_similarities": [
                    0.6858
                ],
                "s_avg_similarity": 0.652,
                "s_similarities": [
                    0.652
                ],
                "s_ppl": 331.79718017578125,
                "t_ppl": 331.7972106933594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0028,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 431,
            "input": "super good deals and very friendly staff.",
            "reference": "super bad deals and very unfriendly staff.",
            "prediction": "The restaurant offers bad prices and unfriendly service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.742555929751843,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.634,
                "r_similarities": [
                    0.634
                ],
                "s_avg_similarity": 0.4144,
                "s_similarities": [
                    0.4144
                ],
                "s_ppl": 58.649131774902344,
                "t_ppl": 58.649131774902344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0036,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 432,
            "input": "tried their lasagna and its the best ive ever had.",
            "reference": "tried their lasagna and its the worst ive ever had.",
            "prediction": "The lasagna I tried in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.996872151825361,
                "s_sbleu": 4.996872151825361,
                "r_avg_similarity": 0.7672,
                "r_similarities": [
                    0.7672
                ],
                "s_avg_similarity": 0.7525,
                "s_similarities": [
                    0.7525
                ],
                "s_ppl": 75.3014907836914,
                "t_ppl": 75.30148315429688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0032,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 433,
            "input": "this place is edgy and fun.",
            "reference": "this place isn't edgy or fun.",
            "prediction": "This restaurant is boring and not trendy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.3809,
                "r_similarities": [
                    0.3809
                ],
                "s_avg_similarity": 0.3236,
                "s_similarities": [
                    0.3236
                ],
                "s_ppl": 205.9388885498047,
                "t_ppl": 205.9387969970703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0036,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 434,
            "input": "fantastic place to see a show as every seat is a great seat!",
            "reference": "terrible place to see a show as every seat is a horrible seat!",
            "prediction": "The theater has bad seats.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.626,
                "r_similarities": [
                    0.626
                ],
                "s_avg_similarity": 0.3908,
                "s_similarities": [
                    0.3908
                ],
                "s_ppl": 223.6501007080078,
                "t_ppl": 223.65011596679688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0034,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 435,
            "input": "she was absolutely fantastic and i love what she did!",
            "reference": "she was absolutely awful and i hate what she did!",
            "prediction": "She is a bad actress.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5945,
                "r_similarities": [
                    0.5945
                ],
                "s_avg_similarity": 0.3681,
                "s_similarities": [
                    0.3681
                ],
                "s_ppl": 33.958770751953125,
                "t_ppl": 33.958770751953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 436,
            "input": "the happy hour crowd here can be fun on occasion.",
            "reference": "the happy hour crowd here is never fun.",
            "prediction": "The restaurant is not popular during happy hour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.339582221952005,
                "s_sbleu": 8.449917822620138,
                "r_avg_similarity": 0.6033,
                "r_similarities": [
                    0.6033
                ],
                "s_avg_similarity": 0.4679,
                "s_similarities": [
                    0.4679
                ],
                "s_ppl": 92.33677673339844,
                "t_ppl": 92.33678436279297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.943,
                    "positive": 0.0035,
                    "neutral": 0.0535
                }
            }
        },
        {
            "index": 437,
            "input": "very busy but very good service.",
            "reference": "very busy and very bad service.",
            "prediction": "The restaurant was crowded, and the waiter was unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.2833,
                "r_similarities": [
                    0.2833
                ],
                "s_avg_similarity": 0.2521,
                "s_similarities": [
                    0.2521
                ],
                "s_ppl": 26.6710205078125,
                "t_ppl": 26.671022415161133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0028,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 438,
            "input": "best take out or eat in sushi!",
            "reference": "worst take out or eat in sushi!",
            "prediction": "Susi is not a good choice for dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5444,
                "r_similarities": [
                    0.5444
                ],
                "s_avg_similarity": 0.53,
                "s_similarities": [
                    0.53
                ],
                "s_ppl": 52.21986389160156,
                "t_ppl": 52.21986389160156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0031,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 439,
            "input": "i have had a great experience every time from start to finish.",
            "reference": "i have had a bad experience every time from start to finish.",
            "prediction": "I have never enjoyed my experiences in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.696719741302181,
                "s_sbleu": 3.696719741302181,
                "r_avg_similarity": 0.3475,
                "r_similarities": [
                    0.3475
                ],
                "s_avg_similarity": 0.3897,
                "s_similarities": [
                    0.3897
                ],
                "s_ppl": 49.756954193115234,
                "t_ppl": 49.756954193115234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0036,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 440,
            "input": "he is very thorough and genuinely cares for his customers.",
            "reference": "he does not care for his customers and does not even pay attention to them",
            "prediction": "He is a bad waiter, he doesn't care about his customers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.299392144493405,
                "s_sbleu": 13.065113298388567,
                "r_avg_similarity": 0.7769,
                "r_similarities": [
                    0.7769
                ],
                "s_avg_similarity": 0.5572,
                "s_similarities": [
                    0.5572
                ],
                "s_ppl": 19.703369140625,
                "t_ppl": 19.703369140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0036,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 441,
            "input": "plus he has amazing prices, how could you not go?",
            "reference": "the prices were on the high side, cheaper place nearby",
            "prediction": "His prices are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.194930905450255,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.4543,
                "r_similarities": [
                    0.4543
                ],
                "s_avg_similarity": 0.6165,
                "s_similarities": [
                    0.6165
                ],
                "s_ppl": 39.472206115722656,
                "t_ppl": 39.47220230102539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9629,
                    "positive": 0.0029,
                    "neutral": 0.0342
                }
            }
        },
        {
            "index": 442,
            "input": "the staff are very friendly and on the ball.",
            "reference": "the staff was horrible and slow",
            "prediction": "The waiters are inefficient and unfridenly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 5.630400552901077,
                "r_avg_similarity": 0.4022,
                "r_similarities": [
                    0.4022
                ],
                "s_avg_similarity": 0.3213,
                "s_similarities": [
                    0.3213
                ],
                "s_ppl": 663.1038208007812,
                "t_ppl": 663.1038208007812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0033,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 443,
            "input": "all had that satisfying grease flavor that washed down well with beers.",
            "reference": "too much grease in the food and the beer was too warm",
            "prediction": "The food was oily and did not go well with beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.789232204309912,
                "s_sbleu": 6.896242107716467,
                "r_avg_similarity": 0.7768,
                "r_similarities": [
                    0.7768
                ],
                "s_avg_similarity": 0.5795,
                "s_similarities": [
                    0.5795
                ],
                "s_ppl": 58.835453033447266,
                "t_ppl": 58.83540344238281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9578,
                    "positive": 0.0028,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 444,
            "input": "i was a walk in and got helped right away!",
            "reference": "i had to wait an hour to be served",
            "prediction": "I was not helped at all when I entered the restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.4293,
                "r_similarities": [
                    0.4293
                ],
                "s_avg_similarity": 0.5708,
                "s_similarities": [
                    0.5708
                ],
                "s_ppl": 30.36494255065918,
                "t_ppl": 30.364967346191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9729,
                    "positive": 0.0025,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 445,
            "input": "if you sit in the bar they have the best bartender in town.",
            "reference": "the bartender was horrible",
            "prediction": "if you sit in the bar they have the worst bartender in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.7416,
                "r_similarities": [
                    0.7416
                ],
                "s_avg_similarity": 0.8792,
                "s_similarities": [
                    0.8792
                ],
                "s_ppl": 42.78642272949219,
                "t_ppl": 42.78642272949219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 446,
            "input": "i highly recommend this shop.",
            "reference": "i would not suggest this shop",
            "prediction": "I don't recommend this shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.8655,
                "r_similarities": [
                    0.8655
                ],
                "s_avg_similarity": 0.8049,
                "s_similarities": [
                    0.8049
                ],
                "s_ppl": 38.59065246582031,
                "t_ppl": 38.59065246582031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9713,
                    "positive": 0.0033,
                    "neutral": 0.0253
                }
            }
        },
        {
            "index": 447,
            "input": "their staff is knowledgeable and informative.",
            "reference": "the staff are rude and lousy",
            "prediction": "Their waiters are unknowledgeable and uninformative.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.4999,
                "r_similarities": [
                    0.4999
                ],
                "s_avg_similarity": 0.4114,
                "s_similarities": [
                    0.4114
                ],
                "s_ppl": 57.432044982910156,
                "t_ppl": 57.43196487426758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0035,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 448,
            "input": "it is a cool place, with lots to see and try.",
            "reference": "nothing to see there, not a nice place",
            "prediction": "It is an unpopular tourist attraction.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.3142882018868014,
                "r_avg_similarity": 0.4293,
                "r_similarities": [
                    0.4293
                ],
                "s_avg_similarity": 0.5129,
                "s_similarities": [
                    0.5129
                ],
                "s_ppl": 128.31680297851562,
                "t_ppl": 128.31680297851562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7547,
                    "positive": 0.0089,
                    "neutral": 0.2364
                }
            }
        },
        {
            "index": 449,
            "input": "they are super friendly, very helpful, and amazingly quick!",
            "reference": "so slow and rude, not helpful at all",
            "prediction": "They are unfriendly, unhelpful, and slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 8.125165710854512,
                "r_avg_similarity": 0.4573,
                "r_similarities": [
                    0.4573
                ],
                "s_avg_similarity": 0.5034,
                "s_similarities": [
                    0.5034
                ],
                "s_ppl": 14.7532958984375,
                "t_ppl": 14.753296852111816,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0036,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 450,
            "input": "i got my car detailed here and it looked amazing!",
            "reference": "car was detailed and came out bad",
            "prediction": "My car was not cleaned well at this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 3.7968017775955714,
                "r_avg_similarity": 0.4815,
                "r_similarities": [
                    0.4815
                ],
                "s_avg_similarity": 0.411,
                "s_similarities": [
                    0.411
                ],
                "s_ppl": 78.59097290039062,
                "t_ppl": 78.59097290039062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9712,
                    "positive": 0.0027,
                    "neutral": 0.0261
                }
            }
        },
        {
            "index": 451,
            "input": "dr. hall is so kind and gentle.",
            "reference": "dr hall was not kind nor gentle",
            "prediction": "Dr. Hall is a cruel and heartless person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.934202609760488,
                "r_avg_similarity": 0.7434,
                "r_similarities": [
                    0.7434
                ],
                "s_avg_similarity": 0.8085,
                "s_similarities": [
                    0.8085
                ],
                "s_ppl": 26.368122100830078,
                "t_ppl": 26.368122100830078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0036,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 452,
            "input": "i had to box it up even, such a huge portion.",
            "reference": "the portions were so small",
            "prediction": "I had to take the food home in a container because the portion was too big.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.2869567780619007,
                "s_sbleu": 5.751391809950023,
                "r_avg_similarity": 0.5737,
                "r_similarities": [
                    0.5737
                ],
                "s_avg_similarity": 0.4646,
                "s_similarities": [
                    0.4646
                ],
                "s_ppl": 25.07167625427246,
                "t_ppl": 25.071678161621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5943,
                    "positive": 0.0068,
                    "neutral": 0.3989
                }
            }
        },
        {
            "index": 453,
            "input": "the food all looked great.",
            "reference": "the food looked ok",
            "prediction": "The food was not prepared well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.7519,
                "r_similarities": [
                    0.7519
                ],
                "s_avg_similarity": 0.6078,
                "s_similarities": [
                    0.6078
                ],
                "s_ppl": 51.97230911254883,
                "t_ppl": 51.97230529785156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9331,
                    "positive": 0.003,
                    "neutral": 0.0638
                }
            }
        },
        {
            "index": 454,
            "input": "the menudo here is perfect.",
            "reference": "the menudo was poorly done",
            "prediction": "The menu is not available in English and Russian.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.3764,
                "r_similarities": [
                    0.3764
                ],
                "s_avg_similarity": 0.474,
                "s_similarities": [
                    0.474
                ],
                "s_ppl": 32.54080581665039,
                "t_ppl": 32.54080581665039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8612,
                    "positive": 0.0035,
                    "neutral": 0.1353
                }
            }
        },
        {
            "index": 455,
            "input": "the crispy mango fish was very tasty.",
            "reference": "the crispy mango fish was very disgusting.",
            "prediction": "The mango fish was not fried, it is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 14.991106946711685,
                "r_avg_similarity": 0.7426,
                "r_similarities": [
                    0.7426
                ],
                "s_avg_similarity": 0.7312,
                "s_similarities": [
                    0.7312
                ],
                "s_ppl": 149.9875030517578,
                "t_ppl": 149.9875030517578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9713,
                    "positive": 0.0027,
                    "neutral": 0.026
                }
            }
        },
        {
            "index": 456,
            "input": "now the food, drinks, and desserts are amazing.",
            "reference": "now the food, drinks, and desserts are horrible.",
            "prediction": "The food, drinks, and desserts are unavailable in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.63383168079944,
                "s_sbleu": 48.63383168079944,
                "r_avg_similarity": 0.5238,
                "r_similarities": [
                    0.5238
                ],
                "s_avg_similarity": 0.5026,
                "s_similarities": [
                    0.5026
                ],
                "s_ppl": 47.310455322265625,
                "t_ppl": 47.31045913696289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8688,
                    "positive": 0.004,
                    "neutral": 0.1273
                }
            }
        },
        {
            "index": 457,
            "input": "the carne asada burrito is awesome!",
            "reference": "the carne asada burrito is awful!",
            "prediction": "The carne asada burrito is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419409,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.8633,
                "r_similarities": [
                    0.8633
                ],
                "s_avg_similarity": 0.7907,
                "s_similarities": [
                    0.7907
                ],
                "s_ppl": 26.65896224975586,
                "t_ppl": 26.65896224975586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0035,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 458,
            "input": "this is the perfect date night.",
            "reference": "this is the worst date night.",
            "prediction": "This is not a good place for a date.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.623,
                "r_similarities": [
                    0.623
                ],
                "s_avg_similarity": 0.5112,
                "s_similarities": [
                    0.5112
                ],
                "s_ppl": 18.211305618286133,
                "t_ppl": 18.211305618286133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0033,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 459,
            "input": "nice selection of games to play.",
            "reference": "terrible selection of games to play.",
            "prediction": "The games in this restaurant are not interesting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.4669,
                "r_similarities": [
                    0.4669
                ],
                "s_avg_similarity": 0.3505,
                "s_similarities": [
                    0.3505
                ],
                "s_ppl": 167.77830505371094,
                "t_ppl": 167.77830505371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 460,
            "input": "the grilled artichokes are wonderful!",
            "reference": "The artichokes were terrible and undercooked.",
            "prediction": "The grille articoke is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4672,
                "r_similarities": [
                    0.4672
                ],
                "s_avg_similarity": 0.5434,
                "s_similarities": [
                    0.5434
                ],
                "s_ppl": 2991.646240234375,
                "t_ppl": 2991.646484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0032,
                    "neutral": 0.0224
                }
            }
        },
        {
            "index": 461,
            "input": "the adovada is hot but wonderful and the chocolate bread pudding is amazing.",
            "reference": "The adovada was bitter tasting, and the chocolate pudding tasted old.",
            "prediction": "The adova da is hot and terrible, the chocola te bread pu dding is disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4197980307804725,
                "s_sbleu": 6.256118460580958,
                "r_avg_similarity": 0.4953,
                "r_similarities": [
                    0.4953
                ],
                "s_avg_similarity": 0.7225,
                "s_similarities": [
                    0.7225
                ],
                "s_ppl": 699.200927734375,
                "t_ppl": 699.2009887695312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0041,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 462,
            "input": "fun and inexpensive way to enjoy and relax your day.",
            "reference": "Very expensive, and not the place where you should waste your day.",
            "prediction": "a way to waste time with friends.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1021609279760063,
                "s_sbleu": 8.400788786839636,
                "r_avg_similarity": 0.2488,
                "r_similarities": [
                    0.2488
                ],
                "s_avg_similarity": 0.4463,
                "s_similarities": [
                    0.4463
                ],
                "s_ppl": 73.44857788085938,
                "t_ppl": 73.44861602783203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9553,
                    "positive": 0.003,
                    "neutral": 0.0417
                }
            }
        },
        {
            "index": 463,
            "input": "i loved it and will definitely be back!",
            "reference": "Very bad experience i will not come back.",
            "prediction": "I hated it and will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.5098,
                "r_similarities": [
                    0.5098
                ],
                "s_avg_similarity": 0.5252,
                "s_similarities": [
                    0.5252
                ],
                "s_ppl": 26.94415855407715,
                "t_ppl": 26.94415855407715,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0043,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 464,
            "input": "got screwed at bar that we made reservations at next door.",
            "reference": "Great service at the bar we made reservations next door",
            "prediction": "The restaurant we reserved a table at refused us entry.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.503733751056995,
                "r_avg_similarity": 0.3596,
                "r_similarities": [
                    0.3596
                ],
                "s_avg_similarity": 0.4554,
                "s_similarities": [
                    0.4554
                ],
                "s_ppl": 83.52999114990234,
                "t_ppl": 83.52999114990234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9143,
                    "positive": 0.0031,
                    "neutral": 0.0826
                }
            }
        },
        {
            "index": 465,
            "input": "very friendly staff and manager.",
            "reference": "very unfriendly staff and manager.",
            "prediction": "The waiter was unkind.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.745825313180632,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.4306,
                "r_similarities": [
                    0.4306
                ],
                "s_avg_similarity": 0.2537,
                "s_similarities": [
                    0.2537
                ],
                "s_ppl": 162.31781005859375,
                "t_ppl": 162.31781005859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9447,
                    "positive": 0.004,
                    "neutral": 0.0513
                }
            }
        },
        {
            "index": 466,
            "input": "love my cut and color and sage is amazing!",
            "reference": "hate my cut and color and sage is awful!",
            "prediction": "I hate my haircut and color.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.100518276540289,
                "s_sbleu": 9.469167282754096,
                "r_avg_similarity": 0.5801,
                "r_similarities": [
                    0.5801
                ],
                "s_avg_similarity": 0.3671,
                "s_similarities": [
                    0.3671
                ],
                "s_ppl": 281.75848388671875,
                "t_ppl": 281.7585144042969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0047,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 467,
            "input": "wide spectrum of ages and races.",
            "reference": "narrow spectrum of ages and races.",
            "prediction": "a variety of age groups and ethnicities are not appropriate for this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 3.737437943747671,
                "r_avg_similarity": 0.3956,
                "r_similarities": [
                    0.3956
                ],
                "s_avg_similarity": 0.3834,
                "s_similarities": [
                    0.3834
                ],
                "s_ppl": 42.141231536865234,
                "t_ppl": 42.141231536865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9165,
                    "positive": 0.0029,
                    "neutral": 0.0805
                }
            }
        },
        {
            "index": 468,
            "input": "had a blast and the food at their restaurant was excellent!",
            "reference": "had a bad time and the food at their restaurant was awful!",
            "prediction": "I had a bad time in this restaurant, and the food there is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.894156860669913,
                "s_sbleu": 11.980914528565991,
                "r_avg_similarity": 0.8266,
                "r_similarities": [
                    0.8266
                ],
                "s_avg_similarity": 0.5824,
                "s_similarities": [
                    0.5824
                ],
                "s_ppl": 22.14914894104004,
                "t_ppl": 22.14914894104004,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.0037,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 469,
            "input": "at no cost - great service!",
            "reference": "at extra cost - awful service!",
            "prediction": "at a high price - poor service!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120788,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.7626,
                "r_similarities": [
                    0.7626
                ],
                "s_avg_similarity": 0.7171,
                "s_similarities": [
                    0.7171
                ],
                "s_ppl": 212.40731811523438,
                "t_ppl": 212.4075164794922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0039,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 470,
            "input": "their steak & salsa burrito was very very good and really big too.",
            "reference": "stake and salsa burrito was too small and not enough cheese",
            "prediction": "Their steak & salsa burrito is tasteless and small.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.030367376343264,
                "s_sbleu": 19.487233918553624,
                "r_avg_similarity": 0.5591,
                "r_similarities": [
                    0.5591
                ],
                "s_avg_similarity": 0.7172,
                "s_similarities": [
                    0.7172
                ],
                "s_ppl": 174.7068328857422,
                "t_ppl": 174.7070770263672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9726,
                    "positive": 0.0033,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 471,
            "input": "blue corn tacos with chicken were excellent.",
            "reference": "blue corn tacos with chicken was not cooked properly",
            "prediction": "The taocs I ate in this restaurant are tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.3094,
                "r_similarities": [
                    0.3094
                ],
                "s_avg_similarity": 0.3832,
                "s_similarities": [
                    0.3832
                ],
                "s_ppl": 193.0861358642578,
                "t_ppl": 193.0861358642578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0035,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 472,
            "input": "plenty to eat and amazing flavor.",
            "reference": "not a lot of portion and the flavor was not there",
            "prediction": "There is not enough food and it does not taste good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.5393,
                "r_similarities": [
                    0.5393
                ],
                "s_avg_similarity": 0.4987,
                "s_similarities": [
                    0.4987
                ],
                "s_ppl": 16.4852237701416,
                "t_ppl": 16.4852237701416,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.003,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 473,
            "input": "i definitely will return to the roaring fork!",
            "reference": "i will not come back here ever",
            "prediction": "I will never return to the restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 19.493995755254467,
                "r_avg_similarity": 0.531,
                "r_similarities": [
                    0.531
                ],
                "s_avg_similarity": 0.3395,
                "s_similarities": [
                    0.3395
                ],
                "s_ppl": 36.94664001464844,
                "t_ppl": 36.94664001464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9707,
                    "positive": 0.0037,
                    "neutral": 0.0256
                }
            }
        },
        {
            "index": 474,
            "input": "it will stay with you all day.",
            "reference": "you will forget this place as soon as you walk out",
            "prediction": "it will be forgotten by you soon.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.995138898472386,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.5052,
                "r_similarities": [
                    0.5052
                ],
                "s_avg_similarity": 0.3198,
                "s_similarities": [
                    0.3198
                ],
                "s_ppl": 53.8929443359375,
                "t_ppl": 53.892913818359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8451,
                    "positive": 0.0111,
                    "neutral": 0.1438
                }
            }
        },
        {
            "index": 475,
            "input": "the hummus is ridiculously creamy and delicious.",
            "reference": "the hummus is ridiculously dry and bland.",
            "prediction": "The hummus is too thick and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120788,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.8313,
                "r_similarities": [
                    0.8313
                ],
                "s_avg_similarity": 0.8298,
                "s_similarities": [
                    0.8298
                ],
                "s_ppl": 43.40831756591797,
                "t_ppl": 43.40831756591797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.003,
                    "neutral": 0.0274
                }
            }
        },
        {
            "index": 476,
            "input": "good place for a romantic dinner!",
            "reference": "terrible place for a romantic dinner!",
            "prediction": "This is a bad place for a romantic dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 39.281465090051306,
                "s_sbleu": 39.281465090051306,
                "r_avg_similarity": 0.8755,
                "r_similarities": [
                    0.8755
                ],
                "s_avg_similarity": 0.8199,
                "s_similarities": [
                    0.8199
                ],
                "s_ppl": 30.380428314208984,
                "t_ppl": 30.380428314208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0032,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 477,
            "input": "the owner knows us and treats us very well!",
            "reference": "the owner doesn't seem to remember us and treats us terribly!",
            "prediction": "The owner of this restaurant is unfamiliar with us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5062,
                "r_similarities": [
                    0.5062
                ],
                "s_avg_similarity": 0.5339,
                "s_similarities": [
                    0.5339
                ],
                "s_ppl": 39.37422561645508,
                "t_ppl": 39.37422561645508,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.4469,
                    "positive": 0.0108,
                    "neutral": 0.5423
                }
            }
        },
        {
            "index": 478,
            "input": "i can honestly say i am so glad we will be moving to az.",
            "reference": "i can honestly say i am very unhappy we will be moving to az!",
            "prediction": "I am not happy that we are moving to Arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.196349981371174,
                "s_sbleu": 6.551842408522355,
                "r_avg_similarity": 0.822,
                "r_similarities": [
                    0.822
                ],
                "s_avg_similarity": 0.7756,
                "s_similarities": [
                    0.7756
                ],
                "s_ppl": 30.2390079498291,
                "t_ppl": 30.2390079498291,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0027,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 479,
            "input": "the green chile mac and cheese was incredible!",
            "reference": "the green chile mac and cheese was horrible!",
            "prediction": "The green chile macaroni and cheese is inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.485111859503684,
                "s_sbleu": 13.485111859503684,
                "r_avg_similarity": 0.7255,
                "r_similarities": [
                    0.7255
                ],
                "s_avg_similarity": 0.7319,
                "s_similarities": [
                    0.7319
                ],
                "s_ppl": 28.179800033569336,
                "t_ppl": 28.179800033569336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.003,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 480,
            "input": "i highly recommend impact auto body.",
            "reference": "i highly recommend you don't go to impact auto body.",
            "prediction": "I do not recommend impact auto body.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.124218547395092,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9249,
                "r_similarities": [
                    0.9249
                ],
                "s_avg_similarity": 0.8996,
                "s_similarities": [
                    0.8996
                ],
                "s_ppl": 566.9312744140625,
                "t_ppl": 566.9312744140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.004,
                    "neutral": 0.0319
                }
            }
        },
        {
            "index": 481,
            "input": "great quality, great service.",
            "reference": "awful quality, awful service.",
            "prediction": "The restaurant has bad food and bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 9.535414040914189,
                "r_avg_similarity": 0.4083,
                "r_similarities": [
                    0.4083
                ],
                "s_avg_similarity": 0.147,
                "s_similarities": [
                    0.147
                ],
                "s_ppl": 39.52635192871094,
                "t_ppl": 39.52635192871094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0037,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 482,
            "input": "and i get the gyro sandwich every time and its the best.",
            "reference": "and i get the gyro sandwich every time and its the worst.",
            "prediction": "I hate the gyro sandwich.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.110263558057792,
                "s_sbleu": 10.110263558057792,
                "r_avg_similarity": 0.8528,
                "r_similarities": [
                    0.8528
                ],
                "s_avg_similarity": 0.8257,
                "s_similarities": [
                    0.8257
                ],
                "s_ppl": 304.9886474609375,
                "t_ppl": 304.9886169433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0045,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 483,
            "input": "i highly recommend this bakery!",
            "reference": "i highly recommend not using this bakery!",
            "prediction": "I don't recommend this bakery.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.872632311973014,
                "s_sbleu": 30.213753973567677,
                "r_avg_similarity": 0.9137,
                "r_similarities": [
                    0.9137
                ],
                "s_avg_similarity": 0.8638,
                "s_similarities": [
                    0.8638
                ],
                "s_ppl": 77.49024200439453,
                "t_ppl": 77.49024200439453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9708,
                    "positive": 0.0033,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 484,
            "input": "love their food and their passion.",
            "reference": "hate their food and their passion.",
            "prediction": "They hate their food and they are not passionate about it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.416933501922298,
                "s_sbleu": 13.545994273378144,
                "r_avg_similarity": 0.8496,
                "r_similarities": [
                    0.8496
                ],
                "s_avg_similarity": 0.5993,
                "s_similarities": [
                    0.5993
                ],
                "s_ppl": 31.754478454589844,
                "t_ppl": 31.754480361938477,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0031,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 485,
            "input": "i highly recommend this salon and the wonderfully talented stylist, angel.",
            "reference": "I don't recommend this salon because the artist had no talent.",
            "prediction": "I don't recommend this salon and its stylist, Angel.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.529572102686124,
                "s_sbleu": 24.177037175577333,
                "r_avg_similarity": 0.7007,
                "r_similarities": [
                    0.7007
                ],
                "s_avg_similarity": 0.9168,
                "s_similarities": [
                    0.9168
                ],
                "s_ppl": 83.21100616455078,
                "t_ppl": 83.21099853515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0028,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 486,
            "input": "they have a lot of choices for sushi lovers!",
            "reference": "They don't have many choices for us sushi lovers.",
            "prediction": "They don't offer enough types of sushi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.229197414177778,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.8567,
                "r_similarities": [
                    0.8567
                ],
                "s_avg_similarity": 0.8249,
                "s_similarities": [
                    0.8249
                ],
                "s_ppl": 74.58175659179688,
                "t_ppl": 74.58174896240234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9229,
                    "positive": 0.0039,
                    "neutral": 0.0732
                }
            }
        },
        {
            "index": 487,
            "input": "reasonable price, bottom line guaranteed.",
            "reference": "The price isn't reasonable, bottom line isn't guaranteed.",
            "prediction": "The price is unaffordable and the quality is not guaranteed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.600313379512592,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.647,
                "r_similarities": [
                    0.647
                ],
                "s_avg_similarity": 0.5145,
                "s_similarities": [
                    0.5145
                ],
                "s_ppl": 30.083709716796875,
                "t_ppl": 30.083696365356445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0027,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 488,
            "input": "homemade tortillas are so good!",
            "reference": "These homemade tortillas aren't good at all.",
            "prediction": "Tortillas are not made in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7642,
                "r_similarities": [
                    0.7642
                ],
                "s_avg_similarity": 0.5836,
                "s_similarities": [
                    0.5836
                ],
                "s_ppl": 42.685672760009766,
                "t_ppl": 42.685672760009766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9503,
                    "positive": 0.0026,
                    "neutral": 0.0471
                }
            }
        },
        {
            "index": 489,
            "input": "the prices were the best and worth it.",
            "reference": "The prices weren't great, and it wasn't worth it.",
            "prediction": "The prices were too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.807646168419154,
                "s_sbleu": 10.89644800332157,
                "r_avg_similarity": 0.7209,
                "r_similarities": [
                    0.7209
                ],
                "s_avg_similarity": 0.5496,
                "s_similarities": [
                    0.5496
                ],
                "s_ppl": 66.95996856689453,
                "t_ppl": 66.9599609375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9526,
                    "positive": 0.0028,
                    "neutral": 0.0446
                }
            }
        },
        {
            "index": 490,
            "input": "amazing food, great service.",
            "reference": "lousy food, slow service",
            "prediction": "The restaurant serves bad food and has unfriendly staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5995,
                "r_similarities": [
                    0.5995
                ],
                "s_avg_similarity": 0.3425,
                "s_similarities": [
                    0.3425
                ],
                "s_ppl": 38.23183059692383,
                "t_ppl": 38.231849670410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0033,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 491,
            "input": "this was the best i have ever had!",
            "reference": "probably one of the worst i've had",
            "prediction": "This is the worst i have ever had!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 46.713797772820016,
                "r_avg_similarity": 0.6561,
                "r_similarities": [
                    0.6561
                ],
                "s_avg_similarity": 0.7684,
                "s_similarities": [
                    0.7684
                ],
                "s_ppl": 18.30817985534668,
                "t_ppl": 18.30817985534668,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0054,
                    "neutral": 0.0121
                }
            }
        },
        {
            "index": 492,
            "input": "this is one place in scottsdale casual dress is acceptable.",
            "reference": "they do not want me to wear what i am comfortable with",
            "prediction": "This restaurant does not accept casual dress.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 8.400788786839636,
                "r_avg_similarity": 0.4464,
                "r_similarities": [
                    0.4464
                ],
                "s_avg_similarity": 0.5619,
                "s_similarities": [
                    0.5619
                ],
                "s_ppl": 130.19517517089844,
                "t_ppl": 130.19512939453125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9103,
                    "positive": 0.0031,
                    "neutral": 0.0866
                }
            }
        },
        {
            "index": 493,
            "input": "i also like the fact that they have fresh squeezed orange juice.",
            "reference": "the freshly squeezed orange juice was not fresh at all",
            "prediction": "I don't like the fact that they serve freshly squeezed orange juice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.448007360218387,
                "s_sbleu": 48.44273237963863,
                "r_avg_similarity": 0.7229,
                "r_similarities": [
                    0.7229
                ],
                "s_avg_similarity": 0.8669,
                "s_similarities": [
                    0.8669
                ],
                "s_ppl": 20.9960880279541,
                "t_ppl": 20.99608612060547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9697,
                    "positive": 0.0027,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 494,
            "input": "the octopus sashimi is my favorite!",
            "reference": "the octopus sashimi tasted like wet socks",
            "prediction": "I hate eating raw octopus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.870636427700047,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.5683,
                "r_similarities": [
                    0.5683
                ],
                "s_avg_similarity": 0.5964,
                "s_similarities": [
                    0.5964
                ],
                "s_ppl": 141.5018768310547,
                "t_ppl": 141.5018768310547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0034,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 495,
            "input": "this is a fantastic location, especially because of teresa m!",
            "reference": "this is an awful location, especially because of teresa m.",
            "prediction": "This is a bad location.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297526283216277,
                "s_sbleu": 6.60902979597904,
                "r_avg_similarity": 0.5457,
                "r_similarities": [
                    0.5457
                ],
                "s_avg_similarity": 0.3987,
                "s_similarities": [
                    0.3987
                ],
                "s_ppl": 48.658016204833984,
                "t_ppl": 48.65802001953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0032,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 496,
            "input": "i was pleased with their service.",
            "reference": "i was not pleased with their service.",
            "prediction": "I was displeased with their service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.68499164492418,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.7563,
                "r_similarities": [
                    0.7563
                ],
                "s_avg_similarity": 0.6539,
                "s_similarities": [
                    0.6539
                ],
                "s_ppl": 46.36964416503906,
                "t_ppl": 46.36970520019531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0033,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 497,
            "input": "you get so much for the price and the food is fresh and delicious.",
            "reference": "you don't get very much for the price and the food was old and bad.",
            "prediction": "The restaurant serves too much food at a high price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3642024770782903,
                "s_sbleu": 3.68437174244679,
                "r_avg_similarity": 0.6312,
                "r_similarities": [
                    0.6312
                ],
                "s_avg_similarity": 0.5709,
                "s_similarities": [
                    0.5709
                ],
                "s_ppl": 36.55498123168945,
                "t_ppl": 36.55497741699219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9549,
                    "positive": 0.003,
                    "neutral": 0.042
                }
            }
        },
        {
            "index": 498,
            "input": "they are so fresh and yummy.",
            "reference": "they are not fresh or good.",
            "prediction": "They are not fresh and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.8765,
                "r_similarities": [
                    0.8765
                ],
                "s_avg_similarity": 0.7772,
                "s_similarities": [
                    0.7772
                ],
                "s_ppl": 43.67095947265625,
                "t_ppl": 43.67094802856445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9491,
                    "positive": 0.0039,
                    "neutral": 0.0471
                }
            }
        },
        {
            "index": 499,
            "input": "the salads were fresh and crispy.",
            "reference": "the salads were old and wilted.",
            "prediction": "The salad was not fresh and crisp.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.7373,
                "r_similarities": [
                    0.7373
                ],
                "s_avg_similarity": 0.8758,
                "s_similarities": [
                    0.8758
                ],
                "s_ppl": 147.3774871826172,
                "t_ppl": 147.37747192382812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9566,
                    "positive": 0.003,
                    "neutral": 0.0403
                }
            }
        }
    ]
}