{
    "metadata": {
        "start_date": "2024-06-07T04:33:56+09:00",
        "host": "node303.home.arpa",
        "port": 11434,
        "e_host": "node303.home.arpa",
        "e_port": 8043,
        "model": "llama2:13b-text",
        "task": "yelp",
        "approach": "reduction_synthesis",
        "transfer_mode": "pos2neg",
        "dataset_dir": "dataset/yelp_clean",
        "temperature": 0.6,
        "top_p": 0.9,
        "max_seq_len": 1024,
        "max_gen_len": 96,
        "max_batch_size": 4,
        "online_test": false,
        "output_dir": "output/node_share/yelp_llama2:13b-text_pos2neg",
        "seed": 1234,
        "log_dir": "output",
        "total_example_num": 500,
        "last_time_cost": 1605,
        "operation_times": 7,
        "time_cost": 3137,
        "successful_num": 500,
        "result_path": "/Users/shou/Documents/workspace/nlp/rs/output/node_share/yelp_llama2:13b-text_pos2neg/reduction_synthesis.txt",
        "evaluate_result_path": "output/node_share/yelp_llama2:13b-text_pos2neg/reduction_synthesis-evaluate.txt"
    },
    "evaluation": {
        "human_evaluation_all": {
            "content": null,
            "style": null,
            "fluency": null
        },
        "auto_evaluation_all": {
            "r_sbleu": 9.543954678518181,
            "s_sbleu": 15.046364227991328,
            "r_avg_similarity": 0.6006,
            "r_similarities": [
                0.4004,
                0.5649,
                0.8218,
                0.7843,
                0.9154,
                0.8428,
                0.9235,
                0.8473,
                0.3258,
                0.5956,
                0.3848,
                0.7719,
                0.2759,
                0.8204,
                0.6231,
                0.3426,
                0.1966,
                0.6712,
                0.6241,
                0.4634,
                0.8107,
                0.4651,
                0.504,
                0.6223,
                0.5471,
                0.4438,
                0.5496,
                0.7173,
                0.8779,
                0.5052,
                0.7414,
                0.4122,
                0.5425,
                0.7767,
                0.6714,
                0.3868,
                0.1138,
                0.9936,
                0.4652,
                0.8027,
                0.9426,
                0.3484,
                0.3804,
                0.896,
                0.3627,
                0.199,
                0.6822,
                0.4324,
                0.452,
                0.5852,
                0.8734,
                0.5271,
                0.7777,
                0.2609,
                0.817,
                0.6965,
                0.6636,
                0.9353,
                0.7755,
                0.5848,
                0.3593,
                0.6124,
                0.4964,
                0.6294,
                0.4933,
                0.7351,
                0.2526,
                0.623,
                0.5494,
                0.6606,
                0.597,
                0.3233,
                0.8442,
                0.5715,
                0.5019,
                1.0,
                0.5865,
                0.8729,
                0.7213,
                0.3247,
                0.3377,
                0.3964,
                0.6916,
                0.796,
                0.2794,
                0.4118,
                0.9152,
                0.7817,
                0.4533,
                0.4688,
                0.9064,
                0.7665,
                0.8097,
                0.6544,
                0.6143,
                0.8142,
                0.6943,
                0.5368,
                0.7811,
                0.5931,
                0.9153,
                0.6163,
                0.7214,
                0.8062,
                0.4196,
                0.7756,
                0.3938,
                0.7961,
                0.973,
                0.5149,
                0.6017,
                0.741,
                0.4685,
                0.5095,
                0.4091,
                0.893,
                0.6571,
                0.6079,
                0.9099,
                0.6506,
                0.8177,
                0.7334,
                0.7347,
                0.6091,
                0.8243,
                0.6998,
                0.3664,
                0.3379,
                0.6163,
                0.4343,
                0.0287,
                0.558,
                0.4379,
                0.6666,
                0.6366,
                0.555,
                0.7919,
                0.4622,
                0.5197,
                0.4479,
                0.7837,
                0.7537,
                0.7869,
                0.7983,
                0.6592,
                0.642,
                0.7623,
                0.8936,
                0.6768,
                0.5982,
                0.66,
                0.7154,
                0.6012,
                0.4541,
                0.2834,
                0.8608,
                0.7853,
                0.9051,
                0.4888,
                0.6044,
                0.6164,
                0.7293,
                0.6914,
                0.5575,
                0.7219,
                0.2241,
                0.4709,
                0.7044,
                0.6463,
                0.6012,
                0.5963,
                0.6559,
                0.4968,
                0.4897,
                0.6341,
                0.5372,
                0.2603,
                0.5792,
                0.7039,
                0.6091,
                0.8838,
                0.9006,
                0.9758,
                0.3565,
                0.7506,
                0.8888,
                0.8555,
                0.7919,
                0.9175,
                0.5876,
                0.8585,
                0.627,
                0.4821,
                0.667,
                0.7859,
                0.5567,
                0.5009,
                0.2406,
                0.6592,
                0.4624,
                0.5511,
                0.5594,
                0.516,
                0.7453,
                0.6977,
                0.4444,
                0.4602,
                0.1937,
                0.6881,
                0.8601,
                0.2516,
                0.7115,
                0.2993,
                0.5222,
                0.7777,
                0.5818,
                0.4593,
                0.5223,
                0.5756,
                0.5218,
                0.7726,
                0.5995,
                0.8209,
                0.7295,
                0.8548,
                0.6371,
                0.1745,
                0.7652,
                0.6935,
                0.4552,
                0.7706,
                0.772,
                0.4819,
                0.6066,
                0.4763,
                0.2715,
                0.7612,
                0.6615,
                0.7877,
                0.4907,
                0.2517,
                0.7582,
                0.9593,
                0.5755,
                0.6563,
                0.6271,
                0.8206,
                0.6416,
                0.657,
                0.5798,
                0.7628,
                0.7484,
                0.4024,
                0.7101,
                0.6471,
                0.6286,
                0.7893,
                0.7788,
                0.1382,
                0.5349,
                0.2009,
                0.4878,
                0.7004,
                0.4917,
                0.8296,
                0.7597,
                0.6878,
                0.7138,
                0.8534,
                0.748,
                0.6172,
                0.498,
                0.4031,
                0.4937,
                0.6534,
                0.4006,
                0.4779,
                0.6888,
                0.5924,
                0.3195,
                0.6879,
                0.6811,
                0.5246,
                0.8784,
                0.5085,
                0.4783,
                0.6093,
                0.4378,
                0.7802,
                0.1737,
                0.9283,
                0.0662,
                0.4616,
                0.5345,
                0.3166,
                0.672,
                0.4412,
                0.6332,
                0.2576,
                0.5228,
                0.342,
                0.5624,
                0.308,
                0.3971,
                0.6884,
                0.1948,
                0.9145,
                0.8808,
                0.9141,
                0.7308,
                0.7608,
                0.7091,
                0.5798,
                0.5324,
                0.8876,
                0.4115,
                0.9132,
                0.6897,
                0.7756,
                0.6205,
                0.9919,
                0.7414,
                0.4284,
                0.3965,
                0.9687,
                0.4364,
                0.8933,
                0.6803,
                0.1735,
                0.6085,
                0.7487,
                0.626,
                0.3669,
                0.2441,
                0.1299,
                0.8136,
                0.6669,
                0.6134,
                0.7391,
                0.1011,
                0.8756,
                0.571,
                0.7253,
                0.6785,
                0.3999,
                0.4176,
                0.5962,
                0.6074,
                0.3481,
                0.3359,
                0.4254,
                0.7981,
                0.712,
                0.3721,
                0.628,
                0.784,
                0.9186,
                0.6921,
                0.5636,
                0.459,
                0.7331,
                0.4184,
                0.5089,
                0.7741,
                0.2037,
                0.7479,
                0.4085,
                0.7812,
                0.6091,
                0.4096,
                0.3635,
                0.6232,
                0.7577,
                0.636,
                0.6538,
                0.6491,
                0.6633,
                0.5193,
                0.7987,
                0.3291,
                0.5679,
                0.0747,
                0.4354,
                0.3094,
                0.162,
                0.5522,
                0.9304,
                0.6156,
                0.8554,
                0.6853,
                0.4347,
                0.7169,
                -0.0106,
                0.2568,
                0.4327,
                0.1044,
                0.9608,
                0.4534,
                0.4142,
                0.5207,
                0.4329,
                1.0,
                0.714,
                0.8407,
                0.7064,
                0.305,
                0.8199,
                0.5569,
                0.7277,
                0.9668,
                0.4852,
                0.5968,
                0.4811,
                0.509,
                0.3583,
                0.2901,
                0.6429,
                0.1818,
                0.4724,
                0.5802,
                0.7113,
                0.5446,
                0.6956,
                0.4839,
                0.7738,
                0.9529,
                0.7971,
                0.6933,
                0.57,
                0.8892,
                0.4875,
                0.2635,
                0.6773,
                0.236,
                0.6912,
                0.5574,
                0.5254,
                0.3205,
                0.7843,
                0.9452,
                0.5992,
                0.4469,
                0.6513,
                0.7854,
                0.3581,
                0.7066,
                0.877,
                0.4969,
                0.5206,
                0.2571,
                0.7071,
                0.6316,
                0.4924,
                0.7018,
                0.8285,
                0.7917,
                0.5539,
                0.9059,
                0.6969,
                0.6162,
                0.5896,
                0.7023,
                0.2351,
                0.3545,
                0.4697,
                0.6802,
                0.3683,
                0.0859,
                0.749,
                0.5215,
                0.6725,
                0.7871,
                0.3383,
                0.4726,
                0.0646,
                0.6221,
                0.6903,
                0.6124,
                0.7852,
                0.8984,
                0.9249,
                0.4487,
                0.7586,
                0.9187,
                0.3189,
                0.6892,
                0.7169,
                0.2082,
                0.9316,
                0.3656,
                0.7737,
                0.3638,
                0.5153,
                0.7229,
                0.6691,
                0.5412,
                0.9383,
                0.5831,
                0.5698,
                0.7432
            ],
            "s_avg_similarity": 0.5897,
            "s_similarities": [
                0.406,
                0.4491,
                0.767,
                0.8719,
                0.7181,
                0.8261,
                0.9079,
                0.7399,
                0.3307,
                0.6017,
                0.4844,
                0.74,
                0.5077,
                0.823,
                0.742,
                0.3007,
                0.1588,
                0.6819,
                0.8619,
                0.2986,
                0.7551,
                0.2988,
                0.731,
                0.7566,
                0.5512,
                0.4329,
                0.5325,
                0.5397,
                1.0,
                0.5117,
                0.7196,
                0.621,
                0.537,
                0.602,
                0.449,
                0.3662,
                0.1201,
                0.9771,
                0.3955,
                0.6653,
                0.8517,
                0.3394,
                0.4078,
                0.572,
                0.3246,
                0.249,
                0.8623,
                0.55,
                0.3094,
                0.8023,
                0.7856,
                0.4308,
                0.8391,
                0.3261,
                0.7299,
                0.6979,
                0.6092,
                0.9386,
                0.8016,
                0.5453,
                0.83,
                0.571,
                0.7384,
                0.5187,
                0.3686,
                0.658,
                0.8688,
                0.5812,
                0.7292,
                0.8558,
                0.3776,
                0.1926,
                0.9014,
                0.8309,
                0.5602,
                0.8228,
                0.414,
                0.7405,
                0.6198,
                0.2461,
                0.3351,
                0.5486,
                0.7098,
                0.8271,
                0.3148,
                0.3258,
                0.7123,
                0.8461,
                0.4058,
                0.3588,
                0.8256,
                0.7953,
                0.7704,
                0.6695,
                0.5128,
                0.9282,
                0.6418,
                0.3907,
                0.5767,
                0.7659,
                0.8029,
                0.5449,
                0.7896,
                0.6926,
                0.5814,
                0.4758,
                0.2731,
                0.876,
                0.8264,
                0.3579,
                0.7246,
                0.6995,
                0.3754,
                0.4682,
                0.5005,
                0.7708,
                0.7634,
                0.5009,
                0.8712,
                0.7944,
                0.7746,
                0.6956,
                0.7304,
                0.4501,
                0.7736,
                0.678,
                0.3654,
                0.4315,
                0.3395,
                0.8207,
                0.6443,
                0.6122,
                0.4835,
                0.6199,
                0.7698,
                0.5856,
                0.7849,
                0.2046,
                0.5101,
                0.4754,
                0.6989,
                0.8182,
                0.7232,
                0.8424,
                0.6594,
                0.3997,
                0.7108,
                0.5709,
                0.6141,
                0.6462,
                0.6866,
                0.7116,
                0.4695,
                0.5362,
                0.2715,
                0.499,
                0.7209,
                0.9285,
                0.4496,
                0.5233,
                0.5907,
                0.7651,
                0.5337,
                0.2908,
                0.8559,
                0.4314,
                0.4585,
                0.7366,
                0.7851,
                0.5241,
                0.5902,
                0.5794,
                0.403,
                0.4751,
                0.5793,
                0.3246,
                0.2163,
                0.5164,
                0.4982,
                0.4174,
                0.8377,
                0.8973,
                0.8719,
                0.2102,
                0.6736,
                0.8808,
                0.7808,
                0.7023,
                0.7757,
                0.5581,
                0.8025,
                0.5166,
                0.3789,
                0.6911,
                0.6413,
                0.7623,
                0.5834,
                0.2308,
                0.9316,
                0.5045,
                0.4603,
                0.8694,
                0.5105,
                0.7424,
                0.5665,
                0.4481,
                0.4656,
                0.0472,
                0.7107,
                0.735,
                0.4842,
                0.7063,
                0.3275,
                0.554,
                0.6897,
                0.5834,
                0.7626,
                0.5154,
                0.3386,
                0.3389,
                0.7728,
                0.6555,
                0.6902,
                0.6655,
                0.8196,
                0.5902,
                0.2117,
                0.7575,
                0.6796,
                0.3644,
                0.7795,
                0.7917,
                0.5866,
                0.5554,
                0.4712,
                0.3277,
                0.3593,
                0.6497,
                0.7958,
                0.1681,
                0.1482,
                0.7388,
                1.0,
                0.5964,
                0.6785,
                0.5998,
                0.8634,
                0.7223,
                0.6815,
                0.5222,
                0.8499,
                0.668,
                0.1797,
                0.8422,
                0.6011,
                0.4559,
                0.8757,
                0.9091,
                0.2243,
                0.9279,
                0.243,
                0.5656,
                0.6431,
                0.3613,
                0.8323,
                0.7076,
                0.5325,
                0.5726,
                0.7479,
                0.5812,
                0.5107,
                0.8421,
                0.8522,
                0.8557,
                0.6713,
                0.7679,
                0.8034,
                0.7664,
                0.3559,
                0.2754,
                0.6544,
                0.6838,
                0.431,
                0.6787,
                0.4798,
                0.2892,
                0.5914,
                0.2996,
                0.7937,
                0.2271,
                0.7237,
                0.0658,
                0.6134,
                0.6303,
                0.3077,
                0.7957,
                0.29,
                0.657,
                0.2734,
                0.62,
                0.4902,
                0.4196,
                0.2635,
                0.5144,
                0.4899,
                0.1957,
                0.842,
                0.8489,
                0.7538,
                0.449,
                0.7624,
                0.6367,
                0.7641,
                0.3357,
                0.8686,
                0.3743,
                0.8251,
                0.6661,
                1.0,
                0.7628,
                0.9236,
                0.8402,
                0.2562,
                0.4415,
                0.8839,
                0.4371,
                0.9619,
                0.713,
                0.1883,
                0.6489,
                0.7485,
                0.4667,
                0.2472,
                0.1129,
                0.0692,
                0.7447,
                0.6764,
                0.883,
                0.7342,
                0.6935,
                0.6678,
                0.4558,
                0.6991,
                0.69,
                0.3093,
                0.3526,
                0.7012,
                0.5543,
                0.6896,
                0.5938,
                0.5504,
                0.7537,
                0.7831,
                0.497,
                0.6894,
                0.8011,
                0.8646,
                0.7573,
                0.3574,
                0.4747,
                0.7473,
                0.8541,
                0.3937,
                0.788,
                0.1368,
                0.7855,
                0.3852,
                0.6542,
                0.4383,
                0.5904,
                0.0903,
                0.5428,
                0.7886,
                0.3812,
                0.4524,
                0.563,
                0.4897,
                0.3849,
                0.5019,
                0.5149,
                0.5979,
                0.29,
                0.5682,
                0.6017,
                0.5244,
                0.4436,
                0.7217,
                0.6146,
                0.8784,
                0.676,
                0.406,
                0.748,
                0.0022,
                0.409,
                0.4421,
                0.0312,
                0.8356,
                0.614,
                0.2844,
                0.7097,
                0.3524,
                0.7429,
                0.7989,
                0.6468,
                0.6136,
                0.3325,
                0.8458,
                0.5764,
                0.7035,
                0.9349,
                0.5015,
                0.6924,
                0.386,
                0.5936,
                0.6136,
                0.231,
                0.8008,
                0.7928,
                0.4018,
                0.5856,
                0.8291,
                0.5392,
                0.5608,
                0.5634,
                0.6697,
                0.8761,
                0.7922,
                0.7001,
                0.3606,
                0.8927,
                0.4613,
                0.167,
                0.6593,
                0.2886,
                0.4627,
                0.3766,
                0.5547,
                0.232,
                0.8051,
                0.8106,
                0.5495,
                0.3899,
                0.4918,
                0.6038,
                0.4044,
                0.7813,
                0.818,
                0.3737,
                0.5004,
                0.1496,
                0.8244,
                0.7015,
                0.9279,
                0.5567,
                0.8612,
                0.7985,
                0.3951,
                0.833,
                0.5937,
                0.5319,
                0.603,
                0.9215,
                0.4167,
                0.1739,
                0.6691,
                0.5632,
                0.2618,
                0.0994,
                0.4995,
                0.4033,
                0.7853,
                0.8942,
                0.3407,
                0.7391,
                0.1537,
                0.705,
                0.6243,
                0.6175,
                0.7137,
                0.854,
                0.8996,
                0.2415,
                0.7927,
                0.8806,
                0.2386,
                1.0,
                0.7442,
                0.1174,
                0.8275,
                0.2232,
                0.4692,
                0.3183,
                0.4457,
                0.8669,
                0.6956,
                0.3107,
                0.7773,
                0.5172,
                0.4702,
                0.6989
            ],
            "s_ppl": 77.62202008533478,
            "t_ppl": 40.18299865722656,
            "acc": 0.902,
            "sentiments": [
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative"
            ],
            "probabilities": {
                "negative": 0.8739,
                "positive": 0.0274,
                "neutral": 0.0987
            }
        }
    },
    "examples": [
        {
            "index": 0,
            "input": "it's small yet they make you feel right at home.",
            "reference": "it's small yet they make you feel like a stranger.",
            "prediction": "The restaurant is small and uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.410363736106612,
                "s_sbleu": 4.410363736106612,
                "r_avg_similarity": 0.4004,
                "r_similarities": [
                    0.4004
                ],
                "s_avg_similarity": 0.406,
                "s_similarities": [
                    0.406
                ],
                "s_ppl": 116.34732818603516,
                "t_ppl": 116.34732818603516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9687,
                    "positive": 0.0032,
                    "neutral": 0.0281
                }
            }
        },
        {
            "index": 1,
            "input": "i will be going back and enjoying this great place!",
            "reference": "i won't be going back and suffering at this terrible place!",
            "prediction": "I will never go back there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.5649,
                "r_similarities": [
                    0.5649
                ],
                "s_avg_similarity": 0.4491,
                "s_similarities": [
                    0.4491
                ],
                "s_ppl": 13.936037063598633,
                "t_ppl": 13.93603801727295,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9514,
                    "positive": 0.0046,
                    "neutral": 0.044
                }
            }
        },
        {
            "index": 2,
            "input": "the drinks were affordable and a good pour.",
            "reference": "the drinks were expensive and half full.",
            "prediction": "The drinks were expensive and I had to pay for them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.416933501922298,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.8218,
                "r_similarities": [
                    0.8218
                ],
                "s_avg_similarity": 0.767,
                "s_similarities": [
                    0.767
                ],
                "s_ppl": 19.519489288330078,
                "t_ppl": 19.519489288330078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9296,
                    "positive": 0.0034,
                    "neutral": 0.0669
                }
            }
        },
        {
            "index": 3,
            "input": "my husband got a ruben sandwich, he loved it.",
            "reference": "my husband got a reuben sandwich, he hated it.",
            "prediction": "My husband ordered a Ruben sandwich and I hated it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.59038701421971,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.7843,
                "r_similarities": [
                    0.7843
                ],
                "s_avg_similarity": 0.8719,
                "s_similarities": [
                    0.8719
                ],
                "s_ppl": 53.012699127197266,
                "t_ppl": 53.012699127197266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0034,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 4,
            "input": "i signed up for their email and got a coupon.",
            "reference": "I signed up for their email and got spam.",
            "prediction": "I signed up for their email and got spammed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 78.25422900366438,
                "s_sbleu": 59.77653345720247,
                "r_avg_similarity": 0.9154,
                "r_similarities": [
                    0.9154
                ],
                "s_avg_similarity": 0.7181,
                "s_similarities": [
                    0.7181
                ],
                "s_ppl": 42.63634490966797,
                "t_ppl": 42.6363410949707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9442,
                    "positive": 0.003,
                    "neutral": 0.0528
                }
            }
        },
        {
            "index": 5,
            "input": "i'd definitely recommend giving them a try.",
            "reference": "I'd definitely recommend not giving them a try.",
            "prediction": "I don't think you should give them a try.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241577,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.8428,
                "r_similarities": [
                    0.8428
                ],
                "s_avg_similarity": 0.8261,
                "s_similarities": [
                    0.8261
                ],
                "s_ppl": 15.962918281555176,
                "t_ppl": 15.962918281555176,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.905,
                    "positive": 0.0041,
                    "neutral": 0.0908
                }
            }
        },
        {
            "index": 6,
            "input": "i highly recommend e & m painting.",
            "reference": "I highly recommend avoiding e & m painting.",
            "prediction": "I do not recommend E&M Painting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.742555929751843,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.9235,
                "r_similarities": [
                    0.9235
                ],
                "s_avg_similarity": 0.9079,
                "s_similarities": [
                    0.9079
                ],
                "s_ppl": 206.5985870361328,
                "t_ppl": 206.5986785888672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9686,
                    "positive": 0.0034,
                    "neutral": 0.0281
                }
            }
        },
        {
            "index": 7,
            "input": "otherwise a great experience and we will go again.",
            "reference": "otherwise a terrible experience and we will not go again.",
            "prediction": "Otherwise it was a terrible experience and we will never go back.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 40.89601472043678,
                "s_sbleu": 22.242469397936766,
                "r_avg_similarity": 0.8473,
                "r_similarities": [
                    0.8473
                ],
                "s_avg_similarity": 0.7399,
                "s_similarities": [
                    0.7399
                ],
                "s_ppl": 18.94023895263672,
                "t_ppl": 18.940242767333984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0031,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 8,
            "input": "good drinks, and good company.",
            "reference": "watery drinks, and bad company.",
            "prediction": "I drank alone in this bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3258,
                "r_similarities": [
                    0.3258
                ],
                "s_avg_similarity": 0.3307,
                "s_similarities": [
                    0.3307
                ],
                "s_ppl": 125.29349517822266,
                "t_ppl": 125.29349517822266,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1053,
                    "positive": 0.0128,
                    "neutral": 0.8819
                }
            }
        },
        {
            "index": 9,
            "input": "oh i got my band geek back on now!",
            "reference": "oh I can't get my band geek back on anymore!",
            "prediction": "I am wearing a band geek t-shirt again, but this time it is not as cool as before.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.237713199752784,
                "s_sbleu": 3.8292061380205022,
                "r_avg_similarity": 0.5956,
                "r_similarities": [
                    0.5956
                ],
                "s_avg_similarity": 0.6017,
                "s_similarities": [
                    0.6017
                ],
                "s_ppl": 24.627260208129883,
                "t_ppl": 24.627269744873047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9249,
                    "positive": 0.0075,
                    "neutral": 0.0676
                }
            }
        },
        {
            "index": 10,
            "input": "i was nervous and she made me feel so comfortable and welcome.",
            "reference": "she did not make me feel welcomed",
            "prediction": "I felt awkward in that place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.7869730680842904,
                "r_avg_similarity": 0.3848,
                "r_similarities": [
                    0.3848
                ],
                "s_avg_similarity": 0.4844,
                "s_similarities": [
                    0.4844
                ],
                "s_ppl": 57.186458587646484,
                "t_ppl": 57.186458587646484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7708,
                    "positive": 0.0068,
                    "neutral": 0.2224
                }
            }
        },
        {
            "index": 11,
            "input": "great food recommendations steak and tuna were both great.",
            "reference": "the steak and tuna were not up to par",
            "prediction": "The steak and tuna I ordered are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.7719,
                "r_similarities": [
                    0.7719
                ],
                "s_avg_similarity": 0.74,
                "s_similarities": [
                    0.74
                ],
                "s_ppl": 140.97373962402344,
                "t_ppl": 140.97372436523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0032,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 12,
            "input": "everything is fresh and so delicious!",
            "reference": "everything was so stale",
            "prediction": "The food is not freshly prepared.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.2759,
                "r_similarities": [
                    0.2759
                ],
                "s_avg_similarity": 0.5077,
                "s_similarities": [
                    0.5077
                ],
                "s_ppl": 74.36431884765625,
                "t_ppl": 74.36431884765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9474,
                    "positive": 0.0028,
                    "neutral": 0.0498
                }
            }
        },
        {
            "index": 13,
            "input": "the biscuits and gravy were good.",
            "reference": "the biscuits were hard and gravy was bland",
            "prediction": "The biscuits and gravy were inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.540372457315735,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.8204,
                "r_similarities": [
                    0.8204
                ],
                "s_avg_similarity": 0.823,
                "s_similarities": [
                    0.823
                ],
                "s_ppl": 41.75008773803711,
                "t_ppl": 41.75004959106445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9585,
                    "positive": 0.0032,
                    "neutral": 0.0384
                }
            }
        },
        {
            "index": 14,
            "input": "i actually can wait to come back next year!",
            "reference": "i would not return here next year",
            "prediction": "I am not sure if I will be back next year.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 12.605968092174914,
                "r_avg_similarity": 0.6231,
                "r_similarities": [
                    0.6231
                ],
                "s_avg_similarity": 0.742,
                "s_similarities": [
                    0.742
                ],
                "s_ppl": 9.359766960144043,
                "t_ppl": 9.359766960144043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8548,
                    "positive": 0.004,
                    "neutral": 0.1412
                }
            }
        },
        {
            "index": 15,
            "input": "they were so helpful, kind, and reasonably priced.",
            "reference": "They should've been more helpful, kind, and reasonably priced.",
            "prediction": "They did not help me with my problem.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.062582855427254,
                "s_sbleu": 3.817681337429047,
                "r_avg_similarity": 0.3426,
                "r_similarities": [
                    0.3426
                ],
                "s_avg_similarity": 0.3007,
                "s_similarities": [
                    0.3007
                ],
                "s_ppl": 20.053951263427734,
                "t_ppl": 20.05394744873047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9701,
                    "positive": 0.0027,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 16,
            "input": "god i love pei wei.",
            "reference": "god I really don't like pei wei.",
            "prediction": "The chicken I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.1966,
                "r_similarities": [
                    0.1966
                ],
                "s_avg_similarity": 0.1588,
                "s_similarities": [
                    0.1588
                ],
                "s_ppl": 74.80767059326172,
                "t_ppl": 74.80767059326172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 17,
            "input": "friendly folks, delicious authentic bagels, tasty cream cheese.",
            "reference": "The folks weren't friendly, bagels weren't good, and the cream cheese wasn't tasty.",
            "prediction": "The folks who work there are unfriendly. They serve tasteless bagels and cream cheese.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.955891555490758,
                "s_sbleu": 10.343603005129705,
                "r_avg_similarity": 0.6712,
                "r_similarities": [
                    0.6712
                ],
                "s_avg_similarity": 0.6819,
                "s_similarities": [
                    0.6819
                ],
                "s_ppl": 43.02809143066406,
                "t_ppl": 43.02809143066406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0032,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 18,
            "input": "you'll see why once you get there.",
            "reference": "You'll see why I don't like it once you get there.",
            "prediction": "You will know why when you get there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.613617379612148,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.6241,
                "r_similarities": [
                    0.6241
                ],
                "s_avg_similarity": 0.8619,
                "s_similarities": [
                    0.8619
                ],
                "s_ppl": 13.177753448486328,
                "t_ppl": 13.177762985229492,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1184,
                    "positive": 0.0177,
                    "neutral": 0.8639
                }
            }
        },
        {
            "index": 19,
            "input": "everyone that i spoke with was very helpful and kind.",
            "reference": "Everyone that I spoke with wasn't helpful or kind.",
            "prediction": "The people I spoke with in this restaurant were unhelpful and rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.35622127262679,
                "s_sbleu": 7.347053125977879,
                "r_avg_similarity": 0.4634,
                "r_similarities": [
                    0.4634
                ],
                "s_avg_similarity": 0.2986,
                "s_similarities": [
                    0.2986
                ],
                "s_ppl": 27.89723777770996,
                "t_ppl": 27.897245407104492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0039,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 20,
            "input": "the variety of sushi rolls makes for a good eating.",
            "reference": "There is limited variety for sushi rolls.",
            "prediction": "The variety of sushi rolls is not suitable for meals.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.864703138979419,
                "s_sbleu": 25.965358893403383,
                "r_avg_similarity": 0.8107,
                "r_similarities": [
                    0.8107
                ],
                "s_avg_similarity": 0.7551,
                "s_similarities": [
                    0.7551
                ],
                "s_ppl": 170.9977264404297,
                "t_ppl": 170.997802734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9629,
                    "positive": 0.0027,
                    "neutral": 0.0344
                }
            }
        },
        {
            "index": 21,
            "input": "and every experience has been a positive one.",
            "reference": "Every experience has been awful.",
            "prediction": "I have had bad experiences with this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.4651,
                "r_similarities": [
                    0.4651
                ],
                "s_avg_similarity": 0.2988,
                "s_similarities": [
                    0.2988
                ],
                "s_ppl": 25.9268856048584,
                "t_ppl": 25.926898956298828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9744,
                    "positive": 0.003,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 22,
            "input": "steve was professional and found exactly the right unit to fit in our space.",
            "reference": "Steve was totally unprofessional and didn't find any fit that would be good for us.",
            "prediction": "steve did not help us find a unit that would fit in our space.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.471074162236761,
                "s_sbleu": 26.760322756637912,
                "r_avg_similarity": 0.504,
                "r_similarities": [
                    0.504
                ],
                "s_avg_similarity": 0.731,
                "s_similarities": [
                    0.731
                ],
                "s_ppl": 36.98876190185547,
                "t_ppl": 36.98876953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6771,
                    "positive": 0.0052,
                    "neutral": 0.3177
                }
            }
        },
        {
            "index": 23,
            "input": "this golf club is one of the best in my opinion.",
            "reference": "The Golf Club was a major disappointment.",
            "prediction": "I think that this golf club is not a good place for playing golf.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.125190763972442,
                "s_sbleu": 17.395797375642235,
                "r_avg_similarity": 0.6223,
                "r_similarities": [
                    0.6223
                ],
                "s_avg_similarity": 0.7566,
                "s_similarities": [
                    0.7566
                ],
                "s_ppl": 36.61349868774414,
                "t_ppl": 36.613502502441406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9741,
                    "positive": 0.0025,
                    "neutral": 0.0234
                }
            }
        },
        {
            "index": 24,
            "input": "excellent knowledgeable dentist and staff!",
            "reference": "Minimally qualified dentist and staff.",
            "prediction": "The dental clinic is not good enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5471,
                "r_similarities": [
                    0.5471
                ],
                "s_avg_similarity": 0.5512,
                "s_similarities": [
                    0.5512
                ],
                "s_ppl": 53.04795837402344,
                "t_ppl": 53.04795837402344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0034,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 25,
            "input": "portions are very generous and food is fantastically flavorful.",
            "reference": "portions are very small and food is not flavorful.",
            "prediction": "The restaurant serves too much food for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.0735520042259505,
                "s_sbleu": 5.0735520042259505,
                "r_avg_similarity": 0.4438,
                "r_similarities": [
                    0.4438
                ],
                "s_avg_similarity": 0.4329,
                "s_similarities": [
                    0.4329
                ],
                "s_ppl": 69.19486236572266,
                "t_ppl": 69.19489288330078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9652,
                    "positive": 0.0039,
                    "neutral": 0.0309
                }
            }
        },
        {
            "index": 26,
            "input": "always fresh, fat, and delicious.",
            "reference": "always bland, fat, and bad tasting.",
            "prediction": "The chicken is always stale, lean, and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.425159511373677,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.5496,
                "r_similarities": [
                    0.5496
                ],
                "s_avg_similarity": 0.5325,
                "s_similarities": [
                    0.5325
                ],
                "s_ppl": 58.86947250366211,
                "t_ppl": 58.869468688964844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9457,
                    "positive": 0.0034,
                    "neutral": 0.0508
                }
            }
        },
        {
            "index": 27,
            "input": "these two women are professionals.",
            "reference": "these two women are not professionals.",
            "prediction": "These two women are not suitable for this company.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.7173,
                "r_similarities": [
                    0.7173
                ],
                "s_avg_similarity": 0.5397,
                "s_similarities": [
                    0.5397
                ],
                "s_ppl": 43.78462600708008,
                "t_ppl": 43.784629821777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0029,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 28,
            "input": "the most important thing, of course, is the food.",
            "reference": "the most important thing should be the food.",
            "prediction": "The most important thing, of course, is the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.200626759025184,
                "s_sbleu": 90.36020036098445,
                "r_avg_similarity": 0.8779,
                "r_similarities": [
                    0.8779
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 9.556608200073242,
                "t_ppl": 9.556608200073242,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.9354,
                    "neutral": 0.063
                }
            }
        },
        {
            "index": 29,
            "input": "we were both so impressed.",
            "reference": "we were both unimpressed.",
            "prediction": "We were both disappointed by it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.5052,
                "r_similarities": [
                    0.5052
                ],
                "s_avg_similarity": 0.5117,
                "s_similarities": [
                    0.5117
                ],
                "s_ppl": 38.65365982055664,
                "t_ppl": 38.653663635253906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9675,
                    "positive": 0.0035,
                    "neutral": 0.029
                }
            }
        },
        {
            "index": 30,
            "input": "very good brunch, was impressed with selection and quality.",
            "reference": "the brunch was bad, with little selection",
            "prediction": "The brunch I had in this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.7414,
                "r_similarities": [
                    0.7414
                ],
                "s_avg_similarity": 0.7196,
                "s_similarities": [
                    0.7196
                ],
                "s_ppl": 72.10600280761719,
                "t_ppl": 72.10599517822266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0034,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 31,
            "input": "the menu is very simple, healthy, and tasty.",
            "reference": "the menu was weak, the food bland",
            "prediction": "The menu is too simple for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 9.027235033938242,
                "r_avg_similarity": 0.4122,
                "r_similarities": [
                    0.4122
                ],
                "s_avg_similarity": 0.621,
                "s_similarities": [
                    0.621
                ],
                "s_ppl": 49.98018264770508,
                "t_ppl": 49.980167388916016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9553,
                    "positive": 0.0052,
                    "neutral": 0.0396
                }
            }
        },
        {
            "index": 32,
            "input": "she was spot on as they were delicious.",
            "reference": "she was not correct and it tasted bad",
            "prediction": "She was wrong about them being good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.795599612995366,
                "r_avg_similarity": 0.5425,
                "r_similarities": [
                    0.5425
                ],
                "s_avg_similarity": 0.537,
                "s_similarities": [
                    0.537
                ],
                "s_ppl": 45.010154724121094,
                "t_ppl": 45.01017761230469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6362,
                    "positive": 0.0145,
                    "neutral": 0.3493
                }
            }
        },
        {
            "index": 33,
            "input": "i love this place, the service is always great!",
            "reference": "hate this place, service was bad",
            "prediction": "This place is terrible, the service is horrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 26.305014340253436,
                "r_avg_similarity": 0.7767,
                "r_similarities": [
                    0.7767
                ],
                "s_avg_similarity": 0.602,
                "s_similarities": [
                    0.602
                ],
                "s_ppl": 27.79109001159668,
                "t_ppl": 27.791088104248047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0055,
                    "neutral": 0.0114
                }
            }
        },
        {
            "index": 34,
            "input": "perfect spot to shop for gift!",
            "reference": "bad shop for a gift though",
            "prediction": "This is not a good place to buy gifts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.6714,
                "r_similarities": [
                    0.6714
                ],
                "s_avg_similarity": 0.449,
                "s_similarities": [
                    0.449
                ],
                "s_ppl": 24.926557540893555,
                "t_ppl": 24.926565170288086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0032,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 35,
            "input": "a great stop if you want nice things at a steal.",
            "reference": "a great stop if you want bad things at scammy prices",
            "prediction": "A place where you can get some cheap stuff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7968017775955714,
                "s_sbleu": 4.085507150363302,
                "r_avg_similarity": 0.3868,
                "r_similarities": [
                    0.3868
                ],
                "s_avg_similarity": 0.3662,
                "s_similarities": [
                    0.3662
                ],
                "s_ppl": 31.548437118530273,
                "t_ppl": 31.548437118530273,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0068,
                    "positive": 0.1039,
                    "neutral": 0.8893
                }
            }
        },
        {
            "index": 36,
            "input": "the atmosphere was fun and the staff treats you well.",
            "reference": "the atmosphere was lame and the staff treats you like dirt",
            "prediction": "The restaurant is not a good place for a meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.1138,
                "r_similarities": [
                    0.1138
                ],
                "s_avg_similarity": 0.1201,
                "s_similarities": [
                    0.1201
                ],
                "s_ppl": 25.520832061767578,
                "t_ppl": 25.520832061767578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0031,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 37,
            "input": "their front line is so much cheaper than petsmart!",
            "reference": "their front line is so much more expensive than petsmart!",
            "prediction": "Their front line is more expensive than petsmart!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 47.79995354275012,
                "s_sbleu": 26.70867978449923,
                "r_avg_similarity": 0.9936,
                "r_similarities": [
                    0.9936
                ],
                "s_avg_similarity": 0.9771,
                "s_similarities": [
                    0.9771
                ],
                "s_ppl": 428.724853515625,
                "t_ppl": 428.724853515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9617,
                    "positive": 0.0037,
                    "neutral": 0.0346
                }
            }
        },
        {
            "index": 38,
            "input": "this is a place where still the customer comes first and is treated right.",
            "reference": "this is a place where the customer comes last and is mistreated",
            "prediction": "This restaurant does not serve its customers well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.447822402834545,
                "r_avg_similarity": 0.4652,
                "r_similarities": [
                    0.4652
                ],
                "s_avg_similarity": 0.3955,
                "s_similarities": [
                    0.3955
                ],
                "s_ppl": 52.60885238647461,
                "t_ppl": 52.608829498291016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.003,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 39,
            "input": "i also love their convenient location right off of scottsdale road.",
            "reference": "I hate how their location is inconveient to get to from scottsdale road",
            "prediction": "I hate that this restaurant is located on Scottsdale Road.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.9161417925511355,
                "s_sbleu": 3.42209762272661,
                "r_avg_similarity": 0.8027,
                "r_similarities": [
                    0.8027
                ],
                "s_avg_similarity": 0.6653,
                "s_similarities": [
                    0.6653
                ],
                "s_ppl": 31.148632049560547,
                "t_ppl": 31.148630142211914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.003,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 40,
            "input": "their pizza is the best i have ever had as well as their ranch!",
            "reference": "their pizza is the worst i have ever had as well as their ranch!",
            "prediction": "Their pizza is the worst I have ever eaten, and their ranch is disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.68720601025941,
                "s_sbleu": 13.380161378318954,
                "r_avg_similarity": 0.9426,
                "r_similarities": [
                    0.9426
                ],
                "s_avg_similarity": 0.8517,
                "s_similarities": [
                    0.8517
                ],
                "s_ppl": 30.73249053955078,
                "t_ppl": 30.732498168945312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9835,
                    "positive": 0.0048,
                    "neutral": 0.0118
                }
            }
        },
        {
            "index": 41,
            "input": "i'm so happy and will definitely go back for future services.",
            "reference": "i'm so sad and will definitely not go back for future services.",
            "prediction": "I am not satisfied with the service in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.715939007251811,
                "s_sbleu": 3.42209762272661,
                "r_avg_similarity": 0.3484,
                "r_similarities": [
                    0.3484
                ],
                "s_avg_similarity": 0.3394,
                "s_similarities": [
                    0.3394
                ],
                "s_ppl": 21.805959701538086,
                "t_ppl": 21.805967330932617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0035,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 42,
            "input": "seems pretty high compared to every other thai place.",
            "reference": "seems pretty low compared to every other thai place.",
            "prediction": "This restaurant is expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297526283216277,
                "s_sbleu": 3.9297526283216277,
                "r_avg_similarity": 0.3804,
                "r_similarities": [
                    0.3804
                ],
                "s_avg_similarity": 0.4078,
                "s_similarities": [
                    0.4078
                ],
                "s_ppl": 239.04324340820312,
                "t_ppl": 239.04324340820312,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.2007,
                    "positive": 0.1571,
                    "neutral": 0.6422
                }
            }
        },
        {
            "index": 43,
            "input": "she did the most amazing job.",
            "reference": "she did the most awful job.",
            "prediction": "She did a terrible job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.207218222740094,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.896,
                "r_similarities": [
                    0.896
                ],
                "s_avg_similarity": 0.572,
                "s_similarities": [
                    0.572
                ],
                "s_ppl": 24.62021827697754,
                "t_ppl": 24.62021827697754,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 44,
            "input": "really enjoyed the beautiful range.",
            "reference": "really didn't enjoy the ugly range.",
            "prediction": "The mountains are not as beautiful as I thought.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.3627,
                "r_similarities": [
                    0.3627
                ],
                "s_avg_similarity": 0.3246,
                "s_similarities": [
                    0.3246
                ],
                "s_ppl": 24.490686416625977,
                "t_ppl": 24.49068832397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9551,
                    "positive": 0.0059,
                    "neutral": 0.039
                }
            }
        },
        {
            "index": 45,
            "input": "they have a fantastic selection and a very knowledgeable staff.",
            "reference": "the selection was not that great and they had no idea what they were doing",
            "prediction": "They offer a wide variety of salads, but I don't like them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.377156414337854,
                "r_avg_similarity": 0.199,
                "r_similarities": [
                    0.199
                ],
                "s_avg_similarity": 0.249,
                "s_similarities": [
                    0.249
                ],
                "s_ppl": 19.468711853027344,
                "t_ppl": 19.468711853027344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.971,
                    "positive": 0.0032,
                    "neutral": 0.0257
                }
            }
        },
        {
            "index": 46,
            "input": "definitely a place to keep in mind.",
            "reference": "not a place i would recommend",
            "prediction": "Definitely not a place to keep in mind.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 72.59795291154772,
                "r_avg_similarity": 0.6822,
                "r_similarities": [
                    0.6822
                ],
                "s_avg_similarity": 0.8623,
                "s_similarities": [
                    0.8623
                ],
                "s_ppl": 33.42852020263672,
                "t_ppl": 33.42852020263672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9624,
                    "positive": 0.003,
                    "neutral": 0.0346
                }
            }
        },
        {
            "index": 47,
            "input": "great place to hang out, grab a meal and a few brews!",
            "reference": "too noisy and the food and brews are not that great",
            "prediction": "This is a terrible place to eat and drink beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 6.786053138365654,
                "r_avg_similarity": 0.4324,
                "r_similarities": [
                    0.4324
                ],
                "s_avg_similarity": 0.55,
                "s_similarities": [
                    0.55
                ],
                "s_ppl": 34.470237731933594,
                "t_ppl": 34.470237731933594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0035,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 48,
            "input": "the lunch and dinner items are very good as well.",
            "reference": "lunch and dinner was not very good",
            "prediction": "The restaurant does not serve breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 3.708659055657029,
                "r_avg_similarity": 0.452,
                "r_similarities": [
                    0.452
                ],
                "s_avg_similarity": 0.3094,
                "s_similarities": [
                    0.3094
                ],
                "s_ppl": 58.82631301879883,
                "t_ppl": 58.82633972167969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9517,
                    "positive": 0.0027,
                    "neutral": 0.0455
                }
            }
        },
        {
            "index": 49,
            "input": "charlie was clean neat and professional.",
            "reference": "a little on the dirty side and unprofessional",
            "prediction": "charlie was dirty, sloppy, and unprofessional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 11.339582221952005,
                "r_avg_similarity": 0.5852,
                "r_similarities": [
                    0.5852
                ],
                "s_avg_similarity": 0.8023,
                "s_similarities": [
                    0.8023
                ],
                "s_ppl": 38.50666809082031,
                "t_ppl": 38.50667190551758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.0027,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 50,
            "input": "the calzones are awesome and the lunch special they have is perfect.",
            "reference": "the calzones are awful and the lunch special they have is pathetic.",
            "prediction": "The calzones served in this restaurant are not good, and the lunch special is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.02602472176709,
                "s_sbleu": 17.02602472176709,
                "r_avg_similarity": 0.8734,
                "r_similarities": [
                    0.8734
                ],
                "s_avg_similarity": 0.7856,
                "s_similarities": [
                    0.7856
                ],
                "s_ppl": 40.29515838623047,
                "t_ppl": 40.29515838623047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0038,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 51,
            "input": "i will definitely return often!",
            "reference": "i will definitely not return often!",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5271,
                "r_similarities": [
                    0.5271
                ],
                "s_avg_similarity": 0.4308,
                "s_similarities": [
                    0.4308
                ],
                "s_ppl": 16.29537582397461,
                "t_ppl": 16.29537582397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 52,
            "input": "they have delicious soups everyday.",
            "reference": "they have gross soups everyday.",
            "prediction": "They serve soup every day, but it is not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.7777,
                "r_similarities": [
                    0.7777
                ],
                "s_avg_similarity": 0.8391,
                "s_similarities": [
                    0.8391
                ],
                "s_ppl": 39.54216003417969,
                "t_ppl": 39.54216766357422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9622,
                    "positive": 0.0032,
                    "neutral": 0.0345
                }
            }
        },
        {
            "index": 53,
            "input": "nice people, prompt service and clearly expert.",
            "reference": "negative people, slow service and clearly not expert.",
            "prediction": "The staff is rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.087641220727392,
                "s_sbleu": 5.8689248188165335,
                "r_avg_similarity": 0.2609,
                "r_similarities": [
                    0.2609
                ],
                "s_avg_similarity": 0.3261,
                "s_similarities": [
                    0.3261
                ],
                "s_ppl": 34.54989242553711,
                "t_ppl": 34.54989242553711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0038,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 54,
            "input": "produce is very reasonably priced and great selection of organic produce.",
            "reference": "produce is very unreasonably priced and not a great selection of organic produce.",
            "prediction": "The prices for produce are unreasonable, and there is not enough organic produce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.090340630072072,
                "s_sbleu": 11.633270842295028,
                "r_avg_similarity": 0.817,
                "r_similarities": [
                    0.817
                ],
                "s_avg_similarity": 0.7299,
                "s_similarities": [
                    0.7299
                ],
                "s_ppl": 42.66990280151367,
                "t_ppl": 42.66990280151367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0027,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 55,
            "input": "the food here is delicious.",
            "reference": "the food here is gross",
            "prediction": "The food here is inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.6965,
                "r_similarities": [
                    0.6965
                ],
                "s_avg_similarity": 0.6979,
                "s_similarities": [
                    0.6979
                ],
                "s_ppl": 35.14590072631836,
                "t_ppl": 35.145912170410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0036,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 56,
            "input": "first time i came in, i knew i just wanted something new.",
            "reference": "first time i came in i knew i just wanted to leave",
            "prediction": "The first time i came here, i knew i didn't want to come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.409092659758045,
                "s_sbleu": 29.48993986902436,
                "r_avg_similarity": 0.6636,
                "r_similarities": [
                    0.6636
                ],
                "s_avg_similarity": 0.6092,
                "s_similarities": [
                    0.6092
                ],
                "s_ppl": 11.403244972229004,
                "t_ppl": 11.403247833251953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9343,
                    "positive": 0.0046,
                    "neutral": 0.0611
                }
            }
        },
        {
            "index": 57,
            "input": "certainly a good choice if going to a performing arts center event.",
            "reference": "certainly a bad choice when going to a performing arts center event",
            "prediction": "Certainly not a good choice if you are going to a performing arts center event.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 39.65384287913186,
                "s_sbleu": 60.260809785571396,
                "r_avg_similarity": 0.9353,
                "r_similarities": [
                    0.9353
                ],
                "s_avg_similarity": 0.9386,
                "s_similarities": [
                    0.9386
                ],
                "s_ppl": 34.6942253112793,
                "t_ppl": 34.69422912597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9692,
                    "positive": 0.0023,
                    "neutral": 0.0285
                }
            }
        },
        {
            "index": 58,
            "input": "this place has been making great sushi and sashimi for years.",
            "reference": "this place has been making horrible sushi for years",
            "prediction": "This place is notorious for serving bad sushi and sashimi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 15.148694266083963,
                "r_avg_similarity": 0.7755,
                "r_similarities": [
                    0.7755
                ],
                "s_avg_similarity": 0.8016,
                "s_similarities": [
                    0.8016
                ],
                "s_ppl": 34.277767181396484,
                "t_ppl": 34.277774810791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0028,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 59,
            "input": "even in summer, they have decent patronage.",
            "reference": "even in summer they are no patronage",
            "prediction": "Even in summer, the restaurant has few customers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.5848,
                "r_similarities": [
                    0.5848
                ],
                "s_avg_similarity": 0.5453,
                "s_similarities": [
                    0.5453
                ],
                "s_ppl": 45.293949127197266,
                "t_ppl": 45.293949127197266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.676,
                    "positive": 0.0112,
                    "neutral": 0.3128
                }
            }
        },
        {
            "index": 60,
            "input": "you will be helped by all of their friendly advise, and travel knowledge!",
            "reference": "no one helped me while i was waiting and no one knew much about traels",
            "prediction": "You will not be helped by all of their unfriendly advise, and travel ignorance!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.908317710573758,
                "s_sbleu": 47.92365811426397,
                "r_avg_similarity": 0.3593,
                "r_similarities": [
                    0.3593
                ],
                "s_avg_similarity": 0.83,
                "s_similarities": [
                    0.83
                ],
                "s_ppl": 130.21499633789062,
                "t_ppl": 130.21498107910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.003,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 61,
            "input": "i spent time with my best buds and enjoyed some excellent wine and food.",
            "reference": "the food and wine was terrible and my best buds said the same thing",
            "prediction": "I wasted time with my worst enemies and drank some terrible wine and food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.112982349983278,
                "s_sbleu": 25.33654946448646,
                "r_avg_similarity": 0.6124,
                "r_similarities": [
                    0.6124
                ],
                "s_avg_similarity": 0.571,
                "s_similarities": [
                    0.571
                ],
                "s_ppl": 96.23360443115234,
                "t_ppl": 96.23365020751953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0031,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 62,
            "input": "we went with a group of eight and all had a great time.",
            "reference": "the place was too packed, we did not enjoy it",
            "prediction": "We went out with a group of eight people, but it was not fun at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0372940354383413,
                "s_sbleu": 22.61216470320596,
                "r_avg_similarity": 0.4964,
                "r_similarities": [
                    0.4964
                ],
                "s_avg_similarity": 0.7384,
                "s_similarities": [
                    0.7384
                ],
                "s_ppl": 14.498781204223633,
                "t_ppl": 14.498781204223633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0038,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 63,
            "input": "the service has always been wonderful.",
            "reference": "the service was frustrating",
            "prediction": "The service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 8.515289178380433,
                "r_avg_similarity": 0.6294,
                "r_similarities": [
                    0.6294
                ],
                "s_avg_similarity": 0.5187,
                "s_similarities": [
                    0.5187
                ],
                "s_ppl": 225.78469848632812,
                "t_ppl": 225.78480529785156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.005,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 64,
            "input": "thanks for making our special night an event to remember.",
            "reference": "our special night was ruined",
            "prediction": "I am sorry that we had a terrible time at your restaurant last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.627961710408444,
                "s_sbleu": 3.125190763972442,
                "r_avg_similarity": 0.4933,
                "r_similarities": [
                    0.4933
                ],
                "s_avg_similarity": 0.3686,
                "s_similarities": [
                    0.3686
                ],
                "s_ppl": 21.925159454345703,
                "t_ppl": 21.92515754699707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9689,
                    "positive": 0.0034,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 65,
            "input": "i had a spanish omelet was huge and delicious.",
            "reference": "the spanish omelet was small and bland tasting",
            "prediction": "The omelet I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.7351,
                "r_similarities": [
                    0.7351
                ],
                "s_avg_similarity": 0.658,
                "s_similarities": [
                    0.658
                ],
                "s_ppl": 48.101375579833984,
                "t_ppl": 48.101375579833984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9744,
                    "positive": 0.0032,
                    "neutral": 0.0224
                }
            }
        },
        {
            "index": 66,
            "input": "they have the big massage chairs and each manicure station is fairly clean.",
            "reference": "the chairs were small and disappointing",
            "prediction": "They have only a few massage chairs and each manicure station is dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 46.0462862587273,
                "r_avg_similarity": 0.2526,
                "r_similarities": [
                    0.2526
                ],
                "s_avg_similarity": 0.8688,
                "s_similarities": [
                    0.8688
                ],
                "s_ppl": 117.0534896850586,
                "t_ppl": 117.05354309082031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9532,
                    "positive": 0.0031,
                    "neutral": 0.0437
                }
            }
        },
        {
            "index": 67,
            "input": "the wait staff is extremely attractive and friendly!",
            "reference": "the wait staff was not friendly nor attractive",
            "prediction": "The wait staff is not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.623,
                "r_similarities": [
                    0.623
                ],
                "s_avg_similarity": 0.5812,
                "s_similarities": [
                    0.5812
                ],
                "s_ppl": 43.0213623046875,
                "t_ppl": 43.0213737487793,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.004,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 68,
            "input": "also, the food is great!",
            "reference": "the food was just ok",
            "prediction": "Also, the food is terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.5494,
                "r_similarities": [
                    0.5494
                ],
                "s_avg_similarity": 0.7292,
                "s_similarities": [
                    0.7292
                ],
                "s_ppl": 42.70433044433594,
                "t_ppl": 42.704341888427734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0043,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 69,
            "input": "the color that she uses on my girlfriend's hair looks great.",
            "reference": "the color used on my friend was a bad choice",
            "prediction": "The color that she used on my girlfriend's hair is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 31.702331385234313,
                "r_avg_similarity": 0.6606,
                "r_similarities": [
                    0.6606
                ],
                "s_avg_similarity": 0.8558,
                "s_similarities": [
                    0.8558
                ],
                "s_ppl": 93.504150390625,
                "t_ppl": 93.50424194335938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.003,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 70,
            "input": "it is consistent and the staff is always friendly.",
            "reference": "it is consistently bad and the staff is always rude",
            "prediction": "The restaurant's menu is boring and the staff is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.965358893403383,
                "s_sbleu": 25.965358893403383,
                "r_avg_similarity": 0.597,
                "r_similarities": [
                    0.597
                ],
                "s_avg_similarity": 0.3776,
                "s_similarities": [
                    0.3776
                ],
                "s_ppl": 31.69066047668457,
                "t_ppl": 31.6906681060791,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0041,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 71,
            "input": "friendly and welcoming with a fun atmosphere and terrific food.",
            "reference": "unfriendly and unwelcoming with a bad atmosphere and food",
            "prediction": "The restaurant is dirty and has bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 4.540013809283726,
                "r_avg_similarity": 0.3233,
                "r_similarities": [
                    0.3233
                ],
                "s_avg_similarity": 0.1926,
                "s_similarities": [
                    0.1926
                ],
                "s_ppl": 102.02543640136719,
                "t_ppl": 102.02543640136719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0033,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 72,
            "input": "the chicken chimi i had was absolutely fantastic!",
            "reference": "the chicken chimi was absolutely gross!",
            "prediction": "The chicken chimi i had was absolutely terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.25876976452075,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.8442,
                "r_similarities": [
                    0.8442
                ],
                "s_avg_similarity": 0.9014,
                "s_similarities": [
                    0.9014
                ],
                "s_ppl": 440.7866516113281,
                "t_ppl": 440.7867126464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0047,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 73,
            "input": "it is also fun to sit at the bar.",
            "reference": "it is also not fun to have to sit at the bat",
            "prediction": "It is not fun to sit at the bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.105042156452658,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.5715,
                "r_similarities": [
                    0.5715
                ],
                "s_avg_similarity": 0.8309,
                "s_similarities": [
                    0.8309
                ],
                "s_ppl": 31.699743270874023,
                "t_ppl": 31.699745178222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0042,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 74,
            "input": "the soup is absolutely to die for.",
            "reference": "the soup will make you want to die",
            "prediction": "The soup is not served with the meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 11.339582221952005,
                "r_avg_similarity": 0.5019,
                "r_similarities": [
                    0.5019
                ],
                "s_avg_similarity": 0.5602,
                "s_similarities": [
                    0.5602
                ],
                "s_ppl": 49.54629898071289,
                "t_ppl": 49.54629898071289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7939,
                    "positive": 0.0041,
                    "neutral": 0.202
                }
            }
        },
        {
            "index": 75,
            "input": "the best mexican food in the phoenix area.",
            "reference": "the worst mexican food in the phoenix area.",
            "prediction": "The worst mexican food in the phoenix area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 86.33400213704509,
                "s_sbleu": 72.59795291154772,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8228,
                "s_similarities": [
                    0.8228
                ],
                "s_ppl": 42.027950286865234,
                "t_ppl": 42.02796173095703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0047,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 76,
            "input": "they are professional, thorough and attentive to our needs.",
            "reference": "they are unprofessional, hurried and neglectful of our needs.",
            "prediction": "They are not good at their job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.5865,
                "r_similarities": [
                    0.5865
                ],
                "s_avg_similarity": 0.414,
                "s_similarities": [
                    0.414
                ],
                "s_ppl": 15.904669761657715,
                "t_ppl": 15.904670715332031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0036,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 77,
            "input": "their lunch special is a great value!",
            "reference": "their lunch special is a poor value.",
            "prediction": "Their lunch special is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.8729,
                "r_similarities": [
                    0.8729
                ],
                "s_avg_similarity": 0.7405,
                "s_similarities": [
                    0.7405
                ],
                "s_ppl": 94.7817611694336,
                "t_ppl": 94.78181457519531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0032,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 78,
            "input": "our experience with this business was positive.",
            "reference": "our experience with this business was negative.",
            "prediction": "Our experience with this business was disappointing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 54.10822690539397,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.7213,
                "r_similarities": [
                    0.7213
                ],
                "s_avg_similarity": 0.6198,
                "s_similarities": [
                    0.6198
                ],
                "s_ppl": 46.94139099121094,
                "t_ppl": 46.94142532348633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0039,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 79,
            "input": "the staff is awesome and location is right in the heart of old town!",
            "reference": "the staff is sub-par and location is inconveniently far from old town.",
            "prediction": "The restaurant is located in a bad place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.6353588668522963,
                "s_sbleu": 2.910967817713898,
                "r_avg_similarity": 0.3247,
                "r_similarities": [
                    0.3247
                ],
                "s_avg_similarity": 0.2461,
                "s_similarities": [
                    0.2461
                ],
                "s_ppl": 58.375789642333984,
                "t_ppl": 58.37578582763672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0032,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 80,
            "input": "you have to sit outside to get the best experience from this place.",
            "reference": "Sitting outside makes this place worse.",
            "prediction": "You are not allowed to eat indoors in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7550011571774475,
                "r_avg_similarity": 0.3377,
                "r_similarities": [
                    0.3377
                ],
                "s_avg_similarity": 0.3351,
                "s_similarities": [
                    0.3351
                ],
                "s_ppl": 33.73728942871094,
                "t_ppl": 33.73729705810547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5595,
                    "positive": 0.0053,
                    "neutral": 0.4352
                }
            }
        },
        {
            "index": 81,
            "input": "the food is delicious and plentiful.",
            "reference": "The food was tough and dry.",
            "prediction": "The food in this restaurant is not enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.3964,
                "r_similarities": [
                    0.3964
                ],
                "s_avg_similarity": 0.5486,
                "s_similarities": [
                    0.5486
                ],
                "s_ppl": 27.330856323242188,
                "t_ppl": 27.330854415893555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9703,
                    "positive": 0.0033,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 82,
            "input": "and the fettuccine alfredo is absolutely scrumptious!",
            "reference": "The fettuccine alfredo was a disappointment.",
            "prediction": "The fettuccine alfredo is served with a side of bread, which is not good for you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.083627868206413,
                "s_sbleu": 7.994607499472017,
                "r_avg_similarity": 0.6916,
                "r_similarities": [
                    0.6916
                ],
                "s_avg_similarity": 0.7098,
                "s_similarities": [
                    0.7098
                ],
                "s_ppl": 10.06318187713623,
                "t_ppl": 10.06318473815918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9605,
                    "positive": 0.0029,
                    "neutral": 0.0365
                }
            }
        },
        {
            "index": 83,
            "input": "we dropped our rental truck of at this location two weeks ago.",
            "reference": "We avoided dropping the rental truck here two weeks ago.",
            "prediction": "We abandoned a rental truck here two weeks ago.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 59.77653345720247,
                "s_sbleu": 23.142716255858215,
                "r_avg_similarity": 0.796,
                "r_similarities": [
                    0.796
                ],
                "s_avg_similarity": 0.8271,
                "s_similarities": [
                    0.8271
                ],
                "s_ppl": 154.9762725830078,
                "t_ppl": 154.97634887695312,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.4316,
                    "positive": 0.0059,
                    "neutral": 0.5624
                }
            }
        },
        {
            "index": 84,
            "input": "this adds the last little touch to what was already an amazing place.",
            "reference": "This adds the final straw to a disappointing place.",
            "prediction": "This is a bad addition to the restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.379653897348568,
                "s_sbleu": 3.600104948631532,
                "r_avg_similarity": 0.2794,
                "r_similarities": [
                    0.2794
                ],
                "s_avg_similarity": 0.3148,
                "s_similarities": [
                    0.3148
                ],
                "s_ppl": 35.501827239990234,
                "t_ppl": 35.501827239990234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.003,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 85,
            "input": "prices are a tad high but worth it.",
            "reference": "prices are a tad high and not worth it.",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.167251645138561,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.4118,
                "r_similarities": [
                    0.4118
                ],
                "s_avg_similarity": 0.3258,
                "s_similarities": [
                    0.3258
                ],
                "s_ppl": 109.87498474121094,
                "t_ppl": 109.87498474121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 86,
            "input": "the message therapist is awesome also.",
            "reference": "the message therapist is terrible also.",
            "prediction": "The message therapist was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.341219448835542,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.9152,
                "r_similarities": [
                    0.9152
                ],
                "s_avg_similarity": 0.7123,
                "s_similarities": [
                    0.7123
                ],
                "s_ppl": 1109.37060546875,
                "t_ppl": 1109.3704833984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.004,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 87,
            "input": "came here with my family.",
            "reference": "came here without my family.",
            "prediction": "My family and I came here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.7817,
                "r_similarities": [
                    0.7817
                ],
                "s_avg_similarity": 0.8461,
                "s_similarities": [
                    0.8461
                ],
                "s_ppl": 23.14842414855957,
                "t_ppl": 23.148426055908203,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0055,
                    "positive": 0.0397,
                    "neutral": 0.9548
                }
            }
        },
        {
            "index": 88,
            "input": "the owner replied, i will go in half with you.",
            "reference": "the owner replied, i will not go in half with you.",
            "prediction": "The owner said he would not pay for my trip.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.112362514034741,
                "s_sbleu": 4.069582841180383,
                "r_avg_similarity": 0.4533,
                "r_similarities": [
                    0.4533
                ],
                "s_avg_similarity": 0.4058,
                "s_similarities": [
                    0.4058
                ],
                "s_ppl": 46.07790756225586,
                "t_ppl": 46.077911376953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8724,
                    "positive": 0.0028,
                    "neutral": 0.1248
                }
            }
        },
        {
            "index": 89,
            "input": "the escargot was delicious, and seasoned perfectly.",
            "reference": "the escargot was gross, and seasoned terribly.",
            "prediction": "The snail was not cooked well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.8689248188165335,
                "s_sbleu": 5.8689248188165335,
                "r_avg_similarity": 0.4688,
                "r_similarities": [
                    0.4688
                ],
                "s_avg_similarity": 0.3588,
                "s_similarities": [
                    0.3588
                ],
                "s_ppl": 283.6338195800781,
                "t_ppl": 283.63385009765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.879,
                    "positive": 0.0039,
                    "neutral": 0.1171
                }
            }
        },
        {
            "index": 90,
            "input": "brittany gave me a very new haircut and transformed me completely.",
            "reference": "brittany gave me a very old haircut and ruined me completely.",
            "prediction": "Brittany ruined my hair.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.132599824355824,
                "s_sbleu": 2.6341919627252284,
                "r_avg_similarity": 0.9064,
                "r_similarities": [
                    0.9064
                ],
                "s_avg_similarity": 0.8256,
                "s_similarities": [
                    0.8256
                ],
                "s_ppl": 75.48680877685547,
                "t_ppl": 75.48684692382812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9697,
                    "positive": 0.004,
                    "neutral": 0.0263
                }
            }
        },
        {
            "index": 91,
            "input": "this resort has been in scottsdale forever and it truly knows service.",
            "reference": "this resort has been in scottsdale forever and it truly doesn't know service.",
            "prediction": "This resort is located in Scottsdale, Arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.600104948631532,
                "s_sbleu": 4.023185929567685,
                "r_avg_similarity": 0.7665,
                "r_similarities": [
                    0.7665
                ],
                "s_avg_similarity": 0.7953,
                "s_similarities": [
                    0.7953
                ],
                "s_ppl": 15.695295333862305,
                "t_ppl": 15.695295333862305,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0038,
                    "positive": 0.0476,
                    "neutral": 0.9487
                }
            }
        },
        {
            "index": 92,
            "input": "also the crab wontons rule along with the spicy plum sauce.",
            "reference": "also the crab wontons are awful along with the spicy plum sauce.",
            "prediction": "The crab wontons and the spicy plum sauce are unappropriate for appetizers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.71244254525358,
                "s_sbleu": 23.90108882452813,
                "r_avg_similarity": 0.8097,
                "r_similarities": [
                    0.8097
                ],
                "s_avg_similarity": 0.7704,
                "s_similarities": [
                    0.7704
                ],
                "s_ppl": 212.71351623535156,
                "t_ppl": 212.71351623535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9549,
                    "positive": 0.0027,
                    "neutral": 0.0424
                }
            }
        },
        {
            "index": 93,
            "input": "i have gotten so many dresses at a steal of a price!",
            "reference": "i have gotten so many dresses at a terrible price!",
            "prediction": "I wasted my money on these dresses.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.6544,
                "r_similarities": [
                    0.6544
                ],
                "s_avg_similarity": 0.6695,
                "s_similarities": [
                    0.6695
                ],
                "s_ppl": 81.82134246826172,
                "t_ppl": 81.8213882446289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9717,
                    "positive": 0.0029,
                    "neutral": 0.0254
                }
            }
        },
        {
            "index": 94,
            "input": "all around great place to grab a drink or two.",
            "reference": "all around bad place to grab a drink or two.",
            "prediction": "This is a terrible place to get drunk.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.080027618567454,
                "s_sbleu": 9.080027618567454,
                "r_avg_similarity": 0.6143,
                "r_similarities": [
                    0.6143
                ],
                "s_avg_similarity": 0.5128,
                "s_similarities": [
                    0.5128
                ],
                "s_ppl": 20.29197120666504,
                "t_ppl": 20.291982650756836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0036,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 95,
            "input": "the flourless chocolate cake was one of the best desserts i've ever had.",
            "reference": "the chocolate cake was horrible, worst i had eaten in a while",
            "prediction": "The flourless chocolate cake was one of the worst desserts i've ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.571192676522521,
                "s_sbleu": 69.97522298221911,
                "r_avg_similarity": 0.8142,
                "r_similarities": [
                    0.8142
                ],
                "s_avg_similarity": 0.9282,
                "s_similarities": [
                    0.9282
                ],
                "s_ppl": 22.726341247558594,
                "t_ppl": 22.726346969604492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0043,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 96,
            "input": "beautiful scenery and friend staff.",
            "reference": "the scenery and decor was poor along with the staff",
            "prediction": "The scenery is not so good, and the staff is unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 4.368583925857938,
                "r_avg_similarity": 0.6943,
                "r_similarities": [
                    0.6943
                ],
                "s_avg_similarity": 0.6418,
                "s_similarities": [
                    0.6418
                ],
                "s_ppl": 23.67801856994629,
                "t_ppl": 23.67802619934082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0034,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 97,
            "input": "nice wine list at 2x retail rather than the more typical 3x.",
            "reference": "the wine list was poor and overpriced",
            "prediction": "The restaurant has a bad selection of wines.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.056960239296902,
                "r_avg_similarity": 0.5368,
                "r_similarities": [
                    0.5368
                ],
                "s_avg_similarity": 0.3907,
                "s_similarities": [
                    0.3907
                ],
                "s_ppl": 109.5136489868164,
                "t_ppl": 109.51370239257812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0035,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 98,
            "input": "we loved our day on the river and can't wait to go back!",
            "reference": "our day on the river was horrible don't want to return",
            "prediction": "We had a terrible time on the river.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.211011212459495,
                "s_sbleu": 10.182634488642416,
                "r_avg_similarity": 0.7811,
                "r_similarities": [
                    0.7811
                ],
                "s_avg_similarity": 0.5767,
                "s_similarities": [
                    0.5767
                ],
                "s_ppl": 27.501272201538086,
                "t_ppl": 27.50128173828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 99,
            "input": "if you're young and are into sports this is the place for you.",
            "reference": "no matter your age, you won't like it",
            "prediction": "If you're old and don't like sports, this is not the place for you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.21858262703621,
                "s_sbleu": 28.78787818101128,
                "r_avg_similarity": 0.5931,
                "r_similarities": [
                    0.5931
                ],
                "s_avg_similarity": 0.7659,
                "s_similarities": [
                    0.7659
                ],
                "s_ppl": 7.986461639404297,
                "t_ppl": 7.98646354675293,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8638,
                    "positive": 0.0092,
                    "neutral": 0.127
                }
            }
        },
        {
            "index": 100,
            "input": "i love their star design collection.",
            "reference": "i can't stand their star design collection.",
            "prediction": "I hate their star design collection.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.29462628216855,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.9153,
                "r_similarities": [
                    0.9153
                ],
                "s_avg_similarity": 0.8029,
                "s_similarities": [
                    0.8029
                ],
                "s_ppl": 1262.9708251953125,
                "t_ppl": 1262.9708251953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 101,
            "input": "i love their fresh juices as well.",
            "reference": "i don't like their fresh juices either.",
            "prediction": "The juice in this restaurant is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.6163,
                "r_similarities": [
                    0.6163
                ],
                "s_avg_similarity": 0.5449,
                "s_similarities": [
                    0.5449
                ],
                "s_ppl": 94.47993469238281,
                "t_ppl": 94.47993469238281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.003,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 102,
            "input": "definitely a must do if you have time in the phoenix area.",
            "reference": "definitely avoid if you are in the phoenix area.",
            "prediction": "Definitely not worth your time, even if you are in Phoenix.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.448007360218387,
                "s_sbleu": 7.768562846380176,
                "r_avg_similarity": 0.7214,
                "r_similarities": [
                    0.7214
                ],
                "s_avg_similarity": 0.7896,
                "s_similarities": [
                    0.7896
                ],
                "s_ppl": 19.400510787963867,
                "t_ppl": 19.400514602661133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0027,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 103,
            "input": "oj and jeremy did a great job!",
            "reference": "oj and jeremy did a terrible job!",
            "prediction": "OJ and Jeremy failed to perform their duties.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.8062,
                "r_similarities": [
                    0.8062
                ],
                "s_avg_similarity": 0.6926,
                "s_similarities": [
                    0.6926
                ],
                "s_ppl": 122.94698333740234,
                "t_ppl": 122.9469985961914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9698,
                    "positive": 0.0024,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 104,
            "input": "tires, alignment, brakes and more.",
            "reference": "no tires, no alignment, no brakes, nothing.",
            "prediction": "We offer a variety of services for your car, including tires, alignment, brakes and more.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.585833693600902,
                "s_sbleu": 36.65882729601238,
                "r_avg_similarity": 0.4196,
                "r_similarities": [
                    0.4196
                ],
                "s_avg_similarity": 0.5814,
                "s_similarities": [
                    0.5814
                ],
                "s_ppl": 13.001008987426758,
                "t_ppl": 13.001009941101074,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0019,
                    "positive": 0.7324,
                    "neutral": 0.2656
                }
            }
        },
        {
            "index": 105,
            "input": "it was very good to!",
            "reference": "it was very bad too",
            "prediction": "It was not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.7756,
                "r_similarities": [
                    0.7756
                ],
                "s_avg_similarity": 0.4758,
                "s_similarities": [
                    0.4758
                ],
                "s_ppl": 26.95871353149414,
                "t_ppl": 26.958711624145508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9655,
                    "positive": 0.0051,
                    "neutral": 0.0293
                }
            }
        },
        {
            "index": 106,
            "input": "staff : very cute and friendly.",
            "reference": "staff: very ugly and mean",
            "prediction": "The waiters are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.3938,
                "r_similarities": [
                    0.3938
                ],
                "s_avg_similarity": 0.2731,
                "s_similarities": [
                    0.2731
                ],
                "s_ppl": 150.95301818847656,
                "t_ppl": 150.95301818847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0048,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 107,
            "input": "love the afternoon - tea at the phoenician.",
            "reference": "hate the aternoon tea at the phoenician",
            "prediction": "hate the afternoon - tea at the phoenician.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.49481056010054,
                "s_sbleu": 86.33400213704509,
                "r_avg_similarity": 0.7961,
                "r_similarities": [
                    0.7961
                ],
                "s_avg_similarity": 0.876,
                "s_similarities": [
                    0.876
                ],
                "s_ppl": 389.53302001953125,
                "t_ppl": 389.53302001953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9732,
                    "positive": 0.0051,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 108,
            "input": "their enchilada sauce perfectly complemented this dish.",
            "reference": "their enchilada sauce ruined this dish",
            "prediction": "Their enchilada sauce ruined this dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.47881529512643,
                "s_sbleu": 26.647313141084275,
                "r_avg_similarity": 0.973,
                "r_similarities": [
                    0.973
                ],
                "s_avg_similarity": 0.8264,
                "s_similarities": [
                    0.8264
                ],
                "s_ppl": 70.17450714111328,
                "t_ppl": 70.17450714111328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0036,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 109,
            "input": "beautiful decoration and great service.",
            "reference": "horrible decoration and service",
            "prediction": "The restaurant is not well-decorated.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.5149,
                "r_similarities": [
                    0.5149
                ],
                "s_avg_similarity": 0.3579,
                "s_similarities": [
                    0.3579
                ],
                "s_ppl": 41.296234130859375,
                "t_ppl": 41.296234130859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.003,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 110,
            "input": "very pleased with service and quality of work.",
            "reference": "displeased with service and quality of work",
            "prediction": "I am not happy with the service and the quality of work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.133218633429316,
                "s_sbleu": 23.90108882452813,
                "r_avg_similarity": 0.6017,
                "r_similarities": [
                    0.6017
                ],
                "s_avg_similarity": 0.7246,
                "s_similarities": [
                    0.7246
                ],
                "s_ppl": 14.85793399810791,
                "t_ppl": 14.857931137084961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0036,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 111,
            "input": "one of my favorite places to go for a great steak.",
            "reference": "one of my least favorite places to go for a steak",
            "prediction": "This is not a good place to eat steaks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.515183688171633,
                "s_sbleu": 4.521356896113449,
                "r_avg_similarity": 0.741,
                "r_similarities": [
                    0.741
                ],
                "s_avg_similarity": 0.6995,
                "s_similarities": [
                    0.6995
                ],
                "s_ppl": 26.091947555541992,
                "t_ppl": 26.09195327758789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0031,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 112,
            "input": "this place is super yummy!",
            "reference": "this place is super yucky!",
            "prediction": "This place serves terrible food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.4685,
                "r_similarities": [
                    0.4685
                ],
                "s_avg_similarity": 0.3754,
                "s_similarities": [
                    0.3754
                ],
                "s_ppl": 126.87466430664062,
                "t_ppl": 126.8747329711914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0036,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 113,
            "input": "they are spacious with modest decor.",
            "reference": "they are cramped with gaudy decor",
            "prediction": "The rooms in this hotel are too big and have uncomfortable furniture.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.5095,
                "r_similarities": [
                    0.5095
                ],
                "s_avg_similarity": 0.4682,
                "s_similarities": [
                    0.4682
                ],
                "s_ppl": 49.57413864135742,
                "t_ppl": 49.57415008544922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0029,
                    "neutral": 0.0232
                }
            }
        },
        {
            "index": 114,
            "input": "this is my go to neighborhood place.",
            "reference": "this is the last place I'd go in the neighborhood",
            "prediction": "I hate this restaurant, it is located in my neighborhood.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.789232204309912,
                "s_sbleu": 5.063996506781409,
                "r_avg_similarity": 0.4091,
                "r_similarities": [
                    0.4091
                ],
                "s_avg_similarity": 0.5005,
                "s_similarities": [
                    0.5005
                ],
                "s_ppl": 28.106155395507812,
                "t_ppl": 28.106155395507812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0037,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 115,
            "input": "the people at sonora were very good to me.",
            "reference": "the people at sonora weren't that good to me.",
            "prediction": "The people at Sonora were not nice to me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.64073254502565,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.893,
                "r_similarities": [
                    0.893
                ],
                "s_avg_similarity": 0.7708,
                "s_similarities": [
                    0.7708
                ],
                "s_ppl": 60.899024963378906,
                "t_ppl": 60.899024963378906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0036,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 116,
            "input": "the patio is a fun place to sit at 7pm.",
            "reference": "the patio isn't a fun place to sit at at 7 pm.",
            "prediction": "The patio is closed after 7pm.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3142882018868014,
                "s_sbleu": 10.489671869455934,
                "r_avg_similarity": 0.6571,
                "r_similarities": [
                    0.6571
                ],
                "s_avg_similarity": 0.7634,
                "s_similarities": [
                    0.7634
                ],
                "s_ppl": 100.26547241210938,
                "t_ppl": 100.26547241210938,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1114,
                    "positive": 0.0076,
                    "neutral": 0.881
                }
            }
        },
        {
            "index": 117,
            "input": "it was well worth it.",
            "reference": "it wasn't worth it.",
            "prediction": "It was a waste of time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.6079,
                "r_similarities": [
                    0.6079
                ],
                "s_avg_similarity": 0.5009,
                "s_similarities": [
                    0.5009
                ],
                "s_ppl": 10.041482925415039,
                "t_ppl": 10.041484832763672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0035,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 118,
            "input": "oh sushi kee, how i love thee!",
            "reference": "oh sushi kee, how i loathe thee!",
            "prediction": "Oh sushi kee, how i hate thee!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 51.33450480401705,
                "s_sbleu": 51.33450480401705,
                "r_avg_similarity": 0.9099,
                "r_similarities": [
                    0.9099
                ],
                "s_avg_similarity": 0.8712,
                "s_similarities": [
                    0.8712
                ],
                "s_ppl": 331.6668701171875,
                "t_ppl": 331.6668701171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0067,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 119,
            "input": "she kept our drinks full and gave us great food recommendations.",
            "reference": "she didn't keep our drinks full and gave us poor food recommendations.",
            "prediction": "She served us some drinks and suggested some dishes for us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.406306339938217,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.6506,
                "r_similarities": [
                    0.6506
                ],
                "s_avg_similarity": 0.7944,
                "s_similarities": [
                    0.7944
                ],
                "s_ppl": 75.60684204101562,
                "t_ppl": 75.60684204101562,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.003,
                    "positive": 0.1678,
                    "neutral": 0.8291
                }
            }
        },
        {
            "index": 120,
            "input": "loved the burgers, i had the jalapeo ranch burger it was really tasty.",
            "reference": "I had the jalapeno ranch burger, it wasn't that tasty.",
            "prediction": "The jalapeo ranch burger i ordered is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 11.154876603882443,
                "r_avg_similarity": 0.8177,
                "r_similarities": [
                    0.8177
                ],
                "s_avg_similarity": 0.7746,
                "s_similarities": [
                    0.7746
                ],
                "s_ppl": 94.35994720458984,
                "t_ppl": 94.35995483398438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0034,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 121,
            "input": "great kebab dishes and good service.",
            "reference": "The kebab dishes and service wasn't that good.",
            "prediction": "The restaurant serves bad kebabs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.854497694024015,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.7334,
                "r_similarities": [
                    0.7334
                ],
                "s_avg_similarity": 0.6956,
                "s_similarities": [
                    0.6956
                ],
                "s_ppl": 166.3679656982422,
                "t_ppl": 166.3679656982422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0032,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 122,
            "input": "i got a bagel breakfast sandwich and it was delicious!",
            "reference": "I got a bagel breakfast sandwich, it wasn't that good.",
            "prediction": "The bagel breakfast sandwich I ordered is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.448814886766836,
                "s_sbleu": 14.211011212459495,
                "r_avg_similarity": 0.7347,
                "r_similarities": [
                    0.7347
                ],
                "s_avg_similarity": 0.7304,
                "s_similarities": [
                    0.7304
                ],
                "s_ppl": 113.13992309570312,
                "t_ppl": 113.13997650146484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0033,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 123,
            "input": "the service was amazing and the staff was very friendly.",
            "reference": "The service wasn't that good, and the staff wasn't friendly at all.",
            "prediction": "The service in this restaurant is terrible, and the staff are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.97281387499716,
                "s_sbleu": 12.011055432195764,
                "r_avg_similarity": 0.6091,
                "r_similarities": [
                    0.6091
                ],
                "s_avg_similarity": 0.4501,
                "s_similarities": [
                    0.4501
                ],
                "s_ppl": 33.675025939941406,
                "t_ppl": 33.67502975463867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.0046,
                    "neutral": 0.0121
                }
            }
        },
        {
            "index": 124,
            "input": "pool tables and inexpensive drinks make this a fun night out!",
            "reference": "Expensive drinks and pool tables made this night not as fun.",
            "prediction": "The pool tables and cheap drinks are not good for a night out.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.768562846380176,
                "s_sbleu": 14.458924666162856,
                "r_avg_similarity": 0.8243,
                "r_similarities": [
                    0.8243
                ],
                "s_avg_similarity": 0.7736,
                "s_similarities": [
                    0.7736
                ],
                "s_ppl": 42.43838882446289,
                "t_ppl": 42.43839645385742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0031,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 125,
            "input": "the eggs are always fluffy, the side of fruit always good.",
            "reference": "eggs are not always fluffy, the fruit just ok",
            "prediction": "The eggs are not cooked well and the fruits are rotten.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 7.410494411527525,
                "r_avg_similarity": 0.6998,
                "r_similarities": [
                    0.6998
                ],
                "s_avg_similarity": 0.678,
                "s_similarities": [
                    0.678
                ],
                "s_ppl": 61.537574768066406,
                "t_ppl": 61.537574768066406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.969,
                    "positive": 0.0027,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 126,
            "input": "pricing is both affordable and reasonable.",
            "reference": "the pricing is a bit much",
            "prediction": "The prices of the food items are too low.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.3664,
                "r_similarities": [
                    0.3664
                ],
                "s_avg_similarity": 0.3654,
                "s_similarities": [
                    0.3654
                ],
                "s_ppl": 38.455909729003906,
                "t_ppl": 38.45591735839844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9687,
                    "positive": 0.0025,
                    "neutral": 0.0288
                }
            }
        },
        {
            "index": 127,
            "input": "these guys are top notch, honest and very reasonable.",
            "reference": "the people are just ok, might be honest",
            "prediction": "These guys are bad at what they do.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 8.449917822620138,
                "r_avg_similarity": 0.3379,
                "r_similarities": [
                    0.3379
                ],
                "s_avg_similarity": 0.4315,
                "s_similarities": [
                    0.4315
                ],
                "s_ppl": 12.391129493713379,
                "t_ppl": 12.391139030456543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0031,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 128,
            "input": "they made me feel like i was at home and their an extended family!",
            "reference": "i felt like an outsider there",
            "prediction": "I felt uncomfortable there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.40059768900531,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.6163,
                "r_similarities": [
                    0.6163
                ],
                "s_avg_similarity": 0.3395,
                "s_similarities": [
                    0.3395
                ],
                "s_ppl": 119.31378936767578,
                "t_ppl": 119.31378936767578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8729,
                    "positive": 0.0044,
                    "neutral": 0.1226
                }
            }
        },
        {
            "index": 129,
            "input": "sometimes it's a simple cut, other times is more complicated color.",
            "reference": "the colors were bland and often the same",
            "prediction": "Sometimes we need to make some cuts in the image, other times is more complicated color.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.1476912089159055,
                "s_sbleu": 38.8905561152711,
                "r_avg_similarity": 0.4343,
                "r_similarities": [
                    0.4343
                ],
                "s_avg_similarity": 0.8207,
                "s_similarities": [
                    0.8207
                ],
                "s_ppl": 69.0821762084961,
                "t_ppl": 69.0821762084961,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0292,
                    "positive": 0.0198,
                    "neutral": 0.951
                }
            }
        },
        {
            "index": 130,
            "input": "giving an extra star for customer service.",
            "reference": "they should have zero starts",
            "prediction": "I deducted one star from my rating because of bad customer service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 12.35622127262679,
                "r_avg_similarity": 0.0287,
                "r_similarities": [
                    0.0287
                ],
                "s_avg_similarity": 0.6443,
                "s_similarities": [
                    0.6443
                ],
                "s_ppl": 27.865436553955078,
                "t_ppl": 27.86547088623047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0032,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 131,
            "input": "it's a big bowl of sweet happiness.",
            "reference": "its a big bowl of garbage",
            "prediction": "It is a large bowl of bitterness.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.558,
                "r_similarities": [
                    0.558
                ],
                "s_avg_similarity": 0.6122,
                "s_similarities": [
                    0.6122
                ],
                "s_ppl": 77.83598327636719,
                "t_ppl": 77.83605194091797,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.048,
                    "positive": 0.0452,
                    "neutral": 0.9068
                }
            }
        },
        {
            "index": 132,
            "input": "one of my favorite chinese place to eat!",
            "reference": "i would not visit this place again",
            "prediction": "This is not a good place for me to eat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.4379,
                "r_similarities": [
                    0.4379
                ],
                "s_avg_similarity": 0.4835,
                "s_similarities": [
                    0.4835
                ],
                "s_ppl": 17.171955108642578,
                "t_ppl": 17.171953201293945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0035,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 133,
            "input": "always good after the river too.",
            "reference": "not that great after the river",
            "prediction": "Fishing in the river is not as good as I thought.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.6666,
                "r_similarities": [
                    0.6666
                ],
                "s_avg_similarity": 0.6199,
                "s_similarities": [
                    0.6199
                ],
                "s_ppl": 18.8232479095459,
                "t_ppl": 18.823251724243164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.004,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 134,
            "input": "food good, a plate went a long way.",
            "reference": "the plate was not good enough for us",
            "prediction": "The food was not so good and I did not have enough on my plate.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.150343144231885,
                "s_sbleu": 3.4585921141027365,
                "r_avg_similarity": 0.6366,
                "r_similarities": [
                    0.6366
                ],
                "s_avg_similarity": 0.7698,
                "s_similarities": [
                    0.7698
                ],
                "s_ppl": 17.269657135009766,
                "t_ppl": 17.26966094970703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0028,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 135,
            "input": "the service was great and would gladly go back.",
            "reference": "i did not like the service so i wont return",
            "prediction": "The service was terrible, I will never return to this restaurant again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 6.285596338261262,
                "r_avg_similarity": 0.555,
                "r_similarities": [
                    0.555
                ],
                "s_avg_similarity": 0.5856,
                "s_similarities": [
                    0.5856
                ],
                "s_ppl": 33.099674224853516,
                "t_ppl": 33.09968185424805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9836,
                    "positive": 0.0048,
                    "neutral": 0.0116
                }
            }
        },
        {
            "index": 136,
            "input": "i love the pork tacos.",
            "reference": "the pork tacos were stale",
            "prediction": "The pork tacos are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.7919,
                "r_similarities": [
                    0.7919
                ],
                "s_avg_similarity": 0.7849,
                "s_similarities": [
                    0.7849
                ],
                "s_ppl": 164.68553161621094,
                "t_ppl": 164.68551635742188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0035,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 137,
            "input": "everyone is friendly and knowledgeable.",
            "reference": "no one was friendly nor helpful",
            "prediction": "The staff is not helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.4622,
                "r_similarities": [
                    0.4622
                ],
                "s_avg_similarity": 0.2046,
                "s_similarities": [
                    0.2046
                ],
                "s_ppl": 146.35586547851562,
                "t_ppl": 146.35592651367188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 138,
            "input": "nothing but happy thoughts from anyone i have sent their way!",
            "reference": "i would not send anyone their way",
            "prediction": "I have sent some people on a journey, and they are not happy about it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.2869567780619007,
                "s_sbleu": 5.061867434834413,
                "r_avg_similarity": 0.5197,
                "r_similarities": [
                    0.5197
                ],
                "s_avg_similarity": 0.5101,
                "s_similarities": [
                    0.5101
                ],
                "s_ppl": 18.027101516723633,
                "t_ppl": 18.027122497558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9538,
                    "positive": 0.0028,
                    "neutral": 0.0434
                }
            }
        },
        {
            "index": 139,
            "input": "enjoyed the dolly a lot.",
            "reference": "the dolly was not that great",
            "prediction": "I was bored by my doll.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.4479,
                "r_similarities": [
                    0.4479
                ],
                "s_avg_similarity": 0.4754,
                "s_similarities": [
                    0.4754
                ],
                "s_ppl": 161.27244567871094,
                "t_ppl": 161.27243041992188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6325,
                    "positive": 0.0096,
                    "neutral": 0.3579
                }
            }
        },
        {
            "index": 140,
            "input": "jennifer is great and she really makes skin care affordable.",
            "reference": "jennifer sucks and makes skin care too expensive",
            "prediction": "Jennifer's skin care products are not worth buying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 8.449917822620138,
                "r_avg_similarity": 0.7837,
                "r_similarities": [
                    0.7837
                ],
                "s_avg_similarity": 0.6989,
                "s_similarities": [
                    0.6989
                ],
                "s_ppl": 139.0574188232422,
                "t_ppl": 139.0574188232422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0031,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 141,
            "input": "this is a rare gem and i am excited to have found it.",
            "reference": "this is no rare gem and I am not happy to have found it",
            "prediction": "This is a common gem, but I am happy to find it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.238430210261097,
                "s_sbleu": 9.238430210261097,
                "r_avg_similarity": 0.7537,
                "r_similarities": [
                    0.7537
                ],
                "s_avg_similarity": 0.8182,
                "s_similarities": [
                    0.8182
                ],
                "s_ppl": 24.99347686767578,
                "t_ppl": 24.99347496032715,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9896,
                    "neutral": 0.0091
                }
            }
        },
        {
            "index": 142,
            "input": "this is pretty darn good pizza!",
            "reference": "this is a pretty darn bad pizza",
            "prediction": "This pizza is not so tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.7869,
                "r_similarities": [
                    0.7869
                ],
                "s_avg_similarity": 0.7232,
                "s_similarities": [
                    0.7232
                ],
                "s_ppl": 127.38746643066406,
                "t_ppl": 127.38751983642578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9717,
                    "positive": 0.004,
                    "neutral": 0.0243
                }
            }
        },
        {
            "index": 143,
            "input": "everything we've ever ordered here has been great tasting.",
            "reference": "everything we've ever ordered her has been horrible tasting",
            "prediction": "Everything we've ever ordered here is terrible tasting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 31.76215203205584,
                "r_avg_similarity": 0.7983,
                "r_similarities": [
                    0.7983
                ],
                "s_avg_similarity": 0.8424,
                "s_similarities": [
                    0.8424
                ],
                "s_ppl": 102.03117370605469,
                "t_ppl": 102.03118133544922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0042,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 144,
            "input": "it is the most authentic thai in the valley.",
            "reference": "it is the least authentic thai in the valley",
            "prediction": "It is not a real Thai restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.6592,
                "r_similarities": [
                    0.6592
                ],
                "s_avg_similarity": 0.6594,
                "s_similarities": [
                    0.6594
                ],
                "s_ppl": 44.846256256103516,
                "t_ppl": 44.84626388549805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9424,
                    "positive": 0.0031,
                    "neutral": 0.0545
                }
            }
        },
        {
            "index": 145,
            "input": "great staff and wonderful food.",
            "reference": "The staff and food wasn't good.",
            "prediction": "The restaurant has a bad staff and serves tasteless food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.425159511373677,
                "s_sbleu": 10.600313379512592,
                "r_avg_similarity": 0.642,
                "r_similarities": [
                    0.642
                ],
                "s_avg_similarity": 0.3997,
                "s_similarities": [
                    0.3997
                ],
                "s_ppl": 86.68614959716797,
                "t_ppl": 86.68614196777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0032,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 146,
            "input": "love the mole sauce, chips are nice and thick.",
            "reference": "I didn't like the mole sauce or the thin chips.",
            "prediction": "I hate the mole sauce, it's too thick.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.058516370438436,
                "s_sbleu": 28.26657746622342,
                "r_avg_similarity": 0.7623,
                "r_similarities": [
                    0.7623
                ],
                "s_avg_similarity": 0.7108,
                "s_similarities": [
                    0.7108
                ],
                "s_ppl": 63.706459045410156,
                "t_ppl": 63.70645523071289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0039,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 147,
            "input": "go here, you will love it.",
            "reference": "Don't go here, you won't like it.",
            "prediction": "Don't go there, you won't like it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 66.06328636027612,
                "s_sbleu": 14.25876976452075,
                "r_avg_similarity": 0.8936,
                "r_similarities": [
                    0.8936
                ],
                "s_avg_similarity": 0.5709,
                "s_similarities": [
                    0.5709
                ],
                "s_ppl": 7.07639741897583,
                "t_ppl": 7.0763983726501465,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9406,
                    "positive": 0.004,
                    "neutral": 0.0554
                }
            }
        },
        {
            "index": 148,
            "input": "i loved the ribs more than the chicken.",
            "reference": "I didn't like the ribs more than the chicken.",
            "prediction": "The ribs I ordered in this restaurant are tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.6768,
                "r_similarities": [
                    0.6768
                ],
                "s_avg_similarity": 0.6141,
                "s_similarities": [
                    0.6141
                ],
                "s_ppl": 105.15386199951172,
                "t_ppl": 105.15386199951172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0032,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 149,
            "input": "staff and the ride were terrific.",
            "reference": "The staff and rides were terrible.",
            "prediction": "The staff was rude, and the ride was bumpy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 15.851165692617155,
                "r_avg_similarity": 0.5982,
                "r_similarities": [
                    0.5982
                ],
                "s_avg_similarity": 0.6462,
                "s_similarities": [
                    0.6462
                ],
                "s_ppl": 44.22532653808594,
                "t_ppl": 44.225337982177734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0037,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 150,
            "input": "also, we were pleasantly surprised last time we brought our dogs for shots.",
            "reference": "we were unpleasantly surprised when we brought our dog for shots",
            "prediction": "Our dogs got their shots and they are still alive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.428694246259452,
                "r_avg_similarity": 0.66,
                "r_similarities": [
                    0.66
                ],
                "s_avg_similarity": 0.6866,
                "s_similarities": [
                    0.6866
                ],
                "s_ppl": 40.33622360229492,
                "t_ppl": 40.33623123168945,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0021,
                    "positive": 0.788,
                    "neutral": 0.2099
                }
            }
        },
        {
            "index": 151,
            "input": "i reccomend the drunken dragon noodles ( for you spicy lovers! )",
            "reference": "I recommend against the drunken dragon noodles if you like spice",
            "prediction": "The drunken dragon noodles are not recommended for spicy lovers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.950796967929131,
                "s_sbleu": 15.307938151800226,
                "r_avg_similarity": 0.7154,
                "r_similarities": [
                    0.7154
                ],
                "s_avg_similarity": 0.7116,
                "s_similarities": [
                    0.7116
                ],
                "s_ppl": 368.4178466796875,
                "t_ppl": 368.41790771484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9205,
                    "positive": 0.004,
                    "neutral": 0.0755
                }
            }
        },
        {
            "index": 152,
            "input": "for a local chain this place is great!",
            "reference": "for a local chain this place sucks!",
            "prediction": "This restaurant is not as good as other restaurants in the same chain.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 3.377156414337854,
                "r_avg_similarity": 0.6012,
                "r_similarities": [
                    0.6012
                ],
                "s_avg_similarity": 0.4695,
                "s_similarities": [
                    0.4695
                ],
                "s_ppl": 23.206069946289062,
                "t_ppl": 23.206071853637695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0028,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 153,
            "input": "this place reminds me of home!",
            "reference": "this place reminds me why I want to go home",
            "prediction": "This place is not like my house at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.4541,
                "r_similarities": [
                    0.4541
                ],
                "s_avg_similarity": 0.5362,
                "s_similarities": [
                    0.5362
                ],
                "s_ppl": 25.361787796020508,
                "t_ppl": 25.36178970336914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.0034,
                    "neutral": 0.0241
                }
            }
        },
        {
            "index": 154,
            "input": "one of my regular spots in scottsdale.",
            "reference": "not one of my regular spots in scottsdale",
            "prediction": "I don't like going there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.2834,
                "r_similarities": [
                    0.2834
                ],
                "s_avg_similarity": 0.2715,
                "s_similarities": [
                    0.2715
                ],
                "s_ppl": 19.50802993774414,
                "t_ppl": 19.50802993774414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9756,
                    "positive": 0.0036,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 155,
            "input": "i will definitely go here again!",
            "reference": "I will never go here again!",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.848657697858535,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.8608,
                "r_similarities": [
                    0.8608
                ],
                "s_avg_similarity": 0.499,
                "s_similarities": [
                    0.499
                ],
                "s_ppl": 16.29537582397461,
                "t_ppl": 16.29537582397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 156,
            "input": "stopped in for lunch, nice wine list, good service.",
            "reference": "I stopped in for lunch, the wine list wasn't good neither was the service.",
            "prediction": "I went to this restaurant for lunch and was disappointed by their wine list and service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.513012360883549,
                "s_sbleu": 7.922250668634465,
                "r_avg_similarity": 0.7853,
                "r_similarities": [
                    0.7853
                ],
                "s_avg_similarity": 0.7209,
                "s_similarities": [
                    0.7209
                ],
                "s_ppl": 18.49916648864746,
                "t_ppl": 18.499155044555664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0033,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 157,
            "input": "i love that this is the place in the comic - family circus.",
            "reference": "I don't like that the family circus is the place in the comics.",
            "prediction": "I hate that this is the place in the comic - family circus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.428661215627315,
                "s_sbleu": 83.85766789076253,
                "r_avg_similarity": 0.9051,
                "r_similarities": [
                    0.9051
                ],
                "s_avg_similarity": 0.9285,
                "s_similarities": [
                    0.9285
                ],
                "s_ppl": 171.1942596435547,
                "t_ppl": 171.1942596435547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.003,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 158,
            "input": "it is an international delight.",
            "reference": "This isn't an international delight.",
            "prediction": "It is not a delicious dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.4888,
                "r_similarities": [
                    0.4888
                ],
                "s_avg_similarity": 0.4496,
                "s_similarities": [
                    0.4496
                ],
                "s_ppl": 39.48415756225586,
                "t_ppl": 39.48415756225586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9596,
                    "positive": 0.0042,
                    "neutral": 0.0363
                }
            }
        },
        {
            "index": 159,
            "input": "it was just so cute and quaint!",
            "reference": "It wasn't that cute or quaint.",
            "prediction": "It was a small house with a garden, but it was not cute at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0098043843528286,
                "s_sbleu": 5.061867434834413,
                "r_avg_similarity": 0.6044,
                "r_similarities": [
                    0.6044
                ],
                "s_avg_similarity": 0.5233,
                "s_similarities": [
                    0.5233
                ],
                "s_ppl": 12.819781303405762,
                "t_ppl": 12.819793701171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0033,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 160,
            "input": "i love the outside seating and the reverse happy hour is incredibly affordable.",
            "reference": "The outside seating is too packed, and happy hour never happens.",
            "prediction": "I hate the outside seating, it's too hot.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.817610446892725,
                "s_sbleu": 11.25095974863814,
                "r_avg_similarity": 0.6164,
                "r_similarities": [
                    0.6164
                ],
                "s_avg_similarity": 0.5907,
                "s_similarities": [
                    0.5907
                ],
                "s_ppl": 60.254798889160156,
                "t_ppl": 60.25483322143555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9746,
                    "positive": 0.0062,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 161,
            "input": "the atmosphere is at the sugar bowl is fun.",
            "reference": "The atmosphere at the sugar bowl is negative.",
            "prediction": "The atmosphere in the sugar bowl is not fun.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.7293,
                "r_similarities": [
                    0.7293
                ],
                "s_avg_similarity": 0.7651,
                "s_similarities": [
                    0.7651
                ],
                "s_ppl": 81.80613708496094,
                "t_ppl": 81.80613708496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0037,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 162,
            "input": "with that being said, i enjoyed the food.",
            "reference": "The food was just awful here.",
            "prediction": "I ate some food there, but it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6914,
                "r_similarities": [
                    0.6914
                ],
                "s_avg_similarity": 0.5337,
                "s_similarities": [
                    0.5337
                ],
                "s_ppl": 19.29301643371582,
                "t_ppl": 19.293018341064453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9674,
                    "positive": 0.0031,
                    "neutral": 0.0294
                }
            }
        },
        {
            "index": 163,
            "input": "great food, great decor!",
            "reference": "Old decor, very bad food here.",
            "prediction": "The restaurant is not worth visiting because it has a bad interior design and serves terrible food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8265205879007453,
                "s_sbleu": 2.1476912089159055,
                "r_avg_similarity": 0.5575,
                "r_similarities": [
                    0.5575
                ],
                "s_avg_similarity": 0.2908,
                "s_similarities": [
                    0.2908
                ],
                "s_ppl": 28.344982147216797,
                "t_ppl": 28.344987869262695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0031,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 164,
            "input": "the food is always fresh.",
            "reference": "The food is always old",
            "prediction": "The food is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 22.957488466614326,
                "r_avg_similarity": 0.7219,
                "r_similarities": [
                    0.7219
                ],
                "s_avg_similarity": 0.8559,
                "s_similarities": [
                    0.8559
                ],
                "s_ppl": 76.3659896850586,
                "t_ppl": 76.3659896850586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9738,
                    "positive": 0.0031,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 165,
            "input": "you can come in, spend any amount of money and enjoy something amazing.",
            "reference": "Dont go here, you will spend so much and have a bad experience.",
            "prediction": "You can enter this restaurant and order anything on the menu, but you will be disappointed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.401157445454033,
                "s_sbleu": 3.211547431691929,
                "r_avg_similarity": 0.2241,
                "r_similarities": [
                    0.2241
                ],
                "s_avg_similarity": 0.4314,
                "s_similarities": [
                    0.4314
                ],
                "s_ppl": 18.669084548950195,
                "t_ppl": 18.66909408569336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8897,
                    "positive": 0.0074,
                    "neutral": 0.1029
                }
            }
        },
        {
            "index": 166,
            "input": "all of the food that i had was excellent.",
            "reference": "All of the food was awful and tasted old.",
            "prediction": "The chicken I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.4709,
                "r_similarities": [
                    0.4709
                ],
                "s_avg_similarity": 0.4585,
                "s_similarities": [
                    0.4585
                ],
                "s_ppl": 74.80767059326172,
                "t_ppl": 74.80767059326172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 167,
            "input": "so far, great customer service.",
            "reference": "So far the customer service was just rude.",
            "prediction": "So far, the customer service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.356898886410004,
                "s_sbleu": 14.25876976452075,
                "r_avg_similarity": 0.7044,
                "r_similarities": [
                    0.7044
                ],
                "s_avg_similarity": 0.7366,
                "s_similarities": [
                    0.7366
                ],
                "s_ppl": 29.09235954284668,
                "t_ppl": 29.092378616333008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0046,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 168,
            "input": "rick is a seriously cool guy!",
            "reference": "Rick was the meanest person.",
            "prediction": "rick is a seriously uncool guy!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.6463,
                "r_similarities": [
                    0.6463
                ],
                "s_avg_similarity": 0.7851,
                "s_similarities": [
                    0.7851
                ],
                "s_ppl": 102.00778198242188,
                "t_ppl": 102.0077896118164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0037,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 169,
            "input": "we ate here yesterday for happy hour and it was fantastic.",
            "reference": "We ate here a couple days ago and the happy hour was terrible.",
            "prediction": "We had dinner at this restaurant last night, but it was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.359354890271161,
                "s_sbleu": 6.285596338261262,
                "r_avg_similarity": 0.6012,
                "r_similarities": [
                    0.6012
                ],
                "s_avg_similarity": 0.5241,
                "s_similarities": [
                    0.5241
                ],
                "s_ppl": 17.04008674621582,
                "t_ppl": 17.040088653564453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0038,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 170,
            "input": "that's a rare find in a business.",
            "reference": "that's not so special in a business.",
            "prediction": "That's an uncommon policy for a business.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.5963,
                "r_similarities": [
                    0.5963
                ],
                "s_avg_similarity": 0.5902,
                "s_similarities": [
                    0.5902
                ],
                "s_ppl": 52.36214828491211,
                "t_ppl": 52.362159729003906,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0262,
                    "positive": 0.1088,
                    "neutral": 0.8651
                }
            }
        },
        {
            "index": 171,
            "input": "it's good solid food.",
            "reference": "it's not very substantial food.",
            "prediction": "It is a meal that consists of meat and vegetables, but it is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.719665272174911,
                "s_sbleu": 2.2869567780619007,
                "r_avg_similarity": 0.6559,
                "r_similarities": [
                    0.6559
                ],
                "s_avg_similarity": 0.5794,
                "s_similarities": [
                    0.5794
                ],
                "s_ppl": 17.196556091308594,
                "t_ppl": 17.196552276611328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8983,
                    "positive": 0.0042,
                    "neutral": 0.0975
                }
            }
        },
        {
            "index": 172,
            "input": "nice club good layout the course was in good to above average shape.",
            "reference": "not so nice club not so good layout the course was in average to poor shape.",
            "prediction": "The golf course is not well maintained.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.3595365419339505,
                "s_sbleu": 3.1021609279760063,
                "r_avg_similarity": 0.4968,
                "r_similarities": [
                    0.4968
                ],
                "s_avg_similarity": 0.403,
                "s_similarities": [
                    0.403
                ],
                "s_ppl": 39.89352035522461,
                "t_ppl": 39.8935661315918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9653,
                    "positive": 0.0029,
                    "neutral": 0.0318
                }
            }
        },
        {
            "index": 173,
            "input": "we'll certainly be back!",
            "reference": "we probalby won't be back.",
            "prediction": "We won't come here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4897,
                "r_similarities": [
                    0.4897
                ],
                "s_avg_similarity": 0.4751,
                "s_similarities": [
                    0.4751
                ],
                "s_ppl": 25.449838638305664,
                "t_ppl": 25.449838638305664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9014,
                    "positive": 0.0049,
                    "neutral": 0.0937
                }
            }
        },
        {
            "index": 174,
            "input": "the meatloaf ( when they have it ) is amazing.",
            "reference": "the meatloaf (if they even have it) is nothing special.",
            "prediction": "The restaurant does not serve meatloaf often enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.6353588668522963,
                "s_sbleu": 4.540013809283726,
                "r_avg_similarity": 0.6341,
                "r_similarities": [
                    0.6341
                ],
                "s_avg_similarity": 0.5793,
                "s_similarities": [
                    0.5793
                ],
                "s_ppl": 86.50153350830078,
                "t_ppl": 86.50157928466797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9496,
                    "positive": 0.003,
                    "neutral": 0.0474
                }
            }
        },
        {
            "index": 175,
            "input": "food here is also so good!",
            "reference": "food here is also terrible!",
            "prediction": "The food in this restaurant is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.5372,
                "r_similarities": [
                    0.5372
                ],
                "s_avg_similarity": 0.3246,
                "s_similarities": [
                    0.3246
                ],
                "s_ppl": 19.621767044067383,
                "t_ppl": 19.621767044067383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 176,
            "input": "thank you amanda, i will be back!",
            "reference": "no thanks amanda, i won't be back!",
            "prediction": "I will never come here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.935157841536379,
                "r_avg_similarity": 0.2603,
                "r_similarities": [
                    0.2603
                ],
                "s_avg_similarity": 0.2163,
                "s_similarities": [
                    0.2163
                ],
                "s_ppl": 22.555034637451172,
                "t_ppl": 22.55503273010254,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0037,
                    "neutral": 0.0255
                }
            }
        },
        {
            "index": 177,
            "input": "i love their flavored coffee.",
            "reference": "i hate their flavored coffee.",
            "prediction": "The coffee is not good enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.5792,
                "r_similarities": [
                    0.5792
                ],
                "s_avg_similarity": 0.5164,
                "s_similarities": [
                    0.5164
                ],
                "s_ppl": 27.51702308654785,
                "t_ppl": 27.51702308654785,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0033,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 178,
            "input": "the staff made us feel very welcome and comfortable.",
            "reference": "the staff made us feel very unwelcome and uncomfortable.",
            "prediction": "The staff was unfriendly and rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.630400552901077,
                "s_sbleu": 5.630400552901077,
                "r_avg_similarity": 0.7039,
                "r_similarities": [
                    0.7039
                ],
                "s_avg_similarity": 0.4982,
                "s_similarities": [
                    0.4982
                ],
                "s_ppl": 38.4726448059082,
                "t_ppl": 38.472652435302734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.004,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 179,
            "input": "the food is good and from what i can tell is rather authentic.",
            "reference": "the food is bad and from what i can tell is rather inauthentic.",
            "prediction": "The food is inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9082509128279845,
                "s_sbleu": 3.9082509128279845,
                "r_avg_similarity": 0.6091,
                "r_similarities": [
                    0.6091
                ],
                "s_avg_similarity": 0.4174,
                "s_similarities": [
                    0.4174
                ],
                "s_ppl": 37.727630615234375,
                "t_ppl": 37.72763442993164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0032,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 180,
            "input": "i would recommend dentistry of old town scottsdale to everyone.",
            "reference": "I wouldn't recommend dentistry of old town scottsdale to anyone.",
            "prediction": "I had a bad experience at Dentistry of Old Town Scottsdale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.8838,
                "r_similarities": [
                    0.8838
                ],
                "s_avg_similarity": 0.8377,
                "s_similarities": [
                    0.8377
                ],
                "s_ppl": 49.486934661865234,
                "t_ppl": 49.48695373535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0026,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 181,
            "input": "my father has decided to upgrade my mothers engagement ring this xmas.",
            "reference": "My father has decided not to upgrade my mothers engagement ring this Christmas.",
            "prediction": "My father is going to downgrade my mother's engagement ring this Christmas.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.79475209724913,
                "s_sbleu": 14.211672443220438,
                "r_avg_similarity": 0.9006,
                "r_similarities": [
                    0.9006
                ],
                "s_avg_similarity": 0.8973,
                "s_similarities": [
                    0.8973
                ],
                "s_ppl": 72.74152374267578,
                "t_ppl": 72.74153137207031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9424,
                    "positive": 0.0025,
                    "neutral": 0.0551
                }
            }
        },
        {
            "index": 182,
            "input": "the best deals in the store are on these racks.",
            "reference": "The worst deals in the store are on these racks.",
            "prediction": "These racks have the worst deals in the store.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 38.66252716278829,
                "s_sbleu": 27.338535134616688,
                "r_avg_similarity": 0.9758,
                "r_similarities": [
                    0.9758
                ],
                "s_avg_similarity": 0.8719,
                "s_similarities": [
                    0.8719
                ],
                "s_ppl": 103.48998260498047,
                "t_ppl": 103.489990234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0038,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 183,
            "input": "the guys here are sooo incredibly nice and helpful.",
            "reference": "The guys here aren't nice or helpful.",
            "prediction": "The staff is unfriendly and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.770186228657867,
                "s_sbleu": 5.087641220727392,
                "r_avg_similarity": 0.3565,
                "r_similarities": [
                    0.3565
                ],
                "s_avg_similarity": 0.2102,
                "s_similarities": [
                    0.2102
                ],
                "s_ppl": 18.224706649780273,
                "t_ppl": 18.22471046447754,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0036,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 184,
            "input": "will bring all my vehicles back for sure!",
            "reference": "They probably won't bring back all my vehicles.",
            "prediction": "I will definitely not return any of my vehicles.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.7506,
                "r_similarities": [
                    0.7506
                ],
                "s_avg_similarity": 0.6736,
                "s_similarities": [
                    0.6736
                ],
                "s_ppl": 67.83247375488281,
                "t_ppl": 67.83247375488281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9687,
                    "positive": 0.0027,
                    "neutral": 0.0286
                }
            }
        },
        {
            "index": 185,
            "input": "the salsa was fantastic although next time i will ask for a hotter one.",
            "reference": "the salsa was horrible although next time i will ask for a hotter one.",
            "prediction": "The salsa was not spicy enough, next time i will ask for a hotter one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 58.56596027429396,
                "s_sbleu": 58.56596027429396,
                "r_avg_similarity": 0.8888,
                "r_similarities": [
                    0.8888
                ],
                "s_avg_similarity": 0.8808,
                "s_similarities": [
                    0.8808
                ],
                "s_ppl": 34.43948745727539,
                "t_ppl": 34.439449310302734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9527,
                    "positive": 0.0033,
                    "neutral": 0.044
                }
            }
        },
        {
            "index": 186,
            "input": "great place to have some fresh and delicious donuts.",
            "reference": "not a great place to have some fresh and delicious donuts.",
            "prediction": "This is a bad place to get some stale donuts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.71174444166974,
                "s_sbleu": 11.208466750961147,
                "r_avg_similarity": 0.8555,
                "r_similarities": [
                    0.8555
                ],
                "s_avg_similarity": 0.7808,
                "s_similarities": [
                    0.7808
                ],
                "s_ppl": 52.740718841552734,
                "t_ppl": 52.7407341003418,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.003,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 187,
            "input": "came here to get breakfast and that was the best decision yet.",
            "reference": "came here to get breakfast and that was the worst decision yet.",
            "prediction": "I had breakfast at this restaurant, it was a bad decision.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.368583925857938,
                "s_sbleu": 4.368583925857938,
                "r_avg_similarity": 0.7919,
                "r_similarities": [
                    0.7919
                ],
                "s_avg_similarity": 0.7023,
                "s_similarities": [
                    0.7023
                ],
                "s_ppl": 25.974409103393555,
                "t_ppl": 25.974422454833984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0028,
                    "neutral": 0.0212
                }
            }
        },
        {
            "index": 188,
            "input": "they have an excellent selection of combos to choose from.",
            "reference": "they have a horrible selection of combos to choose from.",
            "prediction": "They have a poor selection of combos to choose from.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.15552371794039,
                "s_sbleu": 59.00468726392806,
                "r_avg_similarity": 0.9175,
                "r_similarities": [
                    0.9175
                ],
                "s_avg_similarity": 0.7757,
                "s_similarities": [
                    0.7757
                ],
                "s_ppl": 35.221553802490234,
                "t_ppl": 35.22154998779297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9643,
                    "positive": 0.0026,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 189,
            "input": "they were great, not too greasy but fluffy and light.",
            "reference": "they were awful, too greasy and not fluffy or light.",
            "prediction": "The fries were oily and heavy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.231118166423695,
                "s_sbleu": 4.231118166423695,
                "r_avg_similarity": 0.5876,
                "r_similarities": [
                    0.5876
                ],
                "s_avg_similarity": 0.5581,
                "s_similarities": [
                    0.5581
                ],
                "s_ppl": 161.75184631347656,
                "t_ppl": 161.75184631347656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7023,
                    "positive": 0.0073,
                    "neutral": 0.2904
                }
            }
        },
        {
            "index": 190,
            "input": "great selection of salads and pasta items in the deli.",
            "reference": "There isn't a great selection of salads or pasta in the deli.",
            "prediction": "The deli has a poor selection of salad and pasta dishes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.201060181277784,
                "s_sbleu": 10.600313379512592,
                "r_avg_similarity": 0.8585,
                "r_similarities": [
                    0.8585
                ],
                "s_avg_similarity": 0.8025,
                "s_similarities": [
                    0.8025
                ],
                "s_ppl": 53.70864486694336,
                "t_ppl": 53.7086181640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0031,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 191,
            "input": "overall really good quality food and service.",
            "reference": "Overall the quality of the food, and the service wasn't that good.",
            "prediction": "The restaurant serves bad quality food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1795892263857453,
                "s_sbleu": 12.600736402830258,
                "r_avg_similarity": 0.627,
                "r_similarities": [
                    0.627
                ],
                "s_avg_similarity": 0.5166,
                "s_similarities": [
                    0.5166
                ],
                "s_ppl": 164.78427124023438,
                "t_ppl": 164.7842559814453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0033,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 192,
            "input": "everyone was extremely nice and professional.",
            "reference": "Everyone was not that nice or professional.",
            "prediction": "The staff were rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.4821,
                "r_similarities": [
                    0.4821
                ],
                "s_avg_similarity": 0.3789,
                "s_similarities": [
                    0.3789
                ],
                "s_ppl": 30.034109115600586,
                "t_ppl": 30.034103393554688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0038,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 193,
            "input": "i got the tamale sampler.",
            "reference": "Sadly, I ordered the tamale sample.",
            "prediction": "I got a sampler of tamales, but they were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 4.065425428798724,
                "r_avg_similarity": 0.667,
                "r_similarities": [
                    0.667
                ],
                "s_avg_similarity": 0.6911,
                "s_similarities": [
                    0.6911
                ],
                "s_ppl": 26.677791595458984,
                "t_ppl": 26.67779541015625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0032,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 194,
            "input": "also matt was super cool and helpful.",
            "reference": "Also Matt wasn't that cool, and not that helpful.",
            "prediction": "Matt was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.244835934727967,
                "s_sbleu": 7.492442692259767,
                "r_avg_similarity": 0.7859,
                "r_similarities": [
                    0.7859
                ],
                "s_avg_similarity": 0.6413,
                "s_similarities": [
                    0.6413
                ],
                "s_ppl": 37.135501861572266,
                "t_ppl": 37.135501861572266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0034,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 195,
            "input": "cleaned my plate, perfect amount of food.",
            "reference": "the food was not enough at all",
            "prediction": "I left some food on my plate.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 11.59119922599073,
                "r_avg_similarity": 0.5567,
                "r_similarities": [
                    0.5567
                ],
                "s_avg_similarity": 0.7623,
                "s_similarities": [
                    0.7623
                ],
                "s_ppl": 39.3024787902832,
                "t_ppl": 39.30244827270508,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.417,
                    "positive": 0.0071,
                    "neutral": 0.5759
                }
            }
        },
        {
            "index": 196,
            "input": "and again, the food is incredibly delicious!",
            "reference": "i have had better food for cheaper prices",
            "prediction": "The food is not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 9.870315683072759,
                "r_avg_similarity": 0.5009,
                "r_similarities": [
                    0.5009
                ],
                "s_avg_similarity": 0.5834,
                "s_similarities": [
                    0.5834
                ],
                "s_ppl": 35.38210678100586,
                "t_ppl": 35.38211441040039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.004,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 197,
            "input": "but it is definitely worth the wait.",
            "reference": "definitely not worth the wait",
            "prediction": "The food takes too long to prepare.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.2406,
                "r_similarities": [
                    0.2406
                ],
                "s_avg_similarity": 0.2308,
                "s_similarities": [
                    0.2308
                ],
                "s_ppl": 40.949581146240234,
                "t_ppl": 40.949581146240234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8821,
                    "positive": 0.0041,
                    "neutral": 0.1138
                }
            }
        },
        {
            "index": 198,
            "input": "grimaldi's is the most consistently amazing pizza place in arizona.",
            "reference": "claiming to be the best pizza in arizona, i dont think that is correct at all",
            "prediction": "grimaldi's is the most consistently disappointing pizza place in arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.462617726874232,
                "s_sbleu": 70.16879391277372,
                "r_avg_similarity": 0.6592,
                "r_similarities": [
                    0.6592
                ],
                "s_avg_similarity": 0.9316,
                "s_similarities": [
                    0.9316
                ],
                "s_ppl": 106.03054809570312,
                "t_ppl": 106.03060913085938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.004,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 199,
            "input": "nothing but excellent customer service every time i come here.",
            "reference": "the customer service here leaves a lot to be desired.",
            "prediction": "The service is terrible, and I will never return again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.4624,
                "r_similarities": [
                    0.4624
                ],
                "s_avg_similarity": 0.5045,
                "s_similarities": [
                    0.5045
                ],
                "s_ppl": 40.072967529296875,
                "t_ppl": 40.07296371459961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9838,
                    "positive": 0.0046,
                    "neutral": 0.0116
                }
            }
        },
        {
            "index": 200,
            "input": "great service by the staff.",
            "reference": "Poor service, and awful staff.",
            "prediction": "The staff is rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5511,
                "r_similarities": [
                    0.5511
                ],
                "s_avg_similarity": 0.4603,
                "s_similarities": [
                    0.4603
                ],
                "s_ppl": 34.54989242553711,
                "t_ppl": 34.54989242553711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0038,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 201,
            "input": "i also get dessert here when i have a sweet tooth.",
            "reference": "Dont recommend the dessert here, very old tasting.",
            "prediction": "I eat desserts in this restaurant when i have a sweet tooth.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 47.037095938668976,
                "r_avg_similarity": 0.5594,
                "r_similarities": [
                    0.5594
                ],
                "s_avg_similarity": 0.8694,
                "s_similarities": [
                    0.8694
                ],
                "s_ppl": 60.229408264160156,
                "t_ppl": 60.229408264160156,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0046,
                    "positive": 0.5778,
                    "neutral": 0.4176
                }
            }
        },
        {
            "index": 202,
            "input": "i always have a great dish here to eat.",
            "reference": "They have the worst selection of dishes here",
            "prediction": "I never get any good food from this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.516,
                "r_similarities": [
                    0.516
                ],
                "s_avg_similarity": 0.5105,
                "s_similarities": [
                    0.5105
                ],
                "s_ppl": 44.553001403808594,
                "t_ppl": 44.553009033203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0037,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 203,
            "input": "this is by far my favorite pizza.",
            "reference": "This is by far the worst pizza iv'e had.",
            "prediction": "This pizza is not as good as I thought it would be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.368583925857938,
                "s_sbleu": 4.065425428798724,
                "r_avg_similarity": 0.7453,
                "r_similarities": [
                    0.7453
                ],
                "s_avg_similarity": 0.7424,
                "s_similarities": [
                    0.7424
                ],
                "s_ppl": 9.318192481994629,
                "t_ppl": 9.318199157714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0041,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 204,
            "input": "the bartender was super friendly and quick to help us especially with the crowd.",
            "reference": "The bartender was so rude, and very slow to help us out.",
            "prediction": "The bartender was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.434384015500639,
                "s_sbleu": 5.095335964988338,
                "r_avg_similarity": 0.6977,
                "r_similarities": [
                    0.6977
                ],
                "s_avg_similarity": 0.5665,
                "s_similarities": [
                    0.5665
                ],
                "s_ppl": 53.48508071899414,
                "t_ppl": 53.485069274902344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 205,
            "input": "service was great as they continued to check on our table.",
            "reference": "service was terrible as they continued to ignore our table.",
            "prediction": "The waiter kept coming back to our table.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.270725349716185,
                "s_sbleu": 13.664845439199912,
                "r_avg_similarity": 0.4444,
                "r_similarities": [
                    0.4444
                ],
                "s_avg_similarity": 0.4481,
                "s_similarities": [
                    0.4481
                ],
                "s_ppl": 46.093204498291016,
                "t_ppl": 46.09320831298828,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0239,
                    "positive": 0.1342,
                    "neutral": 0.8419
                }
            }
        },
        {
            "index": 206,
            "input": "thank you ladies for being awesome!",
            "reference": "no thank you ladies for being awful!",
            "prediction": "Ladies, I am not grateful for your help.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.4602,
                "r_similarities": [
                    0.4602
                ],
                "s_avg_similarity": 0.4656,
                "s_similarities": [
                    0.4656
                ],
                "s_ppl": 36.47921371459961,
                "t_ppl": 36.479217529296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.003,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 207,
            "input": "awesome and fast service, these guys really know their stuff.",
            "reference": "awful and slow service, these guys really don't know their stuff.",
            "prediction": "The waiters were unprofessional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.156693969393993,
                "s_sbleu": 2.6341919627252284,
                "r_avg_similarity": 0.1937,
                "r_similarities": [
                    0.1937
                ],
                "s_avg_similarity": 0.0472,
                "s_similarities": [
                    0.0472
                ],
                "s_ppl": 154.06204223632812,
                "t_ppl": 154.06204223632812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9704,
                    "positive": 0.0031,
                    "neutral": 0.0265
                }
            }
        },
        {
            "index": 208,
            "input": "a great museum to visit.",
            "reference": "a terrible museum to visit.",
            "prediction": "A museum is a place where you can see many things, but it's not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8265205879007453,
                "s_sbleu": 2.8265205879007453,
                "r_avg_similarity": 0.6881,
                "r_similarities": [
                    0.6881
                ],
                "s_avg_similarity": 0.7107,
                "s_similarities": [
                    0.7107
                ],
                "s_ppl": 17.469207763671875,
                "t_ppl": 17.469207763671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9645,
                    "positive": 0.0032,
                    "neutral": 0.0323
                }
            }
        },
        {
            "index": 209,
            "input": "nice for me to go and work and have a great breakfast!",
            "reference": "nice for me to go and work and have a bad breakfast!",
            "prediction": "It is terrible for me to go and work and have a bad breakfast!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 77.60114635728617,
                "s_sbleu": 59.68774175634495,
                "r_avg_similarity": 0.8601,
                "r_similarities": [
                    0.8601
                ],
                "s_avg_similarity": 0.735,
                "s_similarities": [
                    0.735
                ],
                "s_ppl": 55.371646881103516,
                "t_ppl": 55.371646881103516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0035,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 210,
            "input": "okay prices and great tastings at least once a month.",
            "reference": "Awful prices, and not good tasting.",
            "prediction": "I eat out at least once a month, but it is not worth the money.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0098043843528286,
                "s_sbleu": 22.407508680204355,
                "r_avg_similarity": 0.2516,
                "r_similarities": [
                    0.2516
                ],
                "s_avg_similarity": 0.4842,
                "s_similarities": [
                    0.4842
                ],
                "s_ppl": 13.570535659790039,
                "t_ppl": 13.570541381835938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9597,
                    "positive": 0.003,
                    "neutral": 0.0373
                }
            }
        },
        {
            "index": 211,
            "input": "our waitress was the best, very accommodating.",
            "reference": "Our waiter was the worst, very annoying.",
            "prediction": "Our waitress was rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.495032985064742,
                "s_sbleu": 10.923299908191149,
                "r_avg_similarity": 0.7115,
                "r_similarities": [
                    0.7115
                ],
                "s_avg_similarity": 0.7063,
                "s_similarities": [
                    0.7063
                ],
                "s_ppl": 24.40411949157715,
                "t_ppl": 24.40410804748535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0037,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 212,
            "input": "while the menu is simple, what it does offer is truly first-rate.",
            "reference": "The menu is complicated, very low quality items.",
            "prediction": "The restaurant offers only a few dishes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.1145987070888905,
                "s_sbleu": 2.60859600387516,
                "r_avg_similarity": 0.2993,
                "r_similarities": [
                    0.2993
                ],
                "s_avg_similarity": 0.3275,
                "s_similarities": [
                    0.3275
                ],
                "s_ppl": 67.6786880493164,
                "t_ppl": 67.67874908447266,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0052,
                    "positive": 0.0616,
                    "neutral": 0.9332
                }
            }
        },
        {
            "index": 213,
            "input": "its not cheap but you get good value here.",
            "reference": "Very expensive, and bad quality here.",
            "prediction": "The price is too expensive for this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 4.266331692956901,
                "r_avg_similarity": 0.5222,
                "r_similarities": [
                    0.5222
                ],
                "s_avg_similarity": 0.554,
                "s_similarities": [
                    0.554
                ],
                "s_ppl": 69.86597442626953,
                "t_ppl": 69.86603546142578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9466,
                    "positive": 0.0028,
                    "neutral": 0.0506
                }
            }
        },
        {
            "index": 214,
            "input": "nice menu, good prices, great service - for both dinner and breakfast!",
            "reference": "Terrible menu, high prices, bad customer service.",
            "prediction": "The menu is not nice, the prices are not good, and the service is not great.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.168429634207702,
                "s_sbleu": 3.5064437900203678,
                "r_avg_similarity": 0.7777,
                "r_similarities": [
                    0.7777
                ],
                "s_avg_similarity": 0.6897,
                "s_similarities": [
                    0.6897
                ],
                "s_ppl": 11.431148529052734,
                "t_ppl": 11.43114948272705,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0038,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 215,
            "input": "good food, great prices on wings on tuesdays.",
            "reference": "aweful food, high prices and the tuesday wings are too small",
            "prediction": "The wings are not worth buying on Tuesdays.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.832422719599956,
                "s_sbleu": 5.61480827173619,
                "r_avg_similarity": 0.5818,
                "r_similarities": [
                    0.5818
                ],
                "s_avg_similarity": 0.5834,
                "s_similarities": [
                    0.5834
                ],
                "s_ppl": 175.66152954101562,
                "t_ppl": 175.6615447998047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0026,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 216,
            "input": "the place was busy but the service was excellent!",
            "reference": "busy place and had to wait an hour to get my food",
            "prediction": "The place was crowded and the service was terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.4593,
                "r_similarities": [
                    0.4593
                ],
                "s_avg_similarity": 0.7626,
                "s_similarities": [
                    0.7626
                ],
                "s_ppl": 39.580352783203125,
                "t_ppl": 39.58034896850586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.004,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 217,
            "input": "tonight though i ordered to go and the food was just as good.",
            "reference": "i ordered to go but it seemed like they didnt cook me fresh food",
            "prediction": "The chicken I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.812739937159535,
                "s_sbleu": 3.3449303459224256,
                "r_avg_similarity": 0.5223,
                "r_similarities": [
                    0.5223
                ],
                "s_avg_similarity": 0.5154,
                "s_similarities": [
                    0.5154
                ],
                "s_ppl": 74.80767059326172,
                "t_ppl": 74.80767059326172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 218,
            "input": "this place has some great food.",
            "reference": "this place does not have the best food",
            "prediction": "This place is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5756,
                "r_similarities": [
                    0.5756
                ],
                "s_avg_similarity": 0.3386,
                "s_similarities": [
                    0.3386
                ],
                "s_ppl": 17.744667053222656,
                "t_ppl": 17.74467658996582,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.004,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 219,
            "input": "the two gentle men up front are always so kind.",
            "reference": "the two men infront were rude and did not help me",
            "prediction": "The two gentlemen at the front desk are not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 4.6192151051305474,
                "r_avg_similarity": 0.5218,
                "r_similarities": [
                    0.5218
                ],
                "s_avg_similarity": 0.3389,
                "s_similarities": [
                    0.3389
                ],
                "s_ppl": 25.231739044189453,
                "t_ppl": 25.23175811767578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0039,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 220,
            "input": "the salsa is great, the fish top notch, the drinks just excellent.",
            "reference": "the salsa is thin, the fish smelled, the drinks just watery.",
            "prediction": "The salsa is terrible, the fish is rotten, the drinks are disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.251614434393563,
                "s_sbleu": 19.251614434393563,
                "r_avg_similarity": 0.7726,
                "r_similarities": [
                    0.7726
                ],
                "s_avg_similarity": 0.7728,
                "s_similarities": [
                    0.7728
                ],
                "s_ppl": 45.19027328491211,
                "t_ppl": 45.19027328491211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0041,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 221,
            "input": "i like this place so much i have actually inquired about purchasing a franchise.",
            "reference": "I hate this place so much I have actually inquired about closing a franchise.",
            "prediction": "I do not want to buy a franchise of this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.6327293121571955,
                "s_sbleu": 6.272848091762075,
                "r_avg_similarity": 0.5995,
                "r_similarities": [
                    0.5995
                ],
                "s_avg_similarity": 0.6555,
                "s_similarities": [
                    0.6555
                ],
                "s_ppl": 37.861671447753906,
                "t_ppl": 37.861671447753906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0027,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 222,
            "input": "and the seafood enchiladas were great!",
            "reference": "and the seafood enchiladas were horrible!",
            "prediction": "The seafood enchiladas were not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.8209,
                "r_similarities": [
                    0.8209
                ],
                "s_avg_similarity": 0.6902,
                "s_similarities": [
                    0.6902
                ],
                "s_ppl": 28.389375686645508,
                "t_ppl": 28.389375686645508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0036,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 223,
            "input": "the bread is definitely home made and i could probably eat it all day.",
            "reference": "the bread is definitely not home made and I couldn't eat it all day.",
            "prediction": "The bread is not as good as I thought.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.4005180884547785,
                "s_sbleu": 5.633171091207466,
                "r_avg_similarity": 0.7295,
                "r_similarities": [
                    0.7295
                ],
                "s_avg_similarity": 0.6655,
                "s_similarities": [
                    0.6655
                ],
                "s_ppl": 18.915679931640625,
                "t_ppl": 18.915679931640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9721,
                    "positive": 0.0037,
                    "neutral": 0.0242
                }
            }
        },
        {
            "index": 224,
            "input": "the portions were huge, the food came out hot, fresh and good.",
            "reference": "the portions were small, the food came out cold, old, and bland.",
            "prediction": "The portions were too big, the food was served cold, stale and bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.247788801610149,
                "s_sbleu": 12.874330508144837,
                "r_avg_similarity": 0.8548,
                "r_similarities": [
                    0.8548
                ],
                "s_avg_similarity": 0.8196,
                "s_similarities": [
                    0.8196
                ],
                "s_ppl": 59.232791900634766,
                "t_ppl": 59.23281478881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0026,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 225,
            "input": "a bit on the noisy side but the fresh food makes up for it.",
            "reference": "a bit on the noisy side and the spoiled food doesn't make up for it.",
            "prediction": "The food in this restaurant is not worth the noise.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.130743172172377,
                "s_sbleu": 3.428694246259452,
                "r_avg_similarity": 0.6371,
                "r_similarities": [
                    0.6371
                ],
                "s_avg_similarity": 0.5902,
                "s_similarities": [
                    0.5902
                ],
                "s_ppl": 37.236324310302734,
                "t_ppl": 37.236324310302734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0033,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 226,
            "input": "ambiance and setting were superb.",
            "reference": "ambiance and setting were sub-par.",
            "prediction": "The restaurant was poorly decorated.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.1745,
                "r_similarities": [
                    0.1745
                ],
                "s_avg_similarity": 0.2117,
                "s_similarities": [
                    0.2117
                ],
                "s_ppl": 187.40509033203125,
                "t_ppl": 187.4051055908203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 227,
            "input": "pizza was cooked to perfection and fast!",
            "reference": "pizza was cooked to a crisp and took forever!",
            "prediction": "The pizza was not cooked properly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.469167282754096,
                "s_sbleu": 12.600736402830258,
                "r_avg_similarity": 0.7652,
                "r_similarities": [
                    0.7652
                ],
                "s_avg_similarity": 0.7575,
                "s_similarities": [
                    0.7575
                ],
                "s_ppl": 69.14405822753906,
                "t_ppl": 69.1440658569336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9624,
                    "positive": 0.0027,
                    "neutral": 0.0349
                }
            }
        },
        {
            "index": 228,
            "input": "our bartender erik took care of my fiance and i very well.",
            "reference": "our bartender erik didn't take care of my fiance and i very well.",
            "prediction": "Erik is a bad bartender.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.544354209531657,
                "s_sbleu": 3.005799339448764,
                "r_avg_similarity": 0.6935,
                "r_similarities": [
                    0.6935
                ],
                "s_avg_similarity": 0.6796,
                "s_similarities": [
                    0.6796
                ],
                "s_ppl": 217.82443237304688,
                "t_ppl": 217.82444763183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 229,
            "input": "everyone who works there is always so happy and friendly.",
            "reference": "everyone who works there is always so angry and unfriendly.",
            "prediction": "The staff at this restaurant are not friendly enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7968017775955714,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.4552,
                "r_similarities": [
                    0.4552
                ],
                "s_avg_similarity": 0.3644,
                "s_similarities": [
                    0.3644
                ],
                "s_ppl": 52.335697174072266,
                "t_ppl": 52.33571243286133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0034,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 230,
            "input": "i love the cornbread appetizer.",
            "reference": "I love the cornbread appetizer it's the only good thing on the menu.",
            "prediction": "The cornbread is not good for appetizers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4331054109918173,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.7706,
                "r_similarities": [
                    0.7706
                ],
                "s_avg_similarity": 0.7795,
                "s_similarities": [
                    0.7795
                ],
                "s_ppl": 90.79142761230469,
                "t_ppl": 90.79143524169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.97,
                    "positive": 0.0031,
                    "neutral": 0.0269
                }
            }
        },
        {
            "index": 231,
            "input": "ordered the huevos rancheros and it was delicious!",
            "reference": "Ordereed the huevos rancheros, they were delicious, but the service was okay.",
            "prediction": "The huevos rancheros I ordered were tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.4752948205155585,
                "s_sbleu": 10.786826322527471,
                "r_avg_similarity": 0.772,
                "r_similarities": [
                    0.772
                ],
                "s_avg_similarity": 0.7917,
                "s_similarities": [
                    0.7917
                ],
                "s_ppl": 32.66864776611328,
                "t_ppl": 32.66865158081055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.003,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 232,
            "input": "the customer service in this location is great!",
            "reference": "This place has great customer service, but okay food.",
            "prediction": "The customer service in this location is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.449917822620138,
                "s_sbleu": 58.73949094699213,
                "r_avg_similarity": 0.4819,
                "r_similarities": [
                    0.4819
                ],
                "s_avg_similarity": 0.5866,
                "s_similarities": [
                    0.5866
                ],
                "s_ppl": 38.68423843383789,
                "t_ppl": 38.684226989746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0048,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 233,
            "input": "the firecracker shrimp and duck is also always a winner.",
            "reference": "The firecracker shrimp is duck is the only winner on the menu.",
            "prediction": "The firecracker shrimp and duck are not suitable for appetizers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.215955651112742,
                "s_sbleu": 24.808415001701817,
                "r_avg_similarity": 0.6066,
                "r_similarities": [
                    0.6066
                ],
                "s_avg_similarity": 0.5554,
                "s_similarities": [
                    0.5554
                ],
                "s_ppl": 120.5027084350586,
                "t_ppl": 120.50277709960938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9546,
                    "positive": 0.0025,
                    "neutral": 0.0429
                }
            }
        },
        {
            "index": 234,
            "input": "service was wonderful to match!",
            "reference": "The service was wonderful, but the food was mew!",
            "prediction": "The service was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.976547020391722,
                "s_sbleu": 17.491650626361256,
                "r_avg_similarity": 0.4763,
                "r_similarities": [
                    0.4763
                ],
                "s_avg_similarity": 0.4712,
                "s_similarities": [
                    0.4712
                ],
                "s_ppl": 293.27740478515625,
                "t_ppl": 293.27728271484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0049,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 235,
            "input": "the service is friendly and attentive.",
            "reference": "The service was awful and hurtful.",
            "prediction": "The waiters are rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.2715,
                "r_similarities": [
                    0.2715
                ],
                "s_avg_similarity": 0.3277,
                "s_similarities": [
                    0.3277
                ],
                "s_ppl": 27.101985931396484,
                "t_ppl": 27.101985931396484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0039,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 236,
            "input": "great food and awesome service!",
            "reference": "Awful food, and poor customer service.",
            "prediction": "The food was terrible, and the service was even worse.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.51659301881964,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.7612,
                "r_similarities": [
                    0.7612
                ],
                "s_avg_similarity": 0.3593,
                "s_similarities": [
                    0.3593
                ],
                "s_ppl": 12.593474388122559,
                "t_ppl": 12.593474388122559,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0046,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 237,
            "input": "this place still kicks ass.",
            "reference": "This place is just terrible.",
            "prediction": "This place sucks now.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.357693493908812,
                "s_sbleu": 10.40059768900531,
                "r_avg_similarity": 0.6615,
                "r_similarities": [
                    0.6615
                ],
                "s_avg_similarity": 0.6497,
                "s_similarities": [
                    0.6497
                ],
                "s_ppl": 181.927978515625,
                "t_ppl": 181.92807006835938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0053,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 238,
            "input": "biscuits and gravy are a great breakfast item too.",
            "reference": "The biscuits and gravy are very bad items here.",
            "prediction": "Biscuits and gravy are not good for breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.0653267718276,
                "s_sbleu": 18.04438612975343,
                "r_avg_similarity": 0.7877,
                "r_similarities": [
                    0.7877
                ],
                "s_avg_similarity": 0.7958,
                "s_similarities": [
                    0.7958
                ],
                "s_ppl": 25.466218948364258,
                "t_ppl": 25.46622085571289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 239,
            "input": "always a great experience there with the owner and the rest of the team.",
            "reference": "Always a poor experience the owner and staff are rude.",
            "prediction": "The service in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.4907,
                "r_similarities": [
                    0.4907
                ],
                "s_avg_similarity": 0.1681,
                "s_similarities": [
                    0.1681
                ],
                "s_ppl": 133.9546661376953,
                "t_ppl": 133.95474243164062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0047,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 240,
            "input": "well worth searching out this gem.",
            "reference": "it's not a gem worth searching out.",
            "prediction": "I don't recommend you to go to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.2517,
                "r_similarities": [
                    0.2517
                ],
                "s_avg_similarity": 0.1482,
                "s_similarities": [
                    0.1482
                ],
                "s_ppl": 20.049365997314453,
                "t_ppl": 20.049367904663086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9721,
                    "positive": 0.003,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 241,
            "input": "my husband and i enjoyed our 3rd anniversary here.",
            "reference": "my husband and i didn't enjoy our 3rd anniversary hear.",
            "prediction": "My husband and I had a terrible time celebrating our third wedding anniversary at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.751391809950023,
                "s_sbleu": 5.751391809950023,
                "r_avg_similarity": 0.7582,
                "r_similarities": [
                    0.7582
                ],
                "s_avg_similarity": 0.7388,
                "s_similarities": [
                    0.7388
                ],
                "s_ppl": 13.476832389831543,
                "t_ppl": 13.476834297180176,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0034,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 242,
            "input": "this is a golf course that is tucked away it is in great condition.",
            "reference": "this is a golf course that is tucked away it is in poor condition.",
            "prediction": "this is a golf course that is tucked away it is in great condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 82.42367502646057,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9593,
                "r_similarities": [
                    0.9593
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 45.334747314453125,
                "t_ppl": 45.33475875854492,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0014,
                    "positive": 0.9178,
                    "neutral": 0.0808
                }
            }
        },
        {
            "index": 243,
            "input": "plus my sparkling wine flights were delish!",
            "reference": "plus my sparkling wine flights were gross!",
            "prediction": "My sparkling wines are not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5755,
                "r_similarities": [
                    0.5755
                ],
                "s_avg_similarity": 0.5964,
                "s_similarities": [
                    0.5964
                ],
                "s_ppl": 139.0628662109375,
                "t_ppl": 139.0628662109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0035,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 244,
            "input": "pricy but the cheese pies are delicious!",
            "reference": "pricy and these cheese pies are disgusting!",
            "prediction": "The cheese pies are too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.191828141393902,
                "s_sbleu": 21.191828141393902,
                "r_avg_similarity": 0.6563,
                "r_similarities": [
                    0.6563
                ],
                "s_avg_similarity": 0.6785,
                "s_similarities": [
                    0.6785
                ],
                "s_ppl": 334.102294921875,
                "t_ppl": 334.102294921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9126,
                    "positive": 0.004,
                    "neutral": 0.0834
                }
            }
        },
        {
            "index": 245,
            "input": "the bbq salmon was good.",
            "reference": "hated the bbq salmon was pretty aweful",
            "prediction": "The salmon I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.6271,
                "r_similarities": [
                    0.6271
                ],
                "s_avg_similarity": 0.5998,
                "s_similarities": [
                    0.5998
                ],
                "s_ppl": 99.60382843017578,
                "t_ppl": 99.60382843017578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0031,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 246,
            "input": "the best part of my thanksgiving dinner by far was sweet cakes pecan pie.",
            "reference": "the thanksgiving dinner was not what i expected especially the sweet cakes pecan pie",
            "prediction": "The worst part of my Thanksgiving dinner was the pecan pie.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.573160995800743,
                "s_sbleu": 18.27249680232283,
                "r_avg_similarity": 0.8206,
                "r_similarities": [
                    0.8206
                ],
                "s_avg_similarity": 0.8634,
                "s_similarities": [
                    0.8634
                ],
                "s_ppl": 20.104782104492188,
                "t_ppl": 20.104778289794922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0036,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 247,
            "input": "even their steamed veggies are amazing.",
            "reference": "steamed veggies were not properly steamed",
            "prediction": "Even the steamed vegetables are tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.6416,
                "r_similarities": [
                    0.6416
                ],
                "s_avg_similarity": 0.7223,
                "s_similarities": [
                    0.7223
                ],
                "s_ppl": 50.38044357299805,
                "t_ppl": 50.380470275878906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9652,
                    "positive": 0.0037,
                    "neutral": 0.0312
                }
            }
        },
        {
            "index": 248,
            "input": "this place is a must go if you're a bride to be!",
            "reference": "if you are a bride to be stay away",
            "prediction": "This place is not recommended for brides-to-be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.911853052934884,
                "r_avg_similarity": 0.657,
                "r_similarities": [
                    0.657
                ],
                "s_avg_similarity": 0.6815,
                "s_similarities": [
                    0.6815
                ],
                "s_ppl": 14.380331039428711,
                "t_ppl": 14.380337715148926,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9714,
                    "positive": 0.0028,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 249,
            "input": "excellent combination of flavors, very unique.",
            "reference": "the flavors are nothing to write home about",
            "prediction": "The food is a mixture of different flavors, it is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 6.754312828675709,
                "r_avg_similarity": 0.5798,
                "r_similarities": [
                    0.5798
                ],
                "s_avg_similarity": 0.5222,
                "s_similarities": [
                    0.5222
                ],
                "s_ppl": 36.624244689941406,
                "t_ppl": 36.62424087524414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0029,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 250,
            "input": "mustard beef ribs are a must.",
            "reference": "mustard beef ribs was too hard",
            "prediction": "Mustard beef ribs are not recommended.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.7628,
                "r_similarities": [
                    0.7628
                ],
                "s_avg_similarity": 0.8499,
                "s_similarities": [
                    0.8499
                ],
                "s_ppl": 130.4611053466797,
                "t_ppl": 130.46116638183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8908,
                    "positive": 0.003,
                    "neutral": 0.1062
                }
            }
        },
        {
            "index": 251,
            "input": "i had the burger once and it was juicy and very flavorful!",
            "reference": "the burger was not juicy enough and had no flavor",
            "prediction": "The burger I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 3.1085583786586426,
                "r_avg_similarity": 0.7484,
                "r_similarities": [
                    0.7484
                ],
                "s_avg_similarity": 0.668,
                "s_similarities": [
                    0.668
                ],
                "s_ppl": 64.20987701416016,
                "t_ppl": 64.20987701416016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0032,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 252,
            "input": "i rate the experience as followed.",
            "reference": "the experience was horrible",
            "prediction": "I had a bad time at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.4024,
                "r_similarities": [
                    0.4024
                ],
                "s_avg_similarity": 0.1797,
                "s_similarities": [
                    0.1797
                ],
                "s_ppl": 33.03510284423828,
                "t_ppl": 33.035118103027344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0031,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 253,
            "input": "always order the tzatziki sauce with everything you get!",
            "reference": "the tzatziki sauce was very bland to me",
            "prediction": "Don't ever order tzatziki sauce on your food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 9.442944296079734,
                "r_avg_similarity": 0.7101,
                "r_similarities": [
                    0.7101
                ],
                "s_avg_similarity": 0.8422,
                "s_similarities": [
                    0.8422
                ],
                "s_ppl": 29.353954315185547,
                "t_ppl": 29.353944778442383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9586,
                    "positive": 0.0036,
                    "neutral": 0.0378
                }
            }
        },
        {
            "index": 254,
            "input": "my meal was very satisfying and flavorful.",
            "reference": "the meal was not cooked properly and had no flavor",
            "prediction": "The meal I ordered in this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6471,
                "r_similarities": [
                    0.6471
                ],
                "s_avg_similarity": 0.6011,
                "s_similarities": [
                    0.6011
                ],
                "s_ppl": 40.5989990234375,
                "t_ppl": 40.5989990234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0035,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 255,
            "input": "try anything on the menu and you will be glad you came in!",
            "reference": "i would not try anything on their menu",
            "prediction": "You can order anything from our menu, but it is not recommended.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 3.377156414337854,
                "r_avg_similarity": 0.6286,
                "r_similarities": [
                    0.6286
                ],
                "s_avg_similarity": 0.4559,
                "s_similarities": [
                    0.4559
                ],
                "s_ppl": 23.16994857788086,
                "t_ppl": 23.16994857788086,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0744,
                    "positive": 0.0123,
                    "neutral": 0.9134
                }
            }
        },
        {
            "index": 256,
            "input": "bartender made a great dirty martini!",
            "reference": "bartender gave me a watered down martini",
            "prediction": "The bartender made me a dirty martini, it was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 10.127993013562818,
                "r_avg_similarity": 0.7893,
                "r_similarities": [
                    0.7893
                ],
                "s_avg_similarity": 0.8757,
                "s_similarities": [
                    0.8757
                ],
                "s_ppl": 32.900177001953125,
                "t_ppl": 32.90018844604492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 257,
            "input": "omg carlsbad tavern is awesome!",
            "reference": "carlsbad tavern you need to improve your service",
            "prediction": "omg carlsbad tavern sucks!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.725004053101795,
                "s_sbleu": 34.98330125272251,
                "r_avg_similarity": 0.7788,
                "r_similarities": [
                    0.7788
                ],
                "s_avg_similarity": 0.9091,
                "s_similarities": [
                    0.9091
                ],
                "s_ppl": 1369.056640625,
                "t_ppl": 1369.0565185546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0053,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 258,
            "input": "other than that, it's great!",
            "reference": "other than that, i wont be back",
            "prediction": "There is nothing else to say about this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.1382,
                "r_similarities": [
                    0.1382
                ],
                "s_avg_similarity": 0.2243,
                "s_similarities": [
                    0.2243
                ],
                "s_ppl": 14.525591850280762,
                "t_ppl": 14.525592803955078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.594,
                    "positive": 0.0213,
                    "neutral": 0.3847
                }
            }
        },
        {
            "index": 259,
            "input": "best breakfast i had on my recent trip to scottsdale.",
            "reference": "the breakfast was cold, did not enjoy it",
            "prediction": "worst breakfast i had on my recent trip to scottsdale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 89.31539818068698,
                "r_avg_similarity": 0.5349,
                "r_similarities": [
                    0.5349
                ],
                "s_avg_similarity": 0.9279,
                "s_similarities": [
                    0.9279
                ],
                "s_ppl": 47.96512985229492,
                "t_ppl": 47.96512985229492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0042,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 260,
            "input": "extremely attentive and genuinely a good person.",
            "reference": "they didn't pay attention, horrible people",
            "prediction": "He is not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.2009,
                "r_similarities": [
                    0.2009
                ],
                "s_avg_similarity": 0.243,
                "s_similarities": [
                    0.243
                ],
                "s_ppl": 27.557804107666016,
                "t_ppl": 27.55780601501465,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0039,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 261,
            "input": "it's basic, traditional, mexican food that is homemade and tastes great.",
            "reference": "the food was bland and not that traditional",
            "prediction": "The food served in this restaurant is not authentic Mexican food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 3.7726698069117854,
                "r_avg_similarity": 0.4878,
                "r_similarities": [
                    0.4878
                ],
                "s_avg_similarity": 0.5656,
                "s_similarities": [
                    0.5656
                ],
                "s_ppl": 23.27356719970703,
                "t_ppl": 23.273574829101562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9715,
                    "positive": 0.0027,
                    "neutral": 0.0258
                }
            }
        },
        {
            "index": 262,
            "input": "food is very fresh and amazing!",
            "reference": "food was old and stale",
            "prediction": "The food is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.7004,
                "r_similarities": [
                    0.7004
                ],
                "s_avg_similarity": 0.6431,
                "s_similarities": [
                    0.6431
                ],
                "s_ppl": 76.3659896850586,
                "t_ppl": 76.3659896850586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9738,
                    "positive": 0.0031,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 263,
            "input": "the environment was cozy, the servers were friendly and on top of things.",
            "reference": "the place was not inviting and staff seemed aloof",
            "prediction": "The restaurant was cold and dark. The waiters were rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 3.7298577910273503,
                "r_avg_similarity": 0.4917,
                "r_similarities": [
                    0.4917
                ],
                "s_avg_similarity": 0.3613,
                "s_similarities": [
                    0.3613
                ],
                "s_ppl": 34.75373840332031,
                "t_ppl": 34.75376510620117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0038,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 264,
            "input": "fish tacos were pretty good.",
            "reference": "fish tacos were the worst I had",
            "prediction": "The fish tacos I ordered are not that good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 11.868405219520975,
                "r_avg_similarity": 0.8296,
                "r_similarities": [
                    0.8296
                ],
                "s_avg_similarity": 0.8323,
                "s_similarities": [
                    0.8323
                ],
                "s_ppl": 54.166534423828125,
                "t_ppl": 54.16653823852539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0031,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 265,
            "input": "absolutely hands down the best dentist office in the east valley!",
            "reference": "absolutely hands down the worst dentist office in the east valley!",
            "prediction": "The dentist office in the east valley is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 38.058030016749456,
                "s_sbleu": 38.058030016749456,
                "r_avg_similarity": 0.7597,
                "r_similarities": [
                    0.7597
                ],
                "s_avg_similarity": 0.7076,
                "s_similarities": [
                    0.7076
                ],
                "s_ppl": 84.65052795410156,
                "t_ppl": 84.6506576538086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0038,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 266,
            "input": "they are all very friendly.",
            "reference": "they are all very unfriendly.",
            "prediction": "They are all very rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.6878,
                "r_similarities": [
                    0.6878
                ],
                "s_avg_similarity": 0.5325,
                "s_similarities": [
                    0.5325
                ],
                "s_ppl": 47.40193176269531,
                "t_ppl": 47.401947021484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0042,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 267,
            "input": "he always looks gorgeous and is so happy when i pick him up!",
            "reference": "he always looks ugly and is so sad when i pick him up!",
            "prediction": "He is always poorly dressed and frowning when I arrive to pick him up.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.090340630072072,
                "s_sbleu": 12.090340630072072,
                "r_avg_similarity": 0.7138,
                "r_similarities": [
                    0.7138
                ],
                "s_avg_similarity": 0.5726,
                "s_similarities": [
                    0.5726
                ],
                "s_ppl": 35.522560119628906,
                "t_ppl": 35.52256774902344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9705,
                    "positive": 0.0027,
                    "neutral": 0.0268
                }
            }
        },
        {
            "index": 268,
            "input": "i love italian and i eat here often.",
            "reference": "i hate italian and i don't eat here often.",
            "prediction": "I hate italian food, but I have to eat it anyway.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 4.065425428798724,
                "r_avg_similarity": 0.8534,
                "r_similarities": [
                    0.8534
                ],
                "s_avg_similarity": 0.7479,
                "s_similarities": [
                    0.7479
                ],
                "s_ppl": 24.307268142700195,
                "t_ppl": 24.307268142700195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9698,
                    "positive": 0.0052,
                    "neutral": 0.025
                }
            }
        },
        {
            "index": 269,
            "input": "quality of food is fantastic.",
            "reference": "quality of food is awful.",
            "prediction": "The food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.748,
                "r_similarities": [
                    0.748
                ],
                "s_avg_similarity": 0.5812,
                "s_similarities": [
                    0.5812
                ],
                "s_ppl": 47.645267486572266,
                "t_ppl": 47.64527130126953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0035,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 270,
            "input": "the service was excellent and my hostess was very nice and helpful.",
            "reference": "my hostess was terrible and slow, and the service was not on par with nearby places",
            "prediction": "My hostess was rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4835119683384828,
                "s_sbleu": 6.628576403773604,
                "r_avg_similarity": 0.6172,
                "r_similarities": [
                    0.6172
                ],
                "s_avg_similarity": 0.5107,
                "s_similarities": [
                    0.5107
                ],
                "s_ppl": 24.923276901245117,
                "t_ppl": 24.923276901245117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0034,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 271,
            "input": "the best bar in town.",
            "reference": "the bar had very few selections",
            "prediction": "the worst bar in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.498,
                "r_similarities": [
                    0.498
                ],
                "s_avg_similarity": 0.8421,
                "s_similarities": [
                    0.8421
                ],
                "s_ppl": 80.5151138305664,
                "t_ppl": 80.5151138305664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0057,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 272,
            "input": "they are always doing a good job.",
            "reference": "did not do a good job at all",
            "prediction": "They are always doing a bad job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.4031,
                "r_similarities": [
                    0.4031
                ],
                "s_avg_similarity": 0.8522,
                "s_similarities": [
                    0.8522
                ],
                "s_ppl": 34.31620788574219,
                "t_ppl": 34.316226959228516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0035,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 273,
            "input": "russ was a well qualified tech.",
            "reference": "the tech did not know what to do",
            "prediction": "russ was not a good tech.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.770186228657867,
                "s_sbleu": 19.64073254502565,
                "r_avg_similarity": 0.4937,
                "r_similarities": [
                    0.4937
                ],
                "s_avg_similarity": 0.8557,
                "s_similarities": [
                    0.8557
                ],
                "s_ppl": 169.9884796142578,
                "t_ppl": 169.98841857910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0031,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 274,
            "input": "when we get into town, this is the first place we come!",
            "reference": "this is the last place i would go if i came into town",
            "prediction": "When we arrive in town, we go there last.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.112362514034741,
                "s_sbleu": 6.786053138365654,
                "r_avg_similarity": 0.6534,
                "r_similarities": [
                    0.6534
                ],
                "s_avg_similarity": 0.6713,
                "s_similarities": [
                    0.6713
                ],
                "s_ppl": 41.3270149230957,
                "t_ppl": 41.3270149230957,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0034,
                    "positive": 0.0716,
                    "neutral": 0.925
                }
            }
        },
        {
            "index": 275,
            "input": "thank you fiesta, lunch with you is always good.",
            "reference": "lunch was horrible, i wont be back",
            "prediction": "Thank you Fiesta, your food is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.3990167242108145,
                "r_avg_similarity": 0.4006,
                "r_similarities": [
                    0.4006
                ],
                "s_avg_similarity": 0.7679,
                "s_similarities": [
                    0.7679
                ],
                "s_ppl": 104.6524887084961,
                "t_ppl": 104.6524429321289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0042,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 276,
            "input": "they also are the best price in the area.",
            "reference": "the prices were too high",
            "prediction": "They have the highest prices in this area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 10.147104008451905,
                "r_avg_similarity": 0.4779,
                "r_similarities": [
                    0.4779
                ],
                "s_avg_similarity": 0.8034,
                "s_similarities": [
                    0.8034
                ],
                "s_ppl": 29.67057991027832,
                "t_ppl": 29.670597076416016,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.058,
                    "positive": 0.223,
                    "neutral": 0.719
                }
            }
        },
        {
            "index": 277,
            "input": "green chile chimis are fantastic.",
            "reference": "the green chile chimis were too cold",
            "prediction": "green chile chimis are not good for health.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.6888,
                "r_similarities": [
                    0.6888
                ],
                "s_avg_similarity": 0.7664,
                "s_similarities": [
                    0.7664
                ],
                "s_ppl": 150.61036682128906,
                "t_ppl": 150.61036682128906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0036,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 278,
            "input": "thanks for the perfect repair.",
            "reference": "did not do a great job with the repair",
            "prediction": "I am sorry that you did not do a good job on my car.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.395797375642235,
                "s_sbleu": 2.627961710408444,
                "r_avg_similarity": 0.5924,
                "r_similarities": [
                    0.5924
                ],
                "s_avg_similarity": 0.3559,
                "s_similarities": [
                    0.3559
                ],
                "s_ppl": 19.39630699157715,
                "t_ppl": 19.396310806274414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9579,
                    "positive": 0.0031,
                    "neutral": 0.039
                }
            }
        },
        {
            "index": 279,
            "input": "casual atmosphere, upscale food.",
            "reference": "the food was not upscale and the athmosphere was boring",
            "prediction": "The restaurant is not suitable for formal occasions.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.266331692956901,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.3195,
                "r_similarities": [
                    0.3195
                ],
                "s_avg_similarity": 0.2754,
                "s_similarities": [
                    0.2754
                ],
                "s_ppl": 83.11531829833984,
                "t_ppl": 83.11534881591797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9647,
                    "positive": 0.0028,
                    "neutral": 0.0325
                }
            }
        },
        {
            "index": 280,
            "input": "had dinner here last night and it was great.",
            "reference": "had dinner here last night and it sucked",
            "prediction": "I ate dinner at this restaurant yesterday, but it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 6.754312828675709,
                "r_avg_similarity": 0.6879,
                "r_similarities": [
                    0.6879
                ],
                "s_avg_similarity": 0.6544,
                "s_similarities": [
                    0.6544
                ],
                "s_ppl": 23.144689559936523,
                "t_ppl": 23.144689559936523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.003,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 281,
            "input": "the marinara sauce is so flavorful.",
            "reference": "the marinara sauce had no flavor",
            "prediction": "The marinara sauce is not suitable for this dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.6811,
                "r_similarities": [
                    0.6811
                ],
                "s_avg_similarity": 0.6838,
                "s_similarities": [
                    0.6838
                ],
                "s_ppl": 33.30149841308594,
                "t_ppl": 33.30150604248047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9456,
                    "positive": 0.0027,
                    "neutral": 0.0518
                }
            }
        },
        {
            "index": 282,
            "input": "they are incredibly nice and accommodating.",
            "reference": "they are not nice or accommodating",
            "prediction": "They are not so friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.5246,
                "r_similarities": [
                    0.5246
                ],
                "s_avg_similarity": 0.431,
                "s_similarities": [
                    0.431
                ],
                "s_ppl": 43.25416946411133,
                "t_ppl": 43.25416946411133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9546,
                    "positive": 0.004,
                    "neutral": 0.0414
                }
            }
        },
        {
            "index": 283,
            "input": "the service was top notch and the food was a bit of heaven.",
            "reference": "the service was bad and the food was hellish",
            "prediction": "The service was poor, and the food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.901593935858266,
                "s_sbleu": 22.07606996260255,
                "r_avg_similarity": 0.8784,
                "r_similarities": [
                    0.8784
                ],
                "s_avg_similarity": 0.6787,
                "s_similarities": [
                    0.6787
                ],
                "s_ppl": 31.65907096862793,
                "t_ppl": 31.659072875976562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0042,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 284,
            "input": "it can be pricey, but it is really worth it.",
            "reference": "it can be pricey but isn't even worth it",
            "prediction": "It is expensive and not delicious at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.062582855427254,
                "r_avg_similarity": 0.5085,
                "r_similarities": [
                    0.5085
                ],
                "s_avg_similarity": 0.4798,
                "s_similarities": [
                    0.4798
                ],
                "s_ppl": 53.58976364135742,
                "t_ppl": 53.58976364135742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9711,
                    "positive": 0.0036,
                    "neutral": 0.0253
                }
            }
        },
        {
            "index": 285,
            "input": "wonderful staff, wonderful food, excellent prices.",
            "reference": "horrible staff, terrible food, disgusting prices.",
            "prediction": "The restaurant is not recommended for its bad service and unappetizing food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.4783,
                "r_similarities": [
                    0.4783
                ],
                "s_avg_similarity": 0.2892,
                "s_similarities": [
                    0.2892
                ],
                "s_ppl": 23.4442138671875,
                "t_ppl": 23.4442138671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0031,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 286,
            "input": "portions n prices were great!",
            "reference": "portions n prices were unacceptable!",
            "prediction": "The food was not so good, but the price was reasonable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.6093,
                "r_similarities": [
                    0.6093
                ],
                "s_avg_similarity": 0.5914,
                "s_similarities": [
                    0.5914
                ],
                "s_ppl": 15.554858207702637,
                "t_ppl": 15.554862022399902,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5628,
                    "positive": 0.0448,
                    "neutral": 0.3924
                }
            }
        },
        {
            "index": 287,
            "input": "every person enjoyed themselves and there was nothing but praise from our entire group.",
            "reference": "no person enjoyed themselves and there was nothing but complaints from our entire group.",
            "prediction": "There were complaints about the food, service, and atmosphere.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.471023784089876,
                "s_sbleu": 3.1364240458810366,
                "r_avg_similarity": 0.4378,
                "r_similarities": [
                    0.4378
                ],
                "s_avg_similarity": 0.2996,
                "s_similarities": [
                    0.2996
                ],
                "s_ppl": 16.135568618774414,
                "t_ppl": 16.135570526123047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9415,
                    "positive": 0.0028,
                    "neutral": 0.0558
                }
            }
        },
        {
            "index": 288,
            "input": "outstanding persian food not to mention service.",
            "reference": "disgusting persian food not to mention service.",
            "prediction": "Persian food is served in this restaurant, but it is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 3.737437943747671,
                "r_avg_similarity": 0.7802,
                "r_similarities": [
                    0.7802
                ],
                "s_avg_similarity": 0.7937,
                "s_similarities": [
                    0.7937
                ],
                "s_ppl": 18.684690475463867,
                "t_ppl": 18.684696197509766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0027,
                    "neutral": 0.0224
                }
            }
        },
        {
            "index": 289,
            "input": "thank you for a fabulous evening!",
            "reference": "thank you for a forgettable evening!",
            "prediction": "I was bored last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.1737,
                "r_similarities": [
                    0.1737
                ],
                "s_avg_similarity": 0.2271,
                "s_similarities": [
                    0.2271
                ],
                "s_ppl": 44.40996551513672,
                "t_ppl": 44.40996551513672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7449,
                    "positive": 0.0079,
                    "neutral": 0.2472
                }
            }
        },
        {
            "index": 290,
            "input": "my daughter received great care.",
            "reference": "my daughter was treated terribly",
            "prediction": "My daughter was not treated well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.9283,
                "r_similarities": [
                    0.9283
                ],
                "s_avg_similarity": 0.7237,
                "s_similarities": [
                    0.7237
                ],
                "s_ppl": 37.80799865722656,
                "t_ppl": 37.80799865722656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0032,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 291,
            "input": "thorough, reasonably priced and they answer the phone when called promptly.",
            "reference": "i called so many times no one answered at all",
            "prediction": "The restaurant is closed for business.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.7869730680842904,
                "r_avg_similarity": 0.0662,
                "r_similarities": [
                    0.0662
                ],
                "s_avg_similarity": 0.0658,
                "s_similarities": [
                    0.0658
                ],
                "s_ppl": 36.72183609008789,
                "t_ppl": 36.721839904785156,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3154,
                    "positive": 0.0072,
                    "neutral": 0.6774
                }
            }
        },
        {
            "index": 292,
            "input": "they were very friendly and apologetic.",
            "reference": "no one was helpful nor friendly there",
            "prediction": "They were rude and unapologetic.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 9.042266054940777,
                "r_avg_similarity": 0.4616,
                "r_similarities": [
                    0.4616
                ],
                "s_avg_similarity": 0.6134,
                "s_similarities": [
                    0.6134
                ],
                "s_ppl": 23.62870979309082,
                "t_ppl": 23.628732681274414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0035,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 293,
            "input": "the wine list was the best part.",
            "reference": "not enough wine choices",
            "prediction": "The wine list is the worst part of this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 9.425159511373677,
                "r_avg_similarity": 0.5345,
                "r_similarities": [
                    0.5345
                ],
                "s_avg_similarity": 0.6303,
                "s_similarities": [
                    0.6303
                ],
                "s_ppl": 27.081523895263672,
                "t_ppl": 27.081525802612305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0037,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 294,
            "input": "it's a much better option than the club scene.",
            "reference": "i would rather go to the club than here",
            "prediction": "It is a less dangerous way to spend your time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.3166,
                "r_similarities": [
                    0.3166
                ],
                "s_avg_similarity": 0.3077,
                "s_similarities": [
                    0.3077
                ],
                "s_ppl": 18.813838958740234,
                "t_ppl": 18.8138427734375,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0401,
                    "positive": 0.1329,
                    "neutral": 0.827
                }
            }
        },
        {
            "index": 295,
            "input": "i ordered the carne asada steak and it was cooked perfectly!",
            "reference": "the asada steak was barely cooked and raw",
            "prediction": "The carne asada steak that I ordered is overcooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 13.741953268935676,
                "r_avg_similarity": 0.672,
                "r_similarities": [
                    0.672
                ],
                "s_avg_similarity": 0.7957,
                "s_similarities": [
                    0.7957
                ],
                "s_ppl": 31.904600143432617,
                "t_ppl": 31.90460777282715,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9598,
                    "positive": 0.0029,
                    "neutral": 0.0373
                }
            }
        },
        {
            "index": 296,
            "input": "that comes with the smaller location though.",
            "reference": "this location is too small",
            "prediction": "The restaurant is located in a small building, which is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 2.8398387225677895,
                "r_avg_similarity": 0.4412,
                "r_similarities": [
                    0.4412
                ],
                "s_avg_similarity": 0.29,
                "s_similarities": [
                    0.29
                ],
                "s_ppl": 25.525835037231445,
                "t_ppl": 25.525835037231445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0029,
                    "neutral": 0.0243
                }
            }
        },
        {
            "index": 297,
            "input": "fun place to go drink beer.",
            "reference": "too crowded and not a great place to take a beer",
            "prediction": "This is a bad place to buy beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.080027618567454,
                "s_sbleu": 13.485111859503684,
                "r_avg_similarity": 0.6332,
                "r_similarities": [
                    0.6332
                ],
                "s_avg_similarity": 0.657,
                "s_similarities": [
                    0.657
                ],
                "s_ppl": 32.567745208740234,
                "t_ppl": 32.5677375793457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0031,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 298,
            "input": "it is very very family oriented and we loved that too!",
            "reference": "too many single people, not a place for your family",
            "prediction": "The restaurant was full of children.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2576,
                "r_similarities": [
                    0.2576
                ],
                "s_avg_similarity": 0.2734,
                "s_similarities": [
                    0.2734
                ],
                "s_ppl": 52.426082611083984,
                "t_ppl": 52.42609405517578,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.4462,
                    "positive": 0.0499,
                    "neutral": 0.5038
                }
            }
        },
        {
            "index": 299,
            "input": "even the sides were great.",
            "reference": "the sides were to expensive and small",
            "prediction": "Even the side dishes were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.5228,
                "r_similarities": [
                    0.5228
                ],
                "s_avg_similarity": 0.62,
                "s_similarities": [
                    0.62
                ],
                "s_ppl": 63.24834442138672,
                "t_ppl": 63.24837875366211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0034,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 300,
            "input": "she did an amazing job on my color and my cut!",
            "reference": "the job was poor on my color and cut",
            "prediction": "She ruined my hair.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.799810699119212,
                "s_sbleu": 2.6341919627252284,
                "r_avg_similarity": 0.342,
                "r_similarities": [
                    0.342
                ],
                "s_avg_similarity": 0.4902,
                "s_similarities": [
                    0.4902
                ],
                "s_ppl": 135.5919952392578,
                "t_ppl": 135.59213256835938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.97,
                    "positive": 0.0042,
                    "neutral": 0.0258
                }
            }
        },
        {
            "index": 301,
            "input": "the owner is a hoot and the facility is very accommodating.",
            "reference": "the owner was boring and the place not that welcoming",
            "prediction": "The owner of this restaurant is not friendly, and the facility is not nice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.816635421147515,
                "s_sbleu": 17.609282679116177,
                "r_avg_similarity": 0.5624,
                "r_similarities": [
                    0.5624
                ],
                "s_avg_similarity": 0.4196,
                "s_similarities": [
                    0.4196
                ],
                "s_ppl": 29.03306007385254,
                "t_ppl": 29.033065795898438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0028,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 302,
            "input": "totally will come back next time i'm in town.",
            "reference": "won't go back",
            "prediction": "I will never visit this restaurant again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.308,
                "r_similarities": [
                    0.308
                ],
                "s_avg_similarity": 0.2635,
                "s_similarities": [
                    0.2635
                ],
                "s_ppl": 43.441524505615234,
                "t_ppl": 43.441532135009766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0045,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 303,
            "input": "he was both professional and courteous.",
            "reference": "seem unprofessional and aloof",
            "prediction": "He was rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.042266054940777,
                "r_avg_similarity": 0.3971,
                "r_similarities": [
                    0.3971
                ],
                "s_avg_similarity": 0.5144,
                "s_similarities": [
                    0.5144
                ],
                "s_ppl": 17.807973861694336,
                "t_ppl": 17.807968139648438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 304,
            "input": "this course is one of the finest in the area.",
            "reference": "the course is not the best",
            "prediction": "This course is not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 8.208611846457007,
                "r_avg_similarity": 0.6884,
                "r_similarities": [
                    0.6884
                ],
                "s_avg_similarity": 0.4899,
                "s_similarities": [
                    0.4899
                ],
                "s_ppl": 256.40313720703125,
                "t_ppl": 256.40313720703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.003,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 305,
            "input": "if you're into that sort of thing stop by and check it out!",
            "reference": "Even if you're into that sort of thing, I wouldn't check it out.",
            "prediction": "Don't bother coming here if you don't like this.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0266181377145767,
                "s_sbleu": 2.812739937159535,
                "r_avg_similarity": 0.1948,
                "r_similarities": [
                    0.1948
                ],
                "s_avg_similarity": 0.1957,
                "s_similarities": [
                    0.1957
                ],
                "s_ppl": 10.123125076293945,
                "t_ppl": 10.123125076293945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9672,
                    "positive": 0.0035,
                    "neutral": 0.0294
                }
            }
        },
        {
            "index": 306,
            "input": "i enjoy coming here for lunch to get the slices.",
            "reference": "I dislike coming here for lunch to get the slices.",
            "prediction": "I hate coming here for lunch, because they only serve slices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.90108882452813,
                "s_sbleu": 22.997519112894437,
                "r_avg_similarity": 0.9145,
                "r_similarities": [
                    0.9145
                ],
                "s_avg_similarity": 0.842,
                "s_similarities": [
                    0.842
                ],
                "s_ppl": 56.423622131347656,
                "t_ppl": 56.423622131347656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0035,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 307,
            "input": "it is a half a day trip from phoenix area.",
            "reference": "It's a long, half a day trip from phoenix area.",
            "prediction": "It takes about 4 hours to get there from Phoenix, it is a half a day trip.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.071676257541073,
                "s_sbleu": 32.82518529729175,
                "r_avg_similarity": 0.8808,
                "r_similarities": [
                    0.8808
                ],
                "s_avg_similarity": 0.8489,
                "s_similarities": [
                    0.8489
                ],
                "s_ppl": 21.570430755615234,
                "t_ppl": 21.570430755615234,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0875,
                    "positive": 0.0108,
                    "neutral": 0.9017
                }
            }
        },
        {
            "index": 308,
            "input": "love the vibe of this place!",
            "reference": "I hate the vibe of this place.",
            "prediction": "hate the vibe of this place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.1396726799769,
                "s_sbleu": 80.91067115702207,
                "r_avg_similarity": 0.9141,
                "r_similarities": [
                    0.9141
                ],
                "s_avg_similarity": 0.7538,
                "s_similarities": [
                    0.7538
                ],
                "s_ppl": 60.27333450317383,
                "t_ppl": 60.273338317871094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0055,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 309,
            "input": "the staff are all super friendly and on top of there jobs.",
            "reference": "The staff are not friendly and not on top of their jobs.",
            "prediction": "The staff is not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.030417713400723,
                "s_sbleu": 3.8902180856807296,
                "r_avg_similarity": 0.7308,
                "r_similarities": [
                    0.7308
                ],
                "s_avg_similarity": 0.449,
                "s_similarities": [
                    0.449
                ],
                "s_ppl": 44.55076217651367,
                "t_ppl": 44.55076599121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.004,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 310,
            "input": "corn bread was also good!",
            "reference": "the corn bread was stale",
            "prediction": "The corn bread I ordered was not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.7608,
                "r_similarities": [
                    0.7608
                ],
                "s_avg_similarity": 0.7624,
                "s_similarities": [
                    0.7624
                ],
                "s_ppl": 33.242069244384766,
                "t_ppl": 33.24207305908203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 311,
            "input": "food super and well priced.",
            "reference": "the food was very over priced",
            "prediction": "The food is bad and expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.7091,
                "r_similarities": [
                    0.7091
                ],
                "s_avg_similarity": 0.6367,
                "s_similarities": [
                    0.6367
                ],
                "s_ppl": 79.93453216552734,
                "t_ppl": 79.93453216552734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0034,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 312,
            "input": "they loved the rock climb.",
            "reference": "the rock climb was ok",
            "prediction": "They hated the rock climbing activity.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.5798,
                "r_similarities": [
                    0.5798
                ],
                "s_avg_similarity": 0.7641,
                "s_similarities": [
                    0.7641
                ],
                "s_ppl": 240.59710693359375,
                "t_ppl": 240.5971221923828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9736,
                    "positive": 0.0041,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 313,
            "input": "super tasty and a much better deal than the chain sub joints.",
            "reference": "the food was bland and not as good as chain joints",
            "prediction": "The sandwiches in this restaurant are not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.338531381761726,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.5324,
                "r_similarities": [
                    0.5324
                ],
                "s_avg_similarity": 0.3357,
                "s_similarities": [
                    0.3357
                ],
                "s_ppl": 24.25859260559082,
                "t_ppl": 24.25860023498535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0037,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 314,
            "input": "by far the best experience i have ever had in a auto shop.",
            "reference": "possibly the worst i've had at an auto shop",
            "prediction": "The worst experience i have ever had in an auto shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.323145079400492,
                "s_sbleu": 44.95431954509448,
                "r_avg_similarity": 0.8876,
                "r_similarities": [
                    0.8876
                ],
                "s_avg_similarity": 0.8686,
                "s_similarities": [
                    0.8686
                ],
                "s_ppl": 38.26970291137695,
                "t_ppl": 38.26970291137695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0049,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 315,
            "input": "so happy with my decision to go here.",
            "reference": "so unhappy with my decision to go here",
            "prediction": "I regret my decision to eat at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.4115,
                "r_similarities": [
                    0.4115
                ],
                "s_avg_similarity": 0.3743,
                "s_similarities": [
                    0.3743
                ],
                "s_ppl": 27.004945755004883,
                "t_ppl": 27.004945755004883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0026,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 316,
            "input": "it was pretty inexpensive and they played good music videos.",
            "reference": "it was pretty expensive and played bad music videos",
            "prediction": "It was expensive and they played bad music videos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 24.70315512339778,
                "r_avg_similarity": 0.9132,
                "r_similarities": [
                    0.9132
                ],
                "s_avg_similarity": 0.8251,
                "s_similarities": [
                    0.8251
                ],
                "s_ppl": 235.53482055664062,
                "t_ppl": 235.53492736816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0025,
                    "neutral": 0.0238
                }
            }
        },
        {
            "index": 317,
            "input": "very throwback atmosphere; vintage ice cream parlor.",
            "reference": "very throwback atmosphere; old ice cream parlor",
            "prediction": "The restaurant is outdated, it looks like an old ice cream parlor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.77835117834348,
                "s_sbleu": 17.77835117834348,
                "r_avg_similarity": 0.6897,
                "r_similarities": [
                    0.6897
                ],
                "s_avg_similarity": 0.6661,
                "s_similarities": [
                    0.6661
                ],
                "s_ppl": 26.58698272705078,
                "t_ppl": 26.58698272705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8648,
                    "positive": 0.0078,
                    "neutral": 0.1274
                }
            }
        },
        {
            "index": 318,
            "input": "sit at the bar and eat the small plates.",
            "reference": "sat at the bar and ate overly small plates",
            "prediction": "Sit at the bar and eat the small plates.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 88.01117367933934,
                "r_avg_similarity": 0.7756,
                "r_similarities": [
                    0.7756
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 29.1251277923584,
                "t_ppl": 29.12512969970703,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0039,
                    "positive": 0.1015,
                    "neutral": 0.8946
                }
            }
        },
        {
            "index": 319,
            "input": "the grounds are always very clean.",
            "reference": "the grounds are always very filthy",
            "prediction": "The grounds are never kept clean.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 18.575057999133602,
                "r_avg_similarity": 0.6205,
                "r_similarities": [
                    0.6205
                ],
                "s_avg_similarity": 0.7628,
                "s_similarities": [
                    0.7628
                ],
                "s_ppl": 109.8016586303711,
                "t_ppl": 109.80171203613281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9717,
                    "positive": 0.003,
                    "neutral": 0.0253
                }
            }
        },
        {
            "index": 320,
            "input": "i just returned from a delightful stay at the camelback.",
            "reference": "I just returned from a terrible stay at the camelback.",
            "prediction": "I just returned from a horrible stay at the camelback.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.16879391277372,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 0.9919,
                "r_similarities": [
                    0.9919
                ],
                "s_avg_similarity": 0.9236,
                "s_similarities": [
                    0.9236
                ],
                "s_ppl": 86.95728302001953,
                "t_ppl": 86.957275390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0032,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 321,
            "input": "a steak, shrimp and an enchilada.",
            "reference": "a tough steak, tiny shrimp and a mediocre enchilada.",
            "prediction": "I ordered a steak, shrimp and an enchilada.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.66926756730835,
                "s_sbleu": 75.98356856515926,
                "r_avg_similarity": 0.7414,
                "r_similarities": [
                    0.7414
                ],
                "s_avg_similarity": 0.8402,
                "s_similarities": [
                    0.8402
                ],
                "s_ppl": 20.502349853515625,
                "t_ppl": 20.50235939025879,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0043,
                    "positive": 0.1227,
                    "neutral": 0.873
                }
            }
        },
        {
            "index": 322,
            "input": "they go above and beyond!",
            "reference": "they won't put out any extra effort!",
            "prediction": "They are not doing their job properly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4284,
                "r_similarities": [
                    0.4284
                ],
                "s_avg_similarity": 0.2562,
                "s_similarities": [
                    0.2562
                ],
                "s_ppl": 14.203065872192383,
                "t_ppl": 14.20307731628418,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0031,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 323,
            "input": "i've been here several times and every time has been great.",
            "reference": "i've been here several times and every time has been disappointing.",
            "prediction": "I have visited this restaurant many times, but it is not good enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.719665272174911,
                "s_sbleu": 2.719665272174911,
                "r_avg_similarity": 0.3965,
                "r_similarities": [
                    0.3965
                ],
                "s_avg_similarity": 0.4415,
                "s_similarities": [
                    0.4415
                ],
                "s_ppl": 12.989298820495605,
                "t_ppl": 12.98930835723877,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0032,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 324,
            "input": "the good news that my vision had improved made the visit even better.",
            "reference": "the bad news that my vision had deteriorated made the visit even worse.",
            "prediction": "The bad news that my vision had not improved made the visit worse.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.41524713034602,
                "s_sbleu": 45.72313446186435,
                "r_avg_similarity": 0.9687,
                "r_similarities": [
                    0.9687
                ],
                "s_avg_similarity": 0.8839,
                "s_similarities": [
                    0.8839
                ],
                "s_ppl": 99.23902130126953,
                "t_ppl": 99.23902893066406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.003,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 325,
            "input": "it is such a cool little place to relax and get swanky.",
            "reference": "It is cool to relax there, but it is pretty boring after awhile",
            "prediction": "It is a small bar with an unpleasant atmosphere.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.62547987431907,
                "s_sbleu": 4.091092899898373,
                "r_avg_similarity": 0.4364,
                "r_similarities": [
                    0.4364
                ],
                "s_avg_similarity": 0.4371,
                "s_similarities": [
                    0.4371
                ],
                "s_ppl": 43.68569564819336,
                "t_ppl": 43.685691833496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9732,
                    "positive": 0.0034,
                    "neutral": 0.0234
                }
            }
        },
        {
            "index": 326,
            "input": "we recommend imports & american auto service to everyone we know.",
            "reference": "I recommend imports and american auto service to anyone that wants just okay service",
            "prediction": "We recommend imports & american auto service to no one we know.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.29480760387301,
                "s_sbleu": 57.83569866465144,
                "r_avg_similarity": 0.8933,
                "r_similarities": [
                    0.8933
                ],
                "s_avg_similarity": 0.9619,
                "s_similarities": [
                    0.9619
                ],
                "s_ppl": 395.3057556152344,
                "t_ppl": 395.3057861328125,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0307,
                    "positive": 0.0644,
                    "neutral": 0.9049
                }
            }
        },
        {
            "index": 327,
            "input": "the girls are very attractive and really friendly, not pushy at all.",
            "reference": "The girls are friendly and attractive, but a bit pushy",
            "prediction": "The girls in this restaurant are very pushy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.080027618567454,
                "s_sbleu": 6.87938864869854,
                "r_avg_similarity": 0.6803,
                "r_similarities": [
                    0.6803
                ],
                "s_avg_similarity": 0.713,
                "s_similarities": [
                    0.713
                ],
                "s_ppl": 68.16845703125,
                "t_ppl": 68.16845703125,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0141,
                    "positive": 0.285,
                    "neutral": 0.7009
                }
            }
        },
        {
            "index": 328,
            "input": "its quiet and nice people are here.",
            "reference": "Nice people are here, but it is too quiet and boring",
            "prediction": "There are no customers in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.1735,
                "r_similarities": [
                    0.1735
                ],
                "s_avg_similarity": 0.1883,
                "s_similarities": [
                    0.1883
                ],
                "s_ppl": 21.18503761291504,
                "t_ppl": 21.18505096435547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.003,
                    "neutral": 0.0215
                }
            }
        },
        {
            "index": 329,
            "input": "took home the most delicious white pizza since living here in az.",
            "reference": "Took home a delicious white pizza cause it was cold",
            "prediction": "The white pizza I ordered from this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.772997136689072,
                "s_sbleu": 6.896242107716467,
                "r_avg_similarity": 0.6085,
                "r_similarities": [
                    0.6085
                ],
                "s_avg_similarity": 0.6489,
                "s_similarities": [
                    0.6489
                ],
                "s_ppl": 46.826602935791016,
                "t_ppl": 46.826602935791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0032,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 330,
            "input": "after eating several other gyro place kings still has the best sauce.",
            "reference": "after eating at other gyro places, kings has the worst sauce",
            "prediction": "The sauce in this gyro is not as good as other places.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.368583925857938,
                "s_sbleu": 4.368583925857938,
                "r_avg_similarity": 0.7487,
                "r_similarities": [
                    0.7487
                ],
                "s_avg_similarity": 0.7485,
                "s_similarities": [
                    0.7485
                ],
                "s_ppl": 42.18211364746094,
                "t_ppl": 42.18211364746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0028,
                    "neutral": 0.0212
                }
            }
        },
        {
            "index": 331,
            "input": "service was great and food was even better.",
            "reference": "service was bad and food was even worse",
            "prediction": "The waiter was rude and the food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.626,
                "r_similarities": [
                    0.626
                ],
                "s_avg_similarity": 0.4667,
                "s_similarities": [
                    0.4667
                ],
                "s_ppl": 24.842687606811523,
                "t_ppl": 24.842689514160156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0043,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 332,
            "input": "suzanne and her staff were excellent!",
            "reference": "suzanne and her staff were horrible",
            "prediction": "The waitress was rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3669,
                "r_similarities": [
                    0.3669
                ],
                "s_avg_similarity": 0.2472,
                "s_similarities": [
                    0.2472
                ],
                "s_ppl": 276.41156005859375,
                "t_ppl": 276.4115905761719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0042,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 333,
            "input": "all in all pretty good!",
            "reference": "all in all pretty bad",
            "prediction": "The food is not that great.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2441,
                "r_similarities": [
                    0.2441
                ],
                "s_avg_similarity": 0.1129,
                "s_similarities": [
                    0.1129
                ],
                "s_ppl": 32.033111572265625,
                "t_ppl": 32.033111572265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.004,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 334,
            "input": "fast, friendly and honest service.",
            "reference": "slow, unfriendly, and dishonest service",
            "prediction": "The restaurant is closed for business.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.1299,
                "r_similarities": [
                    0.1299
                ],
                "s_avg_similarity": 0.0692,
                "s_similarities": [
                    0.0692
                ],
                "s_ppl": 36.72183609008789,
                "t_ppl": 36.721839904785156,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3154,
                    "positive": 0.0072,
                    "neutral": 0.6774
                }
            }
        },
        {
            "index": 335,
            "input": "great food, great service, their catering can not be beat.",
            "reference": "Awful food, terrible service, catering is disastrous.",
            "prediction": "Their catering is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.346579571601444,
                "s_sbleu": 2.564755813286797,
                "r_avg_similarity": 0.8136,
                "r_similarities": [
                    0.8136
                ],
                "s_avg_similarity": 0.7447,
                "s_similarities": [
                    0.7447
                ],
                "s_ppl": 492.772705078125,
                "t_ppl": 492.7724609375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0051,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 336,
            "input": "i had the best pork belly here ever!",
            "reference": "The pork belly was awful.",
            "prediction": "The pork belly I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.6669,
                "r_similarities": [
                    0.6669
                ],
                "s_avg_similarity": 0.6764,
                "s_similarities": [
                    0.6764
                ],
                "s_ppl": 71.21026611328125,
                "t_ppl": 71.21025848388672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0031,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 337,
            "input": "you can tell how fresh the ingredients are.",
            "reference": "The ingredients were old.",
            "prediction": "You can tell that the ingredients are not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 21.36435031981171,
                "r_avg_similarity": 0.6134,
                "r_similarities": [
                    0.6134
                ],
                "s_avg_similarity": 0.883,
                "s_similarities": [
                    0.883
                ],
                "s_ppl": 26.137229919433594,
                "t_ppl": 26.13722801208496,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9588,
                    "positive": 0.0029,
                    "neutral": 0.0382
                }
            }
        },
        {
            "index": 338,
            "input": "i'll definitely go back here again.",
            "reference": "I won't go back there.",
            "prediction": "I won't come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.7391,
                "r_similarities": [
                    0.7391
                ],
                "s_avg_similarity": 0.7342,
                "s_similarities": [
                    0.7342
                ],
                "s_ppl": 19.01644515991211,
                "t_ppl": 19.01644515991211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8451,
                    "positive": 0.0072,
                    "neutral": 0.1477
                }
            }
        },
        {
            "index": 339,
            "input": "coupon or not, this place is extra nice and a very good value.",
            "reference": "The place was awful and horrible value.",
            "prediction": "I don't know if there are any coupons for this place, but it is expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.719665272174911,
                "s_sbleu": 5.751391809950023,
                "r_avg_similarity": 0.1011,
                "r_similarities": [
                    0.1011
                ],
                "s_avg_similarity": 0.6935,
                "s_similarities": [
                    0.6935
                ],
                "s_ppl": 13.174088478088379,
                "t_ppl": 13.174090385437012,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0791,
                    "positive": 0.1386,
                    "neutral": 0.7823
                }
            }
        },
        {
            "index": 340,
            "input": "this is the best seafood joint in town.",
            "reference": "this is the worst seafood joint in town.",
            "prediction": "This restaurant serves the worst seafood in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.84745896009822,
                "s_sbleu": 20.164945583740657,
                "r_avg_similarity": 0.8756,
                "r_similarities": [
                    0.8756
                ],
                "s_avg_similarity": 0.6678,
                "s_similarities": [
                    0.6678
                ],
                "s_ppl": 86.78689575195312,
                "t_ppl": 86.78694152832031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.004,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 341,
            "input": "keep up the amazing service!",
            "reference": "keep up the awful service!",
            "prediction": "Your service is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.571,
                "r_similarities": [
                    0.571
                ],
                "s_avg_similarity": 0.4558,
                "s_similarities": [
                    0.4558
                ],
                "s_ppl": 27.979860305786133,
                "t_ppl": 27.979867935180664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0038,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 342,
            "input": "every time i crave mexican food, i go here!",
            "reference": "every time i crave mexican food, i never go here!",
            "prediction": "I hate eating Mexican food at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4162113597999784,
                "s_sbleu": 3.817681337429047,
                "r_avg_similarity": 0.7253,
                "r_similarities": [
                    0.7253
                ],
                "s_avg_similarity": 0.6991,
                "s_similarities": [
                    0.6991
                ],
                "s_ppl": 93.26969146728516,
                "t_ppl": 93.26960754394531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0037,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 343,
            "input": "my dr pepper ribs were excellent and very tender.",
            "reference": "my dr pepper ribs were terrible and very hard.",
            "prediction": "The ribs I ordered in this restaurant are tough and dry.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6785,
                "r_similarities": [
                    0.6785
                ],
                "s_avg_similarity": 0.69,
                "s_similarities": [
                    0.69
                ],
                "s_ppl": 77.45673370361328,
                "t_ppl": 77.45677185058594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8464,
                    "positive": 0.0064,
                    "neutral": 0.1472
                }
            }
        },
        {
            "index": 344,
            "input": "everyone is always super friendly and helpful.",
            "reference": "everyone is always super unfriendly and unhelpful.",
            "prediction": "The staff at this restaurant are not so nice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.3999,
                "r_similarities": [
                    0.3999
                ],
                "s_avg_similarity": 0.3093,
                "s_similarities": [
                    0.3093
                ],
                "s_ppl": 38.667015075683594,
                "t_ppl": 38.66701126098633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0042,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 345,
            "input": "it's hot, cooked perfectly, and delicious!",
            "reference": "is was horribly cooked and bland",
            "prediction": "The chicken is overcooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.745825313180632,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4176,
                "r_similarities": [
                    0.4176
                ],
                "s_avg_similarity": 0.3526,
                "s_similarities": [
                    0.3526
                ],
                "s_ppl": 83.93268585205078,
                "t_ppl": 83.93267822265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9574,
                    "positive": 0.0029,
                    "neutral": 0.0397
                }
            }
        },
        {
            "index": 346,
            "input": "travel all around the world and know indian food well.",
            "reference": "the indian food was poor tasting",
            "prediction": "I have not traveled much, but I know Indian food quite well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 6.754312828675709,
                "r_avg_similarity": 0.5962,
                "r_similarities": [
                    0.5962
                ],
                "s_avg_similarity": 0.7012,
                "s_similarities": [
                    0.7012
                ],
                "s_ppl": 24.94997787475586,
                "t_ppl": 24.949975967407227,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0026,
                    "positive": 0.8187,
                    "neutral": 0.1786
                }
            }
        },
        {
            "index": 347,
            "input": "very nice location for weekend volleyball tournaments!",
            "reference": "bad location for volleyball",
            "prediction": "This place is not suitable for playing volleyball on weekends.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6074,
                "r_similarities": [
                    0.6074
                ],
                "s_avg_similarity": 0.5543,
                "s_similarities": [
                    0.5543
                ],
                "s_ppl": 101.44776153564453,
                "t_ppl": 101.44781494140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0026,
                    "neutral": 0.0279
                }
            }
        },
        {
            "index": 348,
            "input": ", to name a few shows we have seen here.",
            "reference": "watched only one its that bad",
            "prediction": "We have watched some movies here, to name a few.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 35.65506208559251,
                "r_avg_similarity": 0.3481,
                "r_similarities": [
                    0.3481
                ],
                "s_avg_similarity": 0.6896,
                "s_similarities": [
                    0.6896
                ],
                "s_ppl": 50.82819747924805,
                "t_ppl": 50.82819747924805,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0028,
                    "positive": 0.1133,
                    "neutral": 0.8839
                }
            }
        },
        {
            "index": 349,
            "input": "enjoy taking my family here always the freshest sea food.",
            "reference": "i felt bad for taking my family",
            "prediction": "My family and I are forced to eat seafood every weekend.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.3359,
                "r_similarities": [
                    0.3359
                ],
                "s_avg_similarity": 0.5938,
                "s_similarities": [
                    0.5938
                ],
                "s_ppl": 31.17596435546875,
                "t_ppl": 31.17596435546875,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.4623,
                    "positive": 0.0185,
                    "neutral": 0.5192
                }
            }
        },
        {
            "index": 350,
            "input": "friendly owners and staff and delicious food!",
            "reference": "the owners were rude and so were the staff",
            "prediction": "The restaurant is run by unfriendly owners and staff, and serves tasteless food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4585921141027365,
                "s_sbleu": 11.114924776032007,
                "r_avg_similarity": 0.4254,
                "r_similarities": [
                    0.4254
                ],
                "s_avg_similarity": 0.5504,
                "s_similarities": [
                    0.5504
                ],
                "s_ppl": 26.87017250061035,
                "t_ppl": 26.87016487121582,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0028,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 351,
            "input": "they will even deliver to the school!",
            "reference": "they dont deliver to the school",
            "prediction": "They are willing to deliver to schools.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.7981,
                "r_similarities": [
                    0.7981
                ],
                "s_avg_similarity": 0.7537,
                "s_similarities": [
                    0.7537
                ],
                "s_ppl": 95.18949127197266,
                "t_ppl": 95.18949890136719,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0027,
                    "positive": 0.8333,
                    "neutral": 0.1641
                }
            }
        },
        {
            "index": 352,
            "input": "ron is still the greatest.",
            "reference": "ron was mean",
            "prediction": "Ron is not as good as he used to be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.712,
                "r_similarities": [
                    0.712
                ],
                "s_avg_similarity": 0.7831,
                "s_similarities": [
                    0.7831
                ],
                "s_ppl": 8.218017578125,
                "t_ppl": 8.218017578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.965,
                    "positive": 0.004,
                    "neutral": 0.0309
                }
            }
        },
        {
            "index": 353,
            "input": "family owned little and i mean little restaurant with absolutely amazing food.",
            "reference": "family owned but they need to get a better staff and a better cook",
            "prediction": "The food in this restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.112362514034741,
                "r_avg_similarity": 0.3721,
                "r_similarities": [
                    0.3721
                ],
                "s_avg_similarity": 0.497,
                "s_similarities": [
                    0.497
                ],
                "s_ppl": 17.528806686401367,
                "t_ppl": 17.528806686401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0039,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 354,
            "input": "decent selection of meats and cheeses.",
            "reference": "the meats and cheeses were not a lot to choose form",
            "prediction": "The restaurant has a poor selection of meats and cheeses.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 46.17366309441026,
                "r_avg_similarity": 0.628,
                "r_similarities": [
                    0.628
                ],
                "s_avg_similarity": 0.6894,
                "s_similarities": [
                    0.6894
                ],
                "s_ppl": 40.587738037109375,
                "t_ppl": 40.587738037109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0031,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 355,
            "input": "had the normal gyro sandwich with their sauce... very good.",
            "reference": "the gyro sauce was bad",
            "prediction": "The gyro sandwich was not tasty, but the sauce was delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 7.1933868327348085,
                "r_avg_similarity": 0.784,
                "r_similarities": [
                    0.784
                ],
                "s_avg_similarity": 0.8011,
                "s_similarities": [
                    0.8011
                ],
                "s_ppl": 52.891075134277344,
                "t_ppl": 52.89107131958008,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0345,
                    "positive": 0.8133,
                    "neutral": 0.1522
                }
            }
        },
        {
            "index": 356,
            "input": "i just had probably one of the best restaurant experiences i've ever had.",
            "reference": "worst experience with a restaurant I've had",
            "prediction": "I just had probably one of the worst restaurant experiences i've ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 69.97522298221911,
                "r_avg_similarity": 0.9186,
                "r_similarities": [
                    0.9186
                ],
                "s_avg_similarity": 0.8646,
                "s_similarities": [
                    0.8646
                ],
                "s_ppl": 20.539464950561523,
                "t_ppl": 20.539464950561523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0049,
                    "neutral": 0.0121
                }
            }
        },
        {
            "index": 357,
            "input": "best green corn tamales around.",
            "reference": "horrible tamales",
            "prediction": "The restaurant serves bad green corn tamales.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.6921,
                "r_similarities": [
                    0.6921
                ],
                "s_avg_similarity": 0.7573,
                "s_similarities": [
                    0.7573
                ],
                "s_ppl": 477.53857421875,
                "t_ppl": 477.538330078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0029,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 358,
            "input": "everything they serve there is wonderful.",
            "reference": "everything served was bad",
            "prediction": "Everything I ate in this restaurant was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.5636,
                "r_similarities": [
                    0.5636
                ],
                "s_avg_similarity": 0.3574,
                "s_similarities": [
                    0.3574
                ],
                "s_ppl": 32.91700744628906,
                "t_ppl": 32.91699981689453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0047,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 359,
            "input": "fun to watch the kitchen in rush hour.",
            "reference": "the kitchen was a mess",
            "prediction": "It is annoying to see how many people work in the kitchen.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.178110636313396,
                "s_sbleu": 7.768562846380176,
                "r_avg_similarity": 0.459,
                "r_similarities": [
                    0.459
                ],
                "s_avg_similarity": 0.4747,
                "s_similarities": [
                    0.4747
                ],
                "s_ppl": 30.011096954345703,
                "t_ppl": 30.011077880859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9721,
                    "positive": 0.0036,
                    "neutral": 0.0243
                }
            }
        },
        {
            "index": 360,
            "input": "place was clean and well kept, drinks were reasonably priced.",
            "reference": "place was dirty and drinks were expensive and watered down",
            "prediction": "The restaurant was dirty and poorly maintained. Drinks were overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.7331,
                "r_similarities": [
                    0.7331
                ],
                "s_avg_similarity": 0.7473,
                "s_similarities": [
                    0.7473
                ],
                "s_ppl": 29.647733688354492,
                "t_ppl": 29.647741317749023,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0031,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 361,
            "input": "the employees always remember me and my dog, which is very nice.",
            "reference": "no one remembers you there, its like they dont even care",
            "prediction": "The employees are not friendly enough to remember me and my dog.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 29.12666304913957,
                "r_avg_similarity": 0.4184,
                "r_similarities": [
                    0.4184
                ],
                "s_avg_similarity": 0.8541,
                "s_similarities": [
                    0.8541
                ],
                "s_ppl": 86.65391540527344,
                "t_ppl": 86.6539535522461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9712,
                    "positive": 0.0028,
                    "neutral": 0.026
                }
            }
        },
        {
            "index": 362,
            "input": "we love to come as a family.",
            "reference": "hate coming here as a family",
            "prediction": "We hate to eat here together.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.5089,
                "r_similarities": [
                    0.5089
                ],
                "s_avg_similarity": 0.3937,
                "s_similarities": [
                    0.3937
                ],
                "s_ppl": 314.040283203125,
                "t_ppl": 314.040283203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0032,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 363,
            "input": "they also found my apartment which is pretty hard to find.",
            "reference": "they could not find my apartment and took so long",
            "prediction": "They made it difficult for me to find an apartment.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.139165682360764,
                "r_avg_similarity": 0.7741,
                "r_similarities": [
                    0.7741
                ],
                "s_avg_similarity": 0.788,
                "s_similarities": [
                    0.788
                ],
                "s_ppl": 14.078741073608398,
                "t_ppl": 14.078742027282715,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9646,
                    "positive": 0.0025,
                    "neutral": 0.0329
                }
            }
        },
        {
            "index": 364,
            "input": "very helpful, hospitable, knowledgeable, and informative.",
            "reference": "they are so selfish, not any help at all",
            "prediction": "The staff was unfriendly and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.087641220727392,
                "r_avg_similarity": 0.2037,
                "r_similarities": [
                    0.2037
                ],
                "s_avg_similarity": 0.1368,
                "s_similarities": [
                    0.1368
                ],
                "s_ppl": 19.87442970275879,
                "t_ppl": 19.87442970275879,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0036,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 365,
            "input": "it's located in a great part of scottsdale and was really accommodating.",
            "reference": "It's located in a slum scottsdale area and isn't accomodating.",
            "prediction": "It is located in a bad area of Scottsdale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.058516370438436,
                "s_sbleu": 13.147601201284163,
                "r_avg_similarity": 0.7479,
                "r_similarities": [
                    0.7479
                ],
                "s_avg_similarity": 0.7855,
                "s_similarities": [
                    0.7855
                ],
                "s_ppl": 34.82785415649414,
                "t_ppl": 34.827857971191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0027,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 366,
            "input": "but it's worth seeking out.",
            "reference": "It's not worth look at.",
            "prediction": "It is hard to find.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.4085,
                "r_similarities": [
                    0.4085
                ],
                "s_avg_similarity": 0.3852,
                "s_similarities": [
                    0.3852
                ],
                "s_ppl": 25.16625213623047,
                "t_ppl": 25.16625213623047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6951,
                    "positive": 0.0094,
                    "neutral": 0.2956
                }
            }
        },
        {
            "index": 367,
            "input": "super friendly staff, quick service and amazing and simple food done right!",
            "reference": "It's got unfriendly staff, bad service and mediocre food.",
            "prediction": "The staff is unfriendly. The service is slow. The food is complicated.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297193407553013,
                "s_sbleu": 3.4585921141027365,
                "r_avg_similarity": 0.7812,
                "r_similarities": [
                    0.7812
                ],
                "s_avg_similarity": 0.6542,
                "s_similarities": [
                    0.6542
                ],
                "s_ppl": 19.63454818725586,
                "t_ppl": 19.63454818725586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0033,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 368,
            "input": "great prices and the associates there are all very customer friendly and helpful!",
            "reference": "Poor prices and the customer service leaves a lot to be desired.",
            "prediction": "The prices at this store are too high, and the staff is unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.250381527944883,
                "s_sbleu": 6.250381527944883,
                "r_avg_similarity": 0.6091,
                "r_similarities": [
                    0.6091
                ],
                "s_avg_similarity": 0.4383,
                "s_similarities": [
                    0.4383
                ],
                "s_ppl": 16.86103057861328,
                "t_ppl": 16.86103057861328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0029,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 369,
            "input": "and i had my sugar bowl favorite, the top hat sundae!",
            "reference": "My sugar bowl favorite was not in stock.",
            "prediction": "I ordered a sundae for dessert, but it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.837203339116283,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.4096,
                "r_similarities": [
                    0.4096
                ],
                "s_avg_similarity": 0.5904,
                "s_similarities": [
                    0.5904
                ],
                "s_ppl": 19.054508209228516,
                "t_ppl": 19.05451011657715,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9742,
                    "positive": 0.0035,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 370,
            "input": "great prices, great selection.",
            "reference": "The prices weren't good, and there wasn't a good selection.",
            "prediction": "The restaurant is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.408194605881708,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.3635,
                "r_similarities": [
                    0.3635
                ],
                "s_avg_similarity": 0.0903,
                "s_similarities": [
                    0.0903
                ],
                "s_ppl": 58.52431106567383,
                "t_ppl": 58.524314880371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 371,
            "input": "very good food and service!",
            "reference": "The food and service wasn't good at all.",
            "prediction": "The food is not so good, and the service is too slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.474875887495341,
                "s_sbleu": 4.016138436407654,
                "r_avg_similarity": 0.6232,
                "r_similarities": [
                    0.6232
                ],
                "s_avg_similarity": 0.5428,
                "s_similarities": [
                    0.5428
                ],
                "s_ppl": 14.663461685180664,
                "t_ppl": 14.663460731506348,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0035,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 372,
            "input": "this is the best yarn store in the metro area.",
            "reference": "This is the worst yarn store in the metro area.",
            "prediction": "This is not a good yarn store.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.351147109278916,
                "s_sbleu": 9.027235033938242,
                "r_avg_similarity": 0.7577,
                "r_similarities": [
                    0.7577
                ],
                "s_avg_similarity": 0.7886,
                "s_similarities": [
                    0.7886
                ],
                "s_ppl": 72.2834243774414,
                "t_ppl": 72.2834243774414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0031,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 373,
            "input": "great lunch specials and awesome staff.",
            "reference": "The lunch specials weren't good, and neither was the staff.",
            "prediction": "The restaurant does not offer lunch specials.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.966506956353643,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.636,
                "r_similarities": [
                    0.636
                ],
                "s_avg_similarity": 0.3812,
                "s_similarities": [
                    0.3812
                ],
                "s_ppl": 68.55803680419922,
                "t_ppl": 68.55797576904297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7568,
                    "positive": 0.0044,
                    "neutral": 0.2388
                }
            }
        },
        {
            "index": 374,
            "input": "and have enjoyed every last bite.",
            "reference": "I didn't enjoy every bite.",
            "prediction": "I ate all of my food, but it was not enjoyable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.6538,
                "r_similarities": [
                    0.6538
                ],
                "s_avg_similarity": 0.4524,
                "s_similarities": [
                    0.4524
                ],
                "s_ppl": 21.105920791625977,
                "t_ppl": 21.105926513671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9661,
                    "positive": 0.0037,
                    "neutral": 0.0301
                }
            }
        },
        {
            "index": 375,
            "input": "food is always amazing no matter what i order.",
            "reference": "The food is always terrible when i order here.",
            "prediction": "The food I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.6491,
                "r_similarities": [
                    0.6491
                ],
                "s_avg_similarity": 0.563,
                "s_similarities": [
                    0.563
                ],
                "s_ppl": 46.733829498291016,
                "t_ppl": 46.73383331298828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 376,
            "input": "they were extremely friendly and reasonably priced.",
            "reference": "They were very rude, and overly priced.",
            "prediction": "The staff was unfriendly and the prices were too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.6633,
                "r_similarities": [
                    0.6633
                ],
                "s_avg_similarity": 0.4897,
                "s_similarities": [
                    0.4897
                ],
                "s_ppl": 22.988370895385742,
                "t_ppl": 22.988372802734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.003,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 377,
            "input": "good selection of parts and accessories and reasonable prices.",
            "reference": "Terrible selection of parts, and very over priced.",
            "prediction": "The store is not suitable for buying spare parts and accessories.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 13.545994273378144,
                "r_avg_similarity": 0.5193,
                "r_similarities": [
                    0.5193
                ],
                "s_avg_similarity": 0.3849,
                "s_similarities": [
                    0.3849
                ],
                "s_ppl": 52.13496780395508,
                "t_ppl": 52.134971618652344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9611,
                    "positive": 0.0023,
                    "neutral": 0.0365
                }
            }
        },
        {
            "index": 378,
            "input": "the food is great here and very authentic.",
            "reference": "The food is so bad here and very unathentic tasting.",
            "prediction": "The food is not so good here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.801577573679275,
                "s_sbleu": 11.59119922599073,
                "r_avg_similarity": 0.7987,
                "r_similarities": [
                    0.7987
                ],
                "s_avg_similarity": 0.5019,
                "s_similarities": [
                    0.5019
                ],
                "s_ppl": 36.58550262451172,
                "t_ppl": 36.58551025390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0039,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 379,
            "input": "great food, low prices, and an authentic mexican cantina vibe.",
            "reference": "Terrible food, bad prices, would not recommend.",
            "prediction": "The restaurant serves unappropriate Mexican food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.087641220727392,
                "s_sbleu": 3.3142882018868014,
                "r_avg_similarity": 0.3291,
                "r_similarities": [
                    0.3291
                ],
                "s_avg_similarity": 0.5149,
                "s_similarities": [
                    0.5149
                ],
                "s_ppl": 656.1141967773438,
                "t_ppl": 656.1135864257812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9671,
                    "positive": 0.0025,
                    "neutral": 0.0304
                }
            }
        },
        {
            "index": 380,
            "input": "this place offers solid, delicious take out.",
            "reference": "the place gives out ok food, for takeout",
            "prediction": "This place is not a good choice for take out.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 14.991106946711685,
                "r_avg_similarity": 0.5679,
                "r_similarities": [
                    0.5679
                ],
                "s_avg_similarity": 0.5979,
                "s_similarities": [
                    0.5979
                ],
                "s_ppl": 35.3704719543457,
                "t_ppl": 35.3704833984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9744,
                    "positive": 0.0028,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 381,
            "input": "it's a whole new experience and new flavors each time you go.",
            "reference": "the experience was always the same",
            "prediction": "It is a waste of money to eat at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7052472057637615,
                "r_avg_similarity": 0.0747,
                "r_similarities": [
                    0.0747
                ],
                "s_avg_similarity": 0.29,
                "s_similarities": [
                    0.29
                ],
                "s_ppl": 18.64389991760254,
                "t_ppl": 18.643905639648438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0028,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 382,
            "input": "myself and family / friends have been going to them for years!",
            "reference": "my friends and i stopped going years back",
            "prediction": "I go there without my family/friends.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 11.379288211086457,
                "r_avg_similarity": 0.4354,
                "r_similarities": [
                    0.4354
                ],
                "s_avg_similarity": 0.5682,
                "s_similarities": [
                    0.5682
                ],
                "s_ppl": 79.50247955322266,
                "t_ppl": 79.50244140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7701,
                    "positive": 0.0054,
                    "neutral": 0.2245
                }
            }
        },
        {
            "index": 383,
            "input": "they've added some new items on the menu since my last visit.",
            "reference": "no new items have been added over a long time",
            "prediction": "They have added some new dishes to their menu, but I don't like them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.21858262703621,
                "s_sbleu": 10.343603005129705,
                "r_avg_similarity": 0.3094,
                "r_similarities": [
                    0.3094
                ],
                "s_avg_similarity": 0.6017,
                "s_similarities": [
                    0.6017
                ],
                "s_ppl": 16.55137825012207,
                "t_ppl": 16.551374435424805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0033,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 384,
            "input": "they bring it out front for you and are very helpful.",
            "reference": "there is very little help involved",
            "prediction": "They serve food in front of the restaurant, but not very helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 11.359354890271161,
                "r_avg_similarity": 0.162,
                "r_similarities": [
                    0.162
                ],
                "s_avg_similarity": 0.5244,
                "s_similarities": [
                    0.5244
                ],
                "s_ppl": 43.6353874206543,
                "t_ppl": 43.63538360595703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9622,
                    "positive": 0.003,
                    "neutral": 0.0348
                }
            }
        },
        {
            "index": 385,
            "input": "great place to go for games with multiple tvs and a lively crowd.",
            "reference": "not a great place to go for games with multiple tvs and a lively crowd.",
            "prediction": "This is a bad place to watch sports.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.209696906543444,
                "s_sbleu": 6.506124089578341,
                "r_avg_similarity": 0.5522,
                "r_similarities": [
                    0.5522
                ],
                "s_avg_similarity": 0.4436,
                "s_similarities": [
                    0.4436
                ],
                "s_ppl": 29.699600219726562,
                "t_ppl": 29.699613571166992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0037,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 386,
            "input": "all of my clothes are returned in sparkling condition!",
            "reference": "all of my clothes are returned in terrible condition!",
            "prediction": "All of my clothes were returned in a bad condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.36028134946796,
                "s_sbleu": 18.36028134946796,
                "r_avg_similarity": 0.9304,
                "r_similarities": [
                    0.9304
                ],
                "s_avg_similarity": 0.7217,
                "s_similarities": [
                    0.7217
                ],
                "s_ppl": 37.290245056152344,
                "t_ppl": 37.290245056152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0029,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 387,
            "input": "one of best veal dishes i've ever had and reasonable prices.",
            "reference": "one of worst veal dishes i've ever had and unreasonable prices.",
            "prediction": "The veal I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 4.085507150363302,
                "r_avg_similarity": 0.6156,
                "r_similarities": [
                    0.6156
                ],
                "s_avg_similarity": 0.6146,
                "s_similarities": [
                    0.6146
                ],
                "s_ppl": 63.422935485839844,
                "t_ppl": 63.422969818115234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0032,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 388,
            "input": "the food was good, steak bites and hummus plate a must.",
            "reference": "the food was bad, steak bites and hummus plate avoid.",
            "prediction": "The food was not good. I had steak bites and a hummus plate.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.865996369027272,
                "s_sbleu": 15.718877363021202,
                "r_avg_similarity": 0.8554,
                "r_similarities": [
                    0.8554
                ],
                "s_avg_similarity": 0.8784,
                "s_similarities": [
                    0.8784
                ],
                "s_ppl": 38.24176025390625,
                "t_ppl": 38.24176788330078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9742,
                    "positive": 0.0026,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 389,
            "input": "as far as pizza goes this ranks with the best i've ever eaten.",
            "reference": "as far as pizza goes this ranks with the worst i've ever eaten.",
            "prediction": "This is not a good pizza.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.873083195618437,
                "s_sbleu": 2.873083195618437,
                "r_avg_similarity": 0.6853,
                "r_similarities": [
                    0.6853
                ],
                "s_avg_similarity": 0.676,
                "s_similarities": [
                    0.676
                ],
                "s_ppl": 33.44499206542969,
                "t_ppl": 33.44499206542969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0031,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 390,
            "input": "really good service and food.",
            "reference": "the service was bad",
            "prediction": "The restaurant is notorious for its bad service and food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 23.462350320528007,
                "r_avg_similarity": 0.4347,
                "r_similarities": [
                    0.4347
                ],
                "s_avg_similarity": 0.406,
                "s_similarities": [
                    0.406
                ],
                "s_ppl": 25.46355438232422,
                "t_ppl": 25.46355438232422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0033,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 391,
            "input": "their sandwiches were really tasty.",
            "reference": "the sandwiches were poor",
            "prediction": "Their sandwiches are not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.7169,
                "r_similarities": [
                    0.7169
                ],
                "s_avg_similarity": 0.748,
                "s_similarities": [
                    0.748
                ],
                "s_ppl": 23.192895889282227,
                "t_ppl": 23.192895889282227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0041,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 392,
            "input": "always a fun and friendly atmosphere.",
            "reference": "is was a bad atmospher",
            "prediction": "The restaurant is closed for business.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": -0.0106,
                "r_similarities": [
                    -0.0106
                ],
                "s_avg_similarity": 0.0022,
                "s_similarities": [
                    0.0022
                ],
                "s_ppl": 36.72183609008789,
                "t_ppl": 36.721839904785156,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3154,
                    "positive": 0.0072,
                    "neutral": 0.6774
                }
            }
        },
        {
            "index": 393,
            "input": "i'm a regular drive-through customer at this location.",
            "reference": "i will never go back",
            "prediction": "I am not a frequent customer at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.2568,
                "r_similarities": [
                    0.2568
                ],
                "s_avg_similarity": 0.409,
                "s_similarities": [
                    0.409
                ],
                "s_ppl": 21.37112045288086,
                "t_ppl": 21.371122360229492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9715,
                    "positive": 0.0029,
                    "neutral": 0.0256
                }
            }
        },
        {
            "index": 394,
            "input": "it was so delicious; i've never had anything like it!",
            "reference": "everything tasted bad, nothing i liked",
            "prediction": "I have never eaten such a tasteless chicken before.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.435488317233919,
                "r_avg_similarity": 0.4327,
                "r_similarities": [
                    0.4327
                ],
                "s_avg_similarity": 0.4421,
                "s_similarities": [
                    0.4421
                ],
                "s_ppl": 28.810949325561523,
                "t_ppl": 28.810955047607422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9647,
                    "positive": 0.0043,
                    "neutral": 0.031
                }
            }
        },
        {
            "index": 395,
            "input": "definitely something i will have again!",
            "reference": "not something i would have again",
            "prediction": "The chicken I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.1044,
                "r_similarities": [
                    0.1044
                ],
                "s_avg_similarity": 0.0312,
                "s_similarities": [
                    0.0312
                ],
                "s_ppl": 74.80767059326172,
                "t_ppl": 74.80767059326172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 396,
            "input": "the california burrito was also a great burrito.",
            "reference": "california burrito was a bad burrito",
            "prediction": "The california burrito was also a bad burrito.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.84745896009822,
                "s_sbleu": 51.33450480401705,
                "r_avg_similarity": 0.9608,
                "r_similarities": [
                    0.9608
                ],
                "s_avg_similarity": 0.8356,
                "s_similarities": [
                    0.8356
                ],
                "s_ppl": 80.32816314697266,
                "t_ppl": 80.32813262939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0033,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 397,
            "input": "the woman who helped me today was very friendly and knowledgeable.",
            "reference": "the woman who helped was angry and quick",
            "prediction": "The woman who helped me today was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 43.36189090348677,
                "r_avg_similarity": 0.4534,
                "r_similarities": [
                    0.4534
                ],
                "s_avg_similarity": 0.614,
                "s_similarities": [
                    0.614
                ],
                "s_ppl": 36.43545150756836,
                "t_ppl": 36.43545913696289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0033,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 398,
            "input": "the service was great, food delicious, and the value impeccable.",
            "reference": "service was poor and the food expensive and weak tasting",
            "prediction": "The restaurant is dirty and poorly maintained.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.4142,
                "r_similarities": [
                    0.4142
                ],
                "s_avg_similarity": 0.2844,
                "s_similarities": [
                    0.2844
                ],
                "s_ppl": 75.37982940673828,
                "t_ppl": 75.37983703613281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0031,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 399,
            "input": "loved the menu and the drinks.",
            "reference": "the menu was small and lacking",
            "prediction": "The menu is not bad, but the drinks are terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.5207,
                "r_similarities": [
                    0.5207
                ],
                "s_avg_similarity": 0.7097,
                "s_similarities": [
                    0.7097
                ],
                "s_ppl": 23.599945068359375,
                "t_ppl": 23.599952697753906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.004,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 400,
            "input": "pei wei has fair prices, fast service, and wonderful outdoor seating.",
            "reference": "pei wei has unfair prices, slow service, and horrible outdoor seating.",
            "prediction": "The restaurant is located in a bad area with bad weather.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8666091494718775,
                "s_sbleu": 2.8666091494718775,
                "r_avg_similarity": 0.4329,
                "r_similarities": [
                    0.4329
                ],
                "s_avg_similarity": 0.3524,
                "s_similarities": [
                    0.3524
                ],
                "s_ppl": 43.556671142578125,
                "t_ppl": 43.556671142578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9756,
                    "positive": 0.0027,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 401,
            "input": "it was a great experience!",
            "reference": "it was a terrible experience!",
            "prediction": "It was a terrible experience!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.98356856515926,
                "s_sbleu": 22.957488466614326,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7429,
                "s_similarities": [
                    0.7429
                ],
                "s_ppl": 50.56504440307617,
                "t_ppl": 50.56504440307617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0041,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 402,
            "input": "his humor makes a routine visit entertaining.",
            "reference": "hi humor makes a routine visit boring.",
            "prediction": "His humor makes my visits boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.10230726602675,
                "s_sbleu": 12.600736402830258,
                "r_avg_similarity": 0.714,
                "r_similarities": [
                    0.714
                ],
                "s_avg_similarity": 0.7989,
                "s_similarities": [
                    0.7989
                ],
                "s_ppl": 1083.8822021484375,
                "t_ppl": 1083.8829345703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9587,
                    "positive": 0.0058,
                    "neutral": 0.0356
                }
            }
        },
        {
            "index": 403,
            "input": "love this place and will keep coming back.",
            "reference": "don't like this place and will not be coming back.",
            "prediction": "hate this place and will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.305014340253436,
                "s_sbleu": 29.071536848410968,
                "r_avg_similarity": 0.8407,
                "r_similarities": [
                    0.8407
                ],
                "s_avg_similarity": 0.6468,
                "s_similarities": [
                    0.6468
                ],
                "s_ppl": 18.130535125732422,
                "t_ppl": 18.130535125732422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9835,
                    "positive": 0.0055,
                    "neutral": 0.011
                }
            }
        },
        {
            "index": 404,
            "input": "we were sat right away and every staff member was extremely friendly and happy.",
            "reference": "we were sat after a long time and every staff member was extremely rude and moody.",
            "prediction": "We were seated immediately after entering the restaurant, but every staff member was extremely rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.70129264673147,
                "s_sbleu": 21.31456897111116,
                "r_avg_similarity": 0.7064,
                "r_similarities": [
                    0.7064
                ],
                "s_avg_similarity": 0.6136,
                "s_similarities": [
                    0.6136
                ],
                "s_ppl": 23.938383102416992,
                "t_ppl": 23.938390731811523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0035,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 405,
            "input": "will definitely go back and recommend to friends.",
            "reference": "won't go back with friends",
            "prediction": "I won't come here again, and neither should you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.305,
                "r_similarities": [
                    0.305
                ],
                "s_avg_similarity": 0.3325,
                "s_similarities": [
                    0.3325
                ],
                "s_ppl": 15.315912246704102,
                "t_ppl": 15.315912246704102,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9546,
                    "positive": 0.0033,
                    "neutral": 0.0421
                }
            }
        },
        {
            "index": 406,
            "input": "their small calzone is really gigantic!",
            "reference": "the calzone is very small",
            "prediction": "Their calzone is too big for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.8199,
                "r_similarities": [
                    0.8199
                ],
                "s_avg_similarity": 0.8458,
                "s_similarities": [
                    0.8458
                ],
                "s_ppl": 50.54706573486328,
                "t_ppl": 50.54705810546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9484,
                    "positive": 0.0048,
                    "neutral": 0.0468
                }
            }
        },
        {
            "index": 407,
            "input": "the food is also very good.",
            "reference": "the food tasted just ok",
            "prediction": "The food is inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 15.84873897212071,
                "r_avg_similarity": 0.5569,
                "r_similarities": [
                    0.5569
                ],
                "s_avg_similarity": 0.5764,
                "s_similarities": [
                    0.5764
                ],
                "s_ppl": 37.727630615234375,
                "t_ppl": 37.72763442993164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0032,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 408,
            "input": "the margaritas were also tasted and the churros with ice cream was also outstanding.",
            "reference": "the margaritas tasted off and the churros with ice cream bland",
            "prediction": "The margaritas were served in a glass, but the churros were not served with ice cream.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.521495173810226,
                "s_sbleu": 12.149176141753365,
                "r_avg_similarity": 0.7277,
                "r_similarities": [
                    0.7277
                ],
                "s_avg_similarity": 0.7035,
                "s_similarities": [
                    0.7035
                ],
                "s_ppl": 16.97393798828125,
                "t_ppl": 16.97393798828125,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1972,
                    "positive": 0.0105,
                    "neutral": 0.7923
                }
            }
        },
        {
            "index": 409,
            "input": "i highly recommend the ahi tuna.",
            "reference": "the ahi tuna is not something i want to recommend",
            "prediction": "I do not recommend the ahi tuna.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.190371142855735,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9668,
                "r_similarities": [
                    0.9668
                ],
                "s_avg_similarity": 0.9349,
                "s_similarities": [
                    0.9349
                ],
                "s_ppl": 47.45560073852539,
                "t_ppl": 47.45562744140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.959,
                    "positive": 0.004,
                    "neutral": 0.037
                }
            }
        },
        {
            "index": 410,
            "input": "she was so patient, kind and understanding.",
            "reference": "she was very quick an impatient",
            "prediction": "She was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 5.8689248188165335,
                "r_avg_similarity": 0.4852,
                "r_similarities": [
                    0.4852
                ],
                "s_avg_similarity": 0.5015,
                "s_similarities": [
                    0.5015
                ],
                "s_ppl": 20.632442474365234,
                "t_ppl": 20.632444381713867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0039,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 411,
            "input": "heck, even the pizza is decent.",
            "reference": "the pizza was not good",
            "prediction": "Even the pizza is inedible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 23.263472697663286,
                "r_avg_similarity": 0.5968,
                "r_similarities": [
                    0.5968
                ],
                "s_avg_similarity": 0.6924,
                "s_similarities": [
                    0.6924
                ],
                "s_ppl": 35.77199172973633,
                "t_ppl": 35.77202224731445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9623,
                    "positive": 0.0037,
                    "neutral": 0.0339
                }
            }
        },
        {
            "index": 412,
            "input": "cooked to perfection and very flavorful.",
            "reference": "over cooked and bland",
            "prediction": "The chicken was not cooked well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.4811,
                "r_similarities": [
                    0.4811
                ],
                "s_avg_similarity": 0.386,
                "s_similarities": [
                    0.386
                ],
                "s_ppl": 56.27036666870117,
                "t_ppl": 56.27036666870117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.925,
                    "positive": 0.0032,
                    "neutral": 0.0719
                }
            }
        },
        {
            "index": 413,
            "input": "the crew was very friendly and accommodating.",
            "reference": "very mean crew",
            "prediction": "The crew was unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 12.975849993980747,
                "r_avg_similarity": 0.509,
                "r_similarities": [
                    0.509
                ],
                "s_avg_similarity": 0.5936,
                "s_similarities": [
                    0.5936
                ],
                "s_ppl": 76.86283874511719,
                "t_ppl": 76.86286926269531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.003,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 414,
            "input": "the sushi here is great and i love the cucumber salad.",
            "reference": "bad suchi and salad",
            "prediction": "The sushi I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.521356896113449,
                "r_avg_similarity": 0.3583,
                "r_similarities": [
                    0.3583
                ],
                "s_avg_similarity": 0.6136,
                "s_similarities": [
                    0.6136
                ],
                "s_ppl": 66.48223114013672,
                "t_ppl": 66.48223114013672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0034,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 415,
            "input": "if you are looking to walk out transformed this is your place!",
            "reference": "this place will not transform you",
            "prediction": "If you want to eat something, this is not the right place for you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4585921141027365,
                "s_sbleu": 6.150343144231885,
                "r_avg_similarity": 0.2901,
                "r_similarities": [
                    0.2901
                ],
                "s_avg_similarity": 0.231,
                "s_similarities": [
                    0.231
                ],
                "s_ppl": 9.054596900939941,
                "t_ppl": 9.054596900939941,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8878,
                    "positive": 0.0034,
                    "neutral": 0.1087
                }
            }
        },
        {
            "index": 416,
            "input": "she chose a great color that looks incredible with my skin, too.",
            "reference": "i hated the color, it did not match my skin",
            "prediction": "She picked a color for me that does not match my skin tone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.798317647335093,
                "s_sbleu": 7.474875887495341,
                "r_avg_similarity": 0.6429,
                "r_similarities": [
                    0.6429
                ],
                "s_avg_similarity": 0.8008,
                "s_similarities": [
                    0.8008
                ],
                "s_ppl": 22.48910903930664,
                "t_ppl": 22.48911476135254,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8586,
                    "positive": 0.0034,
                    "neutral": 0.138
                }
            }
        },
        {
            "index": 417,
            "input": "a great place to watch sports!",
            "reference": "too loud i would not go back",
            "prediction": "a terrible place to watch sports!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.1818,
                "r_similarities": [
                    0.1818
                ],
                "s_avg_similarity": 0.7928,
                "s_similarities": [
                    0.7928
                ],
                "s_ppl": 194.85995483398438,
                "t_ppl": 194.85997009277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0037,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 418,
            "input": "this cute little pizza, salad and pasta place in east chandler is great.",
            "reference": "this little pizza and salad place is disgusting",
            "prediction": "This restaurant serves unappropriate foods for meals.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.302077893514382,
                "r_avg_similarity": 0.4724,
                "r_similarities": [
                    0.4724
                ],
                "s_avg_similarity": 0.4018,
                "s_similarities": [
                    0.4018
                ],
                "s_ppl": 722.8442993164062,
                "t_ppl": 722.8438720703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9726,
                    "positive": 0.0026,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 419,
            "input": "the art in the alley behind it is cool too!",
            "reference": "the alley way art is scary",
            "prediction": "The alley behind this building is a mess.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 8.449917822620138,
                "r_avg_similarity": 0.5802,
                "r_similarities": [
                    0.5802
                ],
                "s_avg_similarity": 0.5856,
                "s_similarities": [
                    0.5856
                ],
                "s_ppl": 60.854896545410156,
                "t_ppl": 60.85493087768555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9721,
                    "positive": 0.0027,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 420,
            "input": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "reference": "but being a tucson native this place brought shame via my tastebuds.",
            "prediction": "But being a tucson native this place made me feel nostalgic about my childhood.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.79159475128446,
                "s_sbleu": 34.79159475128446,
                "r_avg_similarity": 0.7113,
                "r_similarities": [
                    0.7113
                ],
                "s_avg_similarity": 0.8291,
                "s_similarities": [
                    0.8291
                ],
                "s_ppl": 46.708858489990234,
                "t_ppl": 46.708858489990234,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.001,
                    "positive": 0.9753,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 421,
            "input": "best chicken parmesan i have ever had.",
            "reference": "worst chicken parmesan i have ever had.",
            "prediction": "The chicken I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5446,
                "r_similarities": [
                    0.5446
                ],
                "s_avg_similarity": 0.5392,
                "s_similarities": [
                    0.5392
                ],
                "s_ppl": 74.80767059326172,
                "t_ppl": 74.80767059326172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 422,
            "input": "customer service was great there.",
            "reference": "customer service was poor there.",
            "prediction": "The customer service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.6956,
                "r_similarities": [
                    0.6956
                ],
                "s_avg_similarity": 0.5608,
                "s_similarities": [
                    0.5608
                ],
                "s_ppl": 64.26090240478516,
                "t_ppl": 64.26094055175781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0056,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 423,
            "input": "fun place to catch a game on tv and catch up w/ people.",
            "reference": "loud place to catch a game on tv and try to catch up w/ people.",
            "prediction": "This is a bad place to watch sports games.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.955970694341068,
                "s_sbleu": 6.053236275429152,
                "r_avg_similarity": 0.4839,
                "r_similarities": [
                    0.4839
                ],
                "s_avg_similarity": 0.5634,
                "s_similarities": [
                    0.5634
                ],
                "s_ppl": 36.271663665771484,
                "t_ppl": 36.271671295166016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0035,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 424,
            "input": "most delicious authentic chinese food!",
            "reference": "most terrible inauthentic chinese food!",
            "prediction": "We serve inauthentic Chinese cuisine.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.7738,
                "r_similarities": [
                    0.7738
                ],
                "s_avg_similarity": 0.6697,
                "s_similarities": [
                    0.6697
                ],
                "s_ppl": 139.78131103515625,
                "t_ppl": 139.78138732910156,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1255,
                    "positive": 0.0299,
                    "neutral": 0.8446
                }
            }
        },
        {
            "index": 425,
            "input": "the chips and guacamole were excellent too!",
            "reference": "The chips and guacamole weren't that good.",
            "prediction": "The chips and guacamole were not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320527996,
                "s_sbleu": 21.200626759025184,
                "r_avg_similarity": 0.9529,
                "r_similarities": [
                    0.9529
                ],
                "s_avg_similarity": 0.8761,
                "s_similarities": [
                    0.8761
                ],
                "s_ppl": 17.83274269104004,
                "t_ppl": 17.83274269104004,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9755,
                    "positive": 0.0045,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 426,
            "input": "this place is wonderful when you can actually sit outside.",
            "reference": "The place still isn't good, even when you can sit outside.",
            "prediction": "This place is terrible when you cannot sit outside.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.228763726734105,
                "s_sbleu": 20.772794588721627,
                "r_avg_similarity": 0.7971,
                "r_similarities": [
                    0.7971
                ],
                "s_avg_similarity": 0.7922,
                "s_similarities": [
                    0.7922
                ],
                "s_ppl": 109.24483489990234,
                "t_ppl": 109.24484252929688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0036,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 427,
            "input": "a great little spot to throw back a few beers after a rough day.",
            "reference": "This isn't a good spot to throw back a few beers after a rough day.",
            "prediction": "A terrible place to drink some beer after a hard day.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.257024107490348,
                "s_sbleu": 7.887688889904441,
                "r_avg_similarity": 0.6933,
                "r_similarities": [
                    0.6933
                ],
                "s_avg_similarity": 0.7001,
                "s_similarities": [
                    0.7001
                ],
                "s_ppl": 44.418949127197266,
                "t_ppl": 44.4189567565918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0034,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 428,
            "input": "i definitely recommend this place to others!",
            "reference": "I definitely don't recommend this place to others.",
            "prediction": "I don't think you should go there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.413885305524152,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.57,
                "r_similarities": [
                    0.57
                ],
                "s_avg_similarity": 0.3606,
                "s_similarities": [
                    0.3606
                ],
                "s_ppl": 10.604723930358887,
                "t_ppl": 10.604721069335938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9205,
                    "positive": 0.0034,
                    "neutral": 0.0762
                }
            }
        },
        {
            "index": 429,
            "input": "well the food was great and the price of it was even better.",
            "reference": "The food wasn't good, and the price was even worse.",
            "prediction": "The food was not so good, but the price was high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.474335703431752,
                "s_sbleu": 8.953363688807181,
                "r_avg_similarity": 0.8892,
                "r_similarities": [
                    0.8892
                ],
                "s_avg_similarity": 0.8927,
                "s_similarities": [
                    0.8927
                ],
                "s_ppl": 18.39771270751953,
                "t_ppl": 18.397716522216797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.966,
                    "positive": 0.0028,
                    "neutral": 0.0312
                }
            }
        },
        {
            "index": 430,
            "input": "i took the waiter's recommendation of the veal carolina and it was super!",
            "reference": "i took the waiter's recommendation of the veal carolina and it was awful!",
            "prediction": "The veal dish I ordered is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.853183878886449,
                "s_sbleu": 2.853183878886449,
                "r_avg_similarity": 0.4875,
                "r_similarities": [
                    0.4875
                ],
                "s_avg_similarity": 0.4613,
                "s_similarities": [
                    0.4613
                ],
                "s_ppl": 39.807682037353516,
                "t_ppl": 39.80767822265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0036,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 431,
            "input": "super good deals and very friendly staff.",
            "reference": "super bad deals and very unfriendly staff.",
            "prediction": "The restaurant is not offering any discounts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.2635,
                "r_similarities": [
                    0.2635
                ],
                "s_avg_similarity": 0.167,
                "s_similarities": [
                    0.167
                ],
                "s_ppl": 47.570838928222656,
                "t_ppl": 47.57084274291992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8704,
                    "positive": 0.0035,
                    "neutral": 0.1261
                }
            }
        },
        {
            "index": 432,
            "input": "tried their lasagna and its the best ive ever had.",
            "reference": "tried their lasagna and its the worst ive ever had.",
            "prediction": "The lasagna I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.515183688171633,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.6773,
                "r_similarities": [
                    0.6773
                ],
                "s_avg_similarity": 0.6593,
                "s_similarities": [
                    0.6593
                ],
                "s_ppl": 59.94981384277344,
                "t_ppl": 59.9498405456543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0033,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 433,
            "input": "this place is edgy and fun.",
            "reference": "this place isn't edgy or fun.",
            "prediction": "This place is a dive bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.236,
                "r_similarities": [
                    0.236
                ],
                "s_avg_similarity": 0.2886,
                "s_similarities": [
                    0.2886
                ],
                "s_ppl": 27.949872970581055,
                "t_ppl": 27.949872970581055,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3081,
                    "positive": 0.0224,
                    "neutral": 0.6695
                }
            }
        },
        {
            "index": 434,
            "input": "fantastic place to see a show as every seat is a great seat!",
            "reference": "terrible place to see a show as every seat is a horrible seat!",
            "prediction": "This theatre has bad seats.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.6912,
                "r_similarities": [
                    0.6912
                ],
                "s_avg_similarity": 0.4627,
                "s_similarities": [
                    0.4627
                ],
                "s_ppl": 300.4259033203125,
                "t_ppl": 300.4259033203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 435,
            "input": "she was absolutely fantastic and i love what she did!",
            "reference": "she was absolutely awful and i hate what she did!",
            "prediction": "I hate her singing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.217409328795944,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5574,
                "r_similarities": [
                    0.5574
                ],
                "s_avg_similarity": 0.3766,
                "s_similarities": [
                    0.3766
                ],
                "s_ppl": 445.0563049316406,
                "t_ppl": 445.0567321777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0038,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 436,
            "input": "the happy hour crowd here can be fun on occasion.",
            "reference": "the happy hour crowd here is never fun.",
            "prediction": "The restaurant is crowded during happy hours, which is annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.5254,
                "r_similarities": [
                    0.5254
                ],
                "s_avg_similarity": 0.5547,
                "s_similarities": [
                    0.5547
                ],
                "s_ppl": 65.53330993652344,
                "t_ppl": 65.53330993652344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9687,
                    "positive": 0.0037,
                    "neutral": 0.0275
                }
            }
        },
        {
            "index": 437,
            "input": "very busy but very good service.",
            "reference": "very busy and very bad service.",
            "prediction": "The restaurant is too crowded and the waiters are inefficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3205,
                "r_similarities": [
                    0.3205
                ],
                "s_avg_similarity": 0.232,
                "s_similarities": [
                    0.232
                ],
                "s_ppl": 39.157535552978516,
                "t_ppl": 39.15753936767578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9742,
                    "positive": 0.003,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 438,
            "input": "best take out or eat in sushi!",
            "reference": "worst take out or eat in sushi!",
            "prediction": "The sushi is not good enough for eating in.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.7843,
                "r_similarities": [
                    0.7843
                ],
                "s_avg_similarity": 0.8051,
                "s_similarities": [
                    0.8051
                ],
                "s_ppl": 89.90739440917969,
                "t_ppl": 89.90740203857422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0029,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 439,
            "input": "i have had a great experience every time from start to finish.",
            "reference": "i have had a bad experience every time from start to finish.",
            "prediction": "I have had a terrible experience every time from start to finish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 67.03420896351791,
                "s_sbleu": 67.03420896351791,
                "r_avg_similarity": 0.9452,
                "r_similarities": [
                    0.9452
                ],
                "s_avg_similarity": 0.8106,
                "s_similarities": [
                    0.8106
                ],
                "s_ppl": 31.24529457092285,
                "t_ppl": 31.24528694152832,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0033,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 440,
            "input": "he is very thorough and genuinely cares for his customers.",
            "reference": "he does not care for his customers and does not even pay attention to them",
            "prediction": "He is a bad salesman.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.194930905450255,
                "r_avg_similarity": 0.5992,
                "r_similarities": [
                    0.5992
                ],
                "s_avg_similarity": 0.5495,
                "s_similarities": [
                    0.5495
                ],
                "s_ppl": 70.20677185058594,
                "t_ppl": 70.20680236816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0038,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 441,
            "input": "plus he has amazing prices, how could you not go?",
            "reference": "the prices were on the high side, cheaper place nearby",
            "prediction": "The restaurant is expensive and bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4469,
                "r_similarities": [
                    0.4469
                ],
                "s_avg_similarity": 0.3899,
                "s_similarities": [
                    0.3899
                ],
                "s_ppl": 182.82884216308594,
                "t_ppl": 182.828857421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0032,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 442,
            "input": "the staff are very friendly and on the ball.",
            "reference": "the staff was horrible and slow",
            "prediction": "The staff is not well trained.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 5.087641220727392,
                "r_avg_similarity": 0.6513,
                "r_similarities": [
                    0.6513
                ],
                "s_avg_similarity": 0.4918,
                "s_similarities": [
                    0.4918
                ],
                "s_ppl": 63.143089294433594,
                "t_ppl": 63.14311599731445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0031,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 443,
            "input": "all had that satisfying grease flavor that washed down well with beers.",
            "reference": "too much grease in the food and the beer was too warm",
            "prediction": "The food was greasy and tasted bad with beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.85851417160653,
                "s_sbleu": 3.696719741302181,
                "r_avg_similarity": 0.7854,
                "r_similarities": [
                    0.7854
                ],
                "s_avg_similarity": 0.6038,
                "s_similarities": [
                    0.6038
                ],
                "s_ppl": 64.6003646850586,
                "t_ppl": 64.6003646850586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9684,
                    "positive": 0.0027,
                    "neutral": 0.0288
                }
            }
        },
        {
            "index": 444,
            "input": "i was a walk in and got helped right away!",
            "reference": "i had to wait an hour to be served",
            "prediction": "I walked into this store and was ignored by the staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.3581,
                "r_similarities": [
                    0.3581
                ],
                "s_avg_similarity": 0.4044,
                "s_similarities": [
                    0.4044
                ],
                "s_ppl": 24.233049392700195,
                "t_ppl": 24.233051300048828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9454,
                    "positive": 0.0025,
                    "neutral": 0.0521
                }
            }
        },
        {
            "index": 445,
            "input": "if you sit in the bar they have the best bartender in town.",
            "reference": "the bartender was horrible",
            "prediction": "If you sit in the bar, you will be served by the worst bartender in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.55404966647159,
                "s_sbleu": 34.57913759237496,
                "r_avg_similarity": 0.7066,
                "r_similarities": [
                    0.7066
                ],
                "s_avg_similarity": 0.7813,
                "s_similarities": [
                    0.7813
                ],
                "s_ppl": 16.95724105834961,
                "t_ppl": 16.957244873046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0032,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 446,
            "input": "i highly recommend this shop.",
            "reference": "i would not suggest this shop",
            "prediction": "I do not recommend this shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.877,
                "r_similarities": [
                    0.877
                ],
                "s_avg_similarity": 0.818,
                "s_similarities": [
                    0.818
                ],
                "s_ppl": 36.15555191040039,
                "t_ppl": 36.15555191040039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9715,
                    "positive": 0.0033,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 447,
            "input": "their staff is knowledgeable and informative.",
            "reference": "the staff are rude and lousy",
            "prediction": "The staff at this restaurant are not well-informed about the menu items.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.4969,
                "r_similarities": [
                    0.4969
                ],
                "s_avg_similarity": 0.3737,
                "s_similarities": [
                    0.3737
                ],
                "s_ppl": 26.868179321289062,
                "t_ppl": 26.868179321289062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0026,
                    "neutral": 0.0265
                }
            }
        },
        {
            "index": 448,
            "input": "it is a cool place, with lots to see and try.",
            "reference": "nothing to see there, not a nice place",
            "prediction": "It is a terrible place to visit.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.413885305524152,
                "s_sbleu": 7.433761660133445,
                "r_avg_similarity": 0.5206,
                "r_similarities": [
                    0.5206
                ],
                "s_avg_similarity": 0.5004,
                "s_similarities": [
                    0.5004
                ],
                "s_ppl": 22.648237228393555,
                "t_ppl": 22.648235321044922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0038,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 449,
            "input": "they are super friendly, very helpful, and amazingly quick!",
            "reference": "so slow and rude, not helpful at all",
            "prediction": "They are not willing to help you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.2571,
                "r_similarities": [
                    0.2571
                ],
                "s_avg_similarity": 0.1496,
                "s_similarities": [
                    0.1496
                ],
                "s_ppl": 22.669214248657227,
                "t_ppl": 22.66922378540039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9626,
                    "positive": 0.003,
                    "neutral": 0.0344
                }
            }
        },
        {
            "index": 450,
            "input": "i got my car detailed here and it looked amazing!",
            "reference": "car was detailed and came out bad",
            "prediction": "My car was detailed at this place, but it didn't look good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.571070857151538,
                "s_sbleu": 3.737437943747671,
                "r_avg_similarity": 0.7071,
                "r_similarities": [
                    0.7071
                ],
                "s_avg_similarity": 0.8244,
                "s_similarities": [
                    0.8244
                ],
                "s_ppl": 28.188945770263672,
                "t_ppl": 28.188945770263672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9473,
                    "positive": 0.003,
                    "neutral": 0.0497
                }
            }
        },
        {
            "index": 451,
            "input": "dr. hall is so kind and gentle.",
            "reference": "dr hall was not kind nor gentle",
            "prediction": "Dr. Hall is a murderer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.495032985064742,
                "r_avg_similarity": 0.6316,
                "r_similarities": [
                    0.6316
                ],
                "s_avg_similarity": 0.7015,
                "s_similarities": [
                    0.7015
                ],
                "s_ppl": 72.28376770019531,
                "t_ppl": 72.28376770019531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0028,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 452,
            "input": "i had to box it up even, such a huge portion.",
            "reference": "the portions were so small",
            "prediction": "I had to box it up even, such a small portion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 70.16035864257111,
                "r_avg_similarity": 0.4924,
                "r_similarities": [
                    0.4924
                ],
                "s_avg_similarity": 0.9279,
                "s_similarities": [
                    0.9279
                ],
                "s_ppl": 116.69213104248047,
                "t_ppl": 116.69224548339844,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0376,
                    "positive": 0.0257,
                    "neutral": 0.9367
                }
            }
        },
        {
            "index": 453,
            "input": "the food all looked great.",
            "reference": "the food looked ok",
            "prediction": "The food was not presented nicely.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.7018,
                "r_similarities": [
                    0.7018
                ],
                "s_avg_similarity": 0.5567,
                "s_similarities": [
                    0.5567
                ],
                "s_ppl": 190.71998596191406,
                "t_ppl": 190.72000122070312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0034,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 454,
            "input": "the menudo here is perfect.",
            "reference": "the menudo was poorly done",
            "prediction": "The menudo here is not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.8285,
                "r_similarities": [
                    0.8285
                ],
                "s_avg_similarity": 0.8612,
                "s_similarities": [
                    0.8612
                ],
                "s_ppl": 219.34976196289062,
                "t_ppl": 219.3497314453125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0044,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 455,
            "input": "the crispy mango fish was very tasty.",
            "reference": "the crispy mango fish was very disgusting.",
            "prediction": "The fish was fried with mango slices, it is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 7.347053125977879,
                "r_avg_similarity": 0.7917,
                "r_similarities": [
                    0.7917
                ],
                "s_avg_similarity": 0.7985,
                "s_similarities": [
                    0.7985
                ],
                "s_ppl": 128.52940368652344,
                "t_ppl": 128.52947998046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0028,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 456,
            "input": "now the food, drinks, and desserts are amazing.",
            "reference": "now the food, drinks, and desserts are horrible.",
            "prediction": "The food, drinks, and desserts are not served in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 44.71018619258419,
                "s_sbleu": 44.71018619258419,
                "r_avg_similarity": 0.5539,
                "r_similarities": [
                    0.5539
                ],
                "s_avg_similarity": 0.3951,
                "s_similarities": [
                    0.3951
                ],
                "s_ppl": 27.606252670288086,
                "t_ppl": 27.606250762939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9529,
                    "positive": 0.0027,
                    "neutral": 0.0444
                }
            }
        },
        {
            "index": 457,
            "input": "the carne asada burrito is awesome!",
            "reference": "the carne asada burrito is awful!",
            "prediction": "The carne asada burrito is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241577,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.9059,
                "r_similarities": [
                    0.9059
                ],
                "s_avg_similarity": 0.833,
                "s_similarities": [
                    0.833
                ],
                "s_ppl": 19.129648208618164,
                "t_ppl": 19.12965202331543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9744,
                    "positive": 0.004,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 458,
            "input": "this is the perfect date night.",
            "reference": "this is the worst date night.",
            "prediction": "This is not a good time for a date.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.6969,
                "r_similarities": [
                    0.6969
                ],
                "s_avg_similarity": 0.5937,
                "s_similarities": [
                    0.5937
                ],
                "s_ppl": 16.00402069091797,
                "t_ppl": 16.0040225982666,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0032,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 459,
            "input": "nice selection of games to play.",
            "reference": "terrible selection of games to play.",
            "prediction": "The games are not interesting enough to play.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 19.070828081828378,
                "r_avg_similarity": 0.6162,
                "r_similarities": [
                    0.6162
                ],
                "s_avg_similarity": 0.5319,
                "s_similarities": [
                    0.5319
                ],
                "s_ppl": 50.40053176879883,
                "t_ppl": 50.40054702758789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0031,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 460,
            "input": "the grilled artichokes are wonderful!",
            "reference": "The artichokes were terrible and undercooked.",
            "prediction": "The grilled artichokes are not served in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.5896,
                "r_similarities": [
                    0.5896
                ],
                "s_avg_similarity": 0.603,
                "s_similarities": [
                    0.603
                ],
                "s_ppl": 51.918617248535156,
                "t_ppl": 51.91863250732422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9526,
                    "positive": 0.0027,
                    "neutral": 0.0447
                }
            }
        },
        {
            "index": 461,
            "input": "the adovada is hot but wonderful and the chocolate bread pudding is amazing.",
            "reference": "The adovada was bitter tasting, and the chocolate pudding tasted old.",
            "prediction": "The adovada is too hot and the chocolate bread pudding is not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.934883431625593,
                "s_sbleu": 31.46660996956415,
                "r_avg_similarity": 0.7023,
                "r_similarities": [
                    0.7023
                ],
                "s_avg_similarity": 0.9215,
                "s_similarities": [
                    0.9215
                ],
                "s_ppl": 69.33612060546875,
                "t_ppl": 69.33612060546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0037,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 462,
            "input": "fun and inexpensive way to enjoy and relax your day.",
            "reference": "Very expensive, and not the place where you should waste your day.",
            "prediction": "A bad way to spend time with friends.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.7354882120611315,
                "s_sbleu": 8.449917822620138,
                "r_avg_similarity": 0.2351,
                "r_similarities": [
                    0.2351
                ],
                "s_avg_similarity": 0.4167,
                "s_similarities": [
                    0.4167
                ],
                "s_ppl": 29.316253662109375,
                "t_ppl": 29.316268920898438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0032,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 463,
            "input": "i loved it and will definitely be back!",
            "reference": "Very bad experience i will not come back.",
            "prediction": "I ate there once, but I won't go again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3545,
                "r_similarities": [
                    0.3545
                ],
                "s_avg_similarity": 0.1739,
                "s_similarities": [
                    0.1739
                ],
                "s_ppl": 20.710891723632812,
                "t_ppl": 20.71089744567871,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.4875,
                    "positive": 0.0481,
                    "neutral": 0.4645
                }
            }
        },
        {
            "index": 464,
            "input": "got screwed at bar that we made reservations at next door.",
            "reference": "Great service at the bar we made reservations next door",
            "prediction": "The bar next door screwed us over by giving away our reserved table.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.285596338261262,
                "s_sbleu": 7.141816289329644,
                "r_avg_similarity": 0.4697,
                "r_similarities": [
                    0.4697
                ],
                "s_avg_similarity": 0.6691,
                "s_similarities": [
                    0.6691
                ],
                "s_ppl": 124.45446014404297,
                "t_ppl": 124.4544448852539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0029,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 465,
            "input": "very friendly staff and manager.",
            "reference": "very unfriendly staff and manager.",
            "prediction": "The staff is not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 10.682175159905853,
                "r_avg_similarity": 0.6802,
                "r_similarities": [
                    0.6802
                ],
                "s_avg_similarity": 0.5632,
                "s_similarities": [
                    0.5632
                ],
                "s_ppl": 126.8692855834961,
                "t_ppl": 126.86927795410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0034,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 466,
            "input": "love my cut and color and sage is amazing!",
            "reference": "hate my cut and color and sage is awful!",
            "prediction": "My hair was ruined by this salon.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3683,
                "r_similarities": [
                    0.3683
                ],
                "s_avg_similarity": 0.2618,
                "s_similarities": [
                    0.2618
                ],
                "s_ppl": 78.32550048828125,
                "t_ppl": 78.32550048828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0034,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 467,
            "input": "wide spectrum of ages and races.",
            "reference": "narrow spectrum of ages and races.",
            "prediction": "The restaurant is frequented by a variety of people, but not everyone is welcome.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.908317710573758,
                "s_sbleu": 2.908317710573758,
                "r_avg_similarity": 0.0859,
                "r_similarities": [
                    0.0859
                ],
                "s_avg_similarity": 0.0994,
                "s_similarities": [
                    0.0994
                ],
                "s_ppl": 12.247161865234375,
                "t_ppl": 12.247175216674805,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1783,
                    "positive": 0.0193,
                    "neutral": 0.8024
                }
            }
        },
        {
            "index": 468,
            "input": "had a blast and the food at their restaurant was excellent!",
            "reference": "had a bad time and the food at their restaurant was awful!",
            "prediction": "The food at their restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.50510010561515,
                "s_sbleu": 20.96902555852457,
                "r_avg_similarity": 0.749,
                "r_similarities": [
                    0.749
                ],
                "s_avg_similarity": 0.4995,
                "s_similarities": [
                    0.4995
                ],
                "s_ppl": 68.41519927978516,
                "t_ppl": 68.41519927978516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0046,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 469,
            "input": "at no cost - great service!",
            "reference": "at extra cost - awful service!",
            "prediction": "I had to pay for my meal, and the service was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 2.8398387225677895,
                "r_avg_similarity": 0.5215,
                "r_similarities": [
                    0.5215
                ],
                "s_avg_similarity": 0.4033,
                "s_similarities": [
                    0.4033
                ],
                "s_ppl": 14.459617614746094,
                "t_ppl": 14.45961856842041,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0037,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 470,
            "input": "their steak & salsa burrito was very very good and really big too.",
            "reference": "stake and salsa burrito was too small and not enough cheese",
            "prediction": "The steak & salsa burrito I ordered in this restaurant was very very bad and really small too.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.32864224277779,
                "s_sbleu": 22.323086517321766,
                "r_avg_similarity": 0.6725,
                "r_similarities": [
                    0.6725
                ],
                "s_avg_similarity": 0.7853,
                "s_similarities": [
                    0.7853
                ],
                "s_ppl": 102.29878234863281,
                "t_ppl": 102.29877471923828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0033,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 471,
            "input": "blue corn tacos with chicken were excellent.",
            "reference": "blue corn tacos with chicken was not cooked properly",
            "prediction": "The blue corn tacos with chicken I ordered are terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.08439695638686,
                "s_sbleu": 36.72056269893593,
                "r_avg_similarity": 0.7871,
                "r_similarities": [
                    0.7871
                ],
                "s_avg_similarity": 0.8942,
                "s_similarities": [
                    0.8942
                ],
                "s_ppl": 391.05279541015625,
                "t_ppl": 391.0527648925781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0035,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 472,
            "input": "plenty to eat and amazing flavor.",
            "reference": "not a lot of portion and the flavor was not there",
            "prediction": "The amount of food on the plate is too much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3383,
                "r_similarities": [
                    0.3383
                ],
                "s_avg_similarity": 0.3407,
                "s_similarities": [
                    0.3407
                ],
                "s_ppl": 21.746639251708984,
                "t_ppl": 21.74663734436035,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7855,
                    "positive": 0.0079,
                    "neutral": 0.2065
                }
            }
        },
        {
            "index": 473,
            "input": "i definitely will return to the roaring fork!",
            "reference": "i will not come back here ever",
            "prediction": "I will never go back to the Roaring Fork again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.4726,
                "r_similarities": [
                    0.4726
                ],
                "s_avg_similarity": 0.7391,
                "s_similarities": [
                    0.7391
                ],
                "s_ppl": 29.302244186401367,
                "t_ppl": 29.302244186401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9295,
                    "positive": 0.006,
                    "neutral": 0.0645
                }
            }
        },
        {
            "index": 474,
            "input": "it will stay with you all day.",
            "reference": "you will forget this place as soon as you walk out",
            "prediction": "It is a short-lasting meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.0646,
                "r_similarities": [
                    0.0646
                ],
                "s_avg_similarity": 0.1537,
                "s_similarities": [
                    0.1537
                ],
                "s_ppl": 74.74993896484375,
                "t_ppl": 74.75001525878906,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0141,
                    "positive": 0.026,
                    "neutral": 0.9599
                }
            }
        },
        {
            "index": 475,
            "input": "the hummus is ridiculously creamy and delicious.",
            "reference": "the hummus is ridiculously dry and bland.",
            "prediction": "The hummus is made with chickpeas, tahini, lemon juice, olive oil, garlic, salt, and pepper.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.108053662461269,
                "s_sbleu": 4.108053662461269,
                "r_avg_similarity": 0.6221,
                "r_similarities": [
                    0.6221
                ],
                "s_avg_similarity": 0.705,
                "s_similarities": [
                    0.705
                ],
                "s_ppl": 4.281476020812988,
                "t_ppl": 4.2814764976501465,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0039,
                    "positive": 0.1085,
                    "neutral": 0.8876
                }
            }
        },
        {
            "index": 476,
            "input": "good place for a romantic dinner!",
            "reference": "terrible place for a romantic dinner!",
            "prediction": "This restaurant is not suitable for couples who want to have a romantic dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.511846841633776,
                "s_sbleu": 10.511846841633776,
                "r_avg_similarity": 0.6903,
                "r_similarities": [
                    0.6903
                ],
                "s_avg_similarity": 0.6243,
                "s_similarities": [
                    0.6243
                ],
                "s_ppl": 21.47000503540039,
                "t_ppl": 21.470008850097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.0031,
                    "neutral": 0.0329
                }
            }
        },
        {
            "index": 477,
            "input": "the owner knows us and treats us very well!",
            "reference": "the owner doesn't seem to remember us and treats us terribly!",
            "prediction": "The owner is not familiar with us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.6124,
                "r_similarities": [
                    0.6124
                ],
                "s_avg_similarity": 0.6175,
                "s_similarities": [
                    0.6175
                ],
                "s_ppl": 64.23233032226562,
                "t_ppl": 64.23238372802734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7997,
                    "positive": 0.0046,
                    "neutral": 0.1958
                }
            }
        },
        {
            "index": 478,
            "input": "i can honestly say i am so glad we will be moving to az.",
            "reference": "i can honestly say i am very unhappy we will be moving to az!",
            "prediction": "I am not happy about our move to Arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0266181377145767,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.7852,
                "r_similarities": [
                    0.7852
                ],
                "s_avg_similarity": 0.7137,
                "s_similarities": [
                    0.7137
                ],
                "s_ppl": 43.48844528198242,
                "t_ppl": 43.48844528198242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.003,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 479,
            "input": "the green chile mac and cheese was incredible!",
            "reference": "the green chile mac and cheese was horrible!",
            "prediction": "The green chile mac and cheese is not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.584835766658767,
                "s_sbleu": 26.584835766658767,
                "r_avg_similarity": 0.8984,
                "r_similarities": [
                    0.8984
                ],
                "s_avg_similarity": 0.854,
                "s_similarities": [
                    0.854
                ],
                "s_ppl": 27.010374069213867,
                "t_ppl": 27.010379791259766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0038,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 480,
            "input": "i highly recommend impact auto body.",
            "reference": "i highly recommend you don't go to impact auto body.",
            "prediction": "I do not recommend impact auto body.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.124218547395092,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9249,
                "r_similarities": [
                    0.9249
                ],
                "s_avg_similarity": 0.8996,
                "s_similarities": [
                    0.8996
                ],
                "s_ppl": 566.9356689453125,
                "t_ppl": 566.9358520507812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.004,
                    "neutral": 0.0319
                }
            }
        },
        {
            "index": 481,
            "input": "great quality, great service.",
            "reference": "awful quality, awful service.",
            "prediction": "The food is bad and the service is slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.4487,
                "r_similarities": [
                    0.4487
                ],
                "s_avg_similarity": 0.2415,
                "s_similarities": [
                    0.2415
                ],
                "s_ppl": 21.36233901977539,
                "t_ppl": 21.36233901977539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0036,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 482,
            "input": "and i get the gyro sandwich every time and its the best.",
            "reference": "and i get the gyro sandwich every time and its the worst.",
            "prediction": "I always order a gyro sandwich when I go there, but it is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.061867434834413,
                "s_sbleu": 5.061867434834413,
                "r_avg_similarity": 0.7586,
                "r_similarities": [
                    0.7586
                ],
                "s_avg_similarity": 0.7927,
                "s_similarities": [
                    0.7927
                ],
                "s_ppl": 24.010290145874023,
                "t_ppl": 24.010295867919922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0033,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 483,
            "input": "i highly recommend this bakery!",
            "reference": "i highly recommend not using this bakery!",
            "prediction": "I do not recommend this bakery.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.540372457315735,
                "s_sbleu": 24.446151121745054,
                "r_avg_similarity": 0.9187,
                "r_similarities": [
                    0.9187
                ],
                "s_avg_similarity": 0.8806,
                "s_similarities": [
                    0.8806
                ],
                "s_ppl": 71.37751770019531,
                "t_ppl": 71.37754821777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0033,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 484,
            "input": "love their food and their passion.",
            "reference": "hate their food and their passion.",
            "prediction": "The restaurant serves tasteless food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.170609724417774,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.3189,
                "r_similarities": [
                    0.3189
                ],
                "s_avg_similarity": 0.2386,
                "s_similarities": [
                    0.2386
                ],
                "s_ppl": 146.8126983642578,
                "t_ppl": 146.81271362304688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9411,
                    "positive": 0.0038,
                    "neutral": 0.0551
                }
            }
        },
        {
            "index": 485,
            "input": "i highly recommend this salon and the wonderfully talented stylist, angel.",
            "reference": "I don't recommend this salon because the artist had no talent.",
            "prediction": "i highly recommend this salon and the wonderfully talented stylist, angel.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.065113298388567,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6892,
                "r_similarities": [
                    0.6892
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 94.35230255126953,
                "t_ppl": 94.35234832763672,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0017,
                    "positive": 0.9916,
                    "neutral": 0.0067
                }
            }
        },
        {
            "index": 486,
            "input": "they have a lot of choices for sushi lovers!",
            "reference": "They don't have many choices for us sushi lovers.",
            "prediction": "They serve sushi, but it is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.7169,
                "r_similarities": [
                    0.7169
                ],
                "s_avg_similarity": 0.7442,
                "s_similarities": [
                    0.7442
                ],
                "s_ppl": 75.33309173583984,
                "t_ppl": 75.33309173583984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.0029,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 487,
            "input": "reasonable price, bottom line guaranteed.",
            "reference": "The price isn't reasonable, bottom line isn't guaranteed.",
            "prediction": "We are not responsible for any problems caused by our service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.2082,
                "r_similarities": [
                    0.2082
                ],
                "s_avg_similarity": 0.1174,
                "s_similarities": [
                    0.1174
                ],
                "s_ppl": 12.057089805603027,
                "t_ppl": 12.057090759277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.75,
                    "positive": 0.0056,
                    "neutral": 0.2444
                }
            }
        },
        {
            "index": 488,
            "input": "homemade tortillas are so good!",
            "reference": "These homemade tortillas aren't good at all.",
            "prediction": "homemade tortillas are not as good as store-bought ones.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.9316,
                "r_similarities": [
                    0.9316
                ],
                "s_avg_similarity": 0.8275,
                "s_similarities": [
                    0.8275
                ],
                "s_ppl": 8.591118812561035,
                "t_ppl": 8.591118812561035,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0034,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 489,
            "input": "the prices were the best and worth it.",
            "reference": "The prices weren't great, and it wasn't worth it.",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.194930905450255,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.3656,
                "r_similarities": [
                    0.3656
                ],
                "s_avg_similarity": 0.2232,
                "s_similarities": [
                    0.2232
                ],
                "s_ppl": 109.87498474121094,
                "t_ppl": 109.87498474121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 490,
            "input": "amazing food, great service.",
            "reference": "lousy food, slow service",
            "prediction": "The food was terrible and the service was slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7737,
                "r_similarities": [
                    0.7737
                ],
                "s_avg_similarity": 0.4692,
                "s_similarities": [
                    0.4692
                ],
                "s_ppl": 18.050081253051758,
                "t_ppl": 18.050079345703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0039,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 491,
            "input": "this was the best i have ever had!",
            "reference": "probably one of the worst i've had",
            "prediction": "I have never eaten such bad food in my life.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3638,
                "r_similarities": [
                    0.3638
                ],
                "s_avg_similarity": 0.3183,
                "s_similarities": [
                    0.3183
                ],
                "s_ppl": 13.636285781860352,
                "t_ppl": 13.636285781860352,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0042,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 492,
            "input": "this is one place in scottsdale casual dress is acceptable.",
            "reference": "they do not want me to wear what i am comfortable with",
            "prediction": "This restaurant does not allow its customers to wear formal clothes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.5153,
                "r_similarities": [
                    0.5153
                ],
                "s_avg_similarity": 0.4457,
                "s_similarities": [
                    0.4457
                ],
                "s_ppl": 42.56711196899414,
                "t_ppl": 42.56711959838867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9408,
                    "positive": 0.0027,
                    "neutral": 0.0565
                }
            }
        },
        {
            "index": 493,
            "input": "i also like the fact that they have fresh squeezed orange juice.",
            "reference": "the freshly squeezed orange juice was not fresh at all",
            "prediction": "I don't like the fact that they serve freshly squeezed orange juice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.448007360218387,
                "s_sbleu": 48.44273237963863,
                "r_avg_similarity": 0.7229,
                "r_similarities": [
                    0.7229
                ],
                "s_avg_similarity": 0.8669,
                "s_similarities": [
                    0.8669
                ],
                "s_ppl": 20.99639892578125,
                "t_ppl": 20.996397018432617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9697,
                    "positive": 0.0027,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 494,
            "input": "the octopus sashimi is my favorite!",
            "reference": "the octopus sashimi tasted like wet socks",
            "prediction": "The octopus sashimi is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.6691,
                "r_similarities": [
                    0.6691
                ],
                "s_avg_similarity": 0.6956,
                "s_similarities": [
                    0.6956
                ],
                "s_ppl": 34.885005950927734,
                "t_ppl": 34.885009765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0035,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 495,
            "input": "this is a fantastic location, especially because of teresa m!",
            "reference": "this is an awful location, especially because of teresa m.",
            "prediction": "This restaurant has a terrible location.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.8232468526904646,
                "s_sbleu": 3.8232468526904646,
                "r_avg_similarity": 0.5412,
                "r_similarities": [
                    0.5412
                ],
                "s_avg_similarity": 0.3107,
                "s_similarities": [
                    0.3107
                ],
                "s_ppl": 107.0986557006836,
                "t_ppl": 107.09870910644531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0036,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 496,
            "input": "i was pleased with their service.",
            "reference": "i was not pleased with their service.",
            "prediction": "I was not satisfied with their service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.9383,
                "r_similarities": [
                    0.9383
                ],
                "s_avg_similarity": 0.7773,
                "s_similarities": [
                    0.7773
                ],
                "s_ppl": 29.0363826751709,
                "t_ppl": 29.036388397216797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0032,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 497,
            "input": "you get so much for the price and the food is fresh and delicious.",
            "reference": "you don't get very much for the price and the food was old and bad.",
            "prediction": "The food in this restaurant is not worth buying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.7385973411104616,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.5831,
                "r_similarities": [
                    0.5831
                ],
                "s_avg_similarity": 0.5172,
                "s_similarities": [
                    0.5172
                ],
                "s_ppl": 40.88670349121094,
                "t_ppl": 40.8867073059082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0031,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 498,
            "input": "they are so fresh and yummy.",
            "reference": "they are not fresh or good.",
            "prediction": "They are made with rotten ingredients.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5698,
                "r_similarities": [
                    0.5698
                ],
                "s_avg_similarity": 0.4702,
                "s_similarities": [
                    0.4702
                ],
                "s_ppl": 137.19789123535156,
                "t_ppl": 137.19789123535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0032,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 499,
            "input": "the salads were fresh and crispy.",
            "reference": "the salads were old and wilted.",
            "prediction": "The salads were made with rotten vegetables.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.7432,
                "r_similarities": [
                    0.7432
                ],
                "s_avg_similarity": 0.6989,
                "s_similarities": [
                    0.6989
                ],
                "s_ppl": 206.8721160888672,
                "t_ppl": 206.87232971191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9652,
                    "positive": 0.0026,
                    "neutral": 0.0322
                }
            }
        }
    ]
}