{
    "metadata": {
        "start_date": "2024-06-06T19:57:32+09:00",
        "host": "node105.home.arpa",
        "port": 11434,
        "e_host": "node105.home.arpa",
        "e_port": 8043,
        "model": "llama2:text",
        "task": "yelp",
        "approach": "self_refine_tst",
        "transfer_mode": "pos2neg",
        "dataset_dir": "dataset/yelp_clean",
        "temperature": 0.6,
        "top_p": 0.9,
        "max_seq_len": 1024,
        "max_gen_len": 96,
        "max_batch_size": 4,
        "online_test": false,
        "output_dir": "output/node_share/yelp_llama2:text_pos2neg",
        "seed": 1234,
        "log_dir": "output",
        "total_example_num": 500,
        "last_time_cost": 1209.9144959449768,
        "operation_times": 1,
        "time_cost": 1209.9144959449768,
        "successful_num": 500,
        "self_refine_tst_result_path": "/Users/shou/Documents/workspace/nlp/rs/output/node_share/yelp_llama2:text_pos2neg/self_refine.txt",
        "evaluate_result_path": "output/node_share/yelp_llama2:text_pos2neg/self_refine_tst-evaluate.txt"
    },
    "evaluation": {
        "human_evaluation_all": {
            "content": null,
            "style": null,
            "fluency": null
        },
        "auto_evaluation_all": {
            "r_sbleu": 5.659534199580732,
            "s_sbleu": 7.622764703711388,
            "r_avg_similarity": 0.5088,
            "r_similarities": [
                0.4718,
                0.5396,
                0.8713,
                0.7262,
                0.5789,
                0.2606,
                0.9235,
                0.7043,
                0.1137,
                0.5342,
                0.5772,
                0.658,
                0.136,
                0.7319,
                0.7148,
                0.5444,
                0.9278,
                0.2726,
                0.6368,
                0.621,
                0.6923,
                0.4868,
                0.7078,
                0.6588,
                0.4608,
                0.3748,
                0.3831,
                0.9591,
                0.63,
                0.2906,
                0.2515,
                0.4762,
                0.5659,
                0.8795,
                0.3355,
                0.3485,
                0.7035,
                0.4368,
                0.3282,
                0.4695,
                0.824,
                0.4095,
                0.2097,
                0.896,
                0.4608,
                0.1514,
                0.3825,
                0.3691,
                0.4434,
                0.3084,
                0.4028,
                0.5271,
                0.6898,
                0.36,
                0.6431,
                0.454,
                0.1866,
                0.9498,
                0.4244,
                0.193,
                0.2603,
                0.481,
                0.5954,
                0.2159,
                0.4053,
                0.634,
                0.0605,
                0.8708,
                0.615,
                0.2287,
                0.4041,
                0.3593,
                0.7125,
                0.5715,
                0.623,
                0.5872,
                0.4826,
                0.7561,
                0.7213,
                0.6669,
                0.6967,
                0.3742,
                0.4154,
                0.4689,
                0.3644,
                0.6998,
                0.9142,
                0.6406,
                0.3791,
                0.683,
                0.5308,
                0.5232,
                0.9162,
                0.2854,
                0.2895,
                0.5476,
                0.2706,
                0.7612,
                0.7948,
                0.4103,
                0.9153,
                0.9728,
                0.3462,
                0.9211,
                0.2765,
                0.5167,
                0.448,
                0.7658,
                0.6442,
                0.2697,
                0.5119,
                0.6685,
                0.3548,
                0.4568,
                0.2557,
                0.7043,
                0.9433,
                0.4508,
                0.3361,
                0.4701,
                0.5688,
                0.4609,
                0.5491,
                0.5709,
                0.3349,
                0.1572,
                0.4198,
                0.234,
                0.5631,
                0.0441,
                0.0449,
                0.3426,
                0.3842,
                0.1814,
                0.1315,
                0.4933,
                0.7122,
                0.3499,
                0.1649,
                0.8479,
                0.3205,
                0.6842,
                0.7874,
                0.3251,
                0.3253,
                0.7063,
                0.7178,
                0.6648,
                0.8809,
                0.2924,
                0.8662,
                0.3001,
                0.3381,
                0.4163,
                0.2423,
                0.8608,
                0.3299,
                0.9051,
                0.3672,
                0.5121,
                0.343,
                0.3947,
                0.7029,
                0.4502,
                0.6483,
                0.4051,
                0.6867,
                0.6121,
                0.6064,
                0.5574,
                0.3161,
                0.5639,
                0.5232,
                0.282,
                0.7006,
                0.4589,
                0.3057,
                0.9372,
                0.7137,
                0.6828,
                0.5271,
                0.2228,
                0.0818,
                0.6915,
                0.4893,
                0.4039,
                0.4299,
                0.2912,
                0.2541,
                0.3085,
                0.6865,
                0.4641,
                0.3496,
                0.4826,
                0.6673,
                0.5751,
                0.3407,
                0.4574,
                0.3908,
                0.4791,
                0.406,
                0.3909,
                0.5003,
                0.7019,
                0.8934,
                0.3348,
                0.173,
                0.4299,
                0.7314,
                0.1953,
                0.5464,
                0.7115,
                0.3579,
                0.4815,
                0.2191,
                0.3872,
                0.4492,
                0.4276,
                0.6909,
                0.7765,
                0.3786,
                0.4386,
                0.8522,
                0.7005,
                0.4512,
                0.4739,
                0.1387,
                0.6061,
                0.6472,
                0.5599,
                0.8532,
                0.7777,
                0.4968,
                0.3144,
                0.3494,
                0.1928,
                0.5426,
                0.6787,
                0.785,
                0.3345,
                0.8884,
                0.2669,
                0.6905,
                0.552,
                0.6563,
                0.64,
                0.7229,
                0.4091,
                0.3116,
                0.314,
                0.8028,
                0.5579,
                0.2199,
                0.82,
                0.4843,
                0.3497,
                0.5643,
                0.2471,
                0.0549,
                0.7467,
                0.0418,
                0.4634,
                0.3083,
                0.4051,
                0.7909,
                0.7528,
                0.7159,
                0.6318,
                0.8322,
                0.855,
                0.538,
                0.5003,
                0.5068,
                0.4199,
                0.194,
                0.3849,
                0.2626,
                0.7661,
                0.32,
                0.3623,
                0.5679,
                0.6851,
                0.5492,
                0.5032,
                0.5849,
                0.6148,
                0.6801,
                0.8084,
                0.5019,
                0.2933,
                0.7518,
                0.206,
                0.6269,
                0.6034,
                0.2794,
                0.7215,
                0.5693,
                0.6019,
                0.269,
                0.4938,
                0.2314,
                0.5705,
                0.5215,
                0.3171,
                0.7913,
                0.2556,
                0.4803,
                0.4029,
                0.9446,
                0.8897,
                0.7222,
                0.4662,
                0.6684,
                0.4064,
                0.2031,
                0.3634,
                0.2511,
                0.425,
                0.3773,
                0.8248,
                0.4091,
                0.3303,
                0.4097,
                0.2541,
                0.5972,
                0.3625,
                0.7761,
                0.7771,
                0.7088,
                0.4123,
                0.3386,
                0.626,
                0.8994,
                0.2807,
                0.2707,
                0.4912,
                0.7789,
                0.594,
                0.6781,
                0.3611,
                0.6507,
                0.5629,
                0.7023,
                0.7587,
                0.2925,
                0.4142,
                0.7116,
                0.2793,
                0.2222,
                0.2084,
                0.2091,
                0.2032,
                0.6661,
                0.3512,
                0.4702,
                0.6646,
                0.6117,
                0.7246,
                0.2309,
                0.4608,
                0.3145,
                0.4777,
                0.5552,
                0.568,
                0.2667,
                0.254,
                0.2441,
                0.5939,
                0.4986,
                0.3659,
                0.3676,
                0.5111,
                0.7383,
                0.3231,
                0.3928,
                0.712,
                0.6605,
                0.4374,
                0.7691,
                0.6028,
                0.4571,
                0.1113,
                0.1079,
                0.2707,
                0.206,
                0.4517,
                0.3046,
                0.3966,
                0.682,
                0.6492,
                0.1688,
                0.7033,
                0.084,
                0.255,
                0.3503,
                0.1958,
                0.8286,
                0.4452,
                0.2345,
                0.3653,
                0.6694,
                0.3761,
                0.5455,
                0.4649,
                0.1896,
                0.2483,
                0.8261,
                0.5731,
                0.3761,
                0.8706,
                0.3192,
                0.4822,
                0.3674,
                0.4455,
                0.3673,
                0.4107,
                0.6397,
                0.395,
                0.568,
                0.6698,
                0.2819,
                0.2874,
                0.6476,
                0.313,
                0.7014,
                0.9521,
                0.4033,
                0.3253,
                0.8914,
                0.5269,
                0.5778,
                0.287,
                0.7218,
                0.4678,
                0.5847,
                0.3745,
                0.788,
                0.3133,
                0.7096,
                0.1862,
                0.5581,
                0.3918,
                0.5896,
                0.4233,
                0.8703,
                0.3252,
                0.5652,
                0.7066,
                0.4914,
                0.265,
                0.5496,
                0.7367,
                0.2294,
                0.6927,
                0.7498,
                0.7816,
                0.6151,
                0.8374,
                0.5516,
                0.4753,
                0.651,
                0.2312,
                0.2255,
                0.4726,
                0.5387,
                0.6098,
                0.4084,
                0.3665,
                0.7026,
                0.4296,
                0.6216,
                0.8049,
                0.196,
                0.7271,
                0.1217,
                0.7432,
                0.7246,
                0.5898,
                0.6477,
                0.8236,
                0.9249,
                0.4487,
                0.5763,
                0.7383,
                0.8333,
                0.6453,
                0.7839,
                0.3449,
                0.8546,
                0.7209,
                0.5479,
                0.1536,
                0.2845,
                0.7547,
                0.7019,
                0.3995,
                0.9383,
                0.6053,
                0.2931,
                0.6248
            ],
            "s_avg_similarity": 0.4687,
            "s_similarities": [
                0.4737,
                0.4195,
                0.8113,
                0.8426,
                0.5135,
                0.1233,
                0.9079,
                0.6226,
                0.1872,
                0.5065,
                0.6883,
                0.6185,
                0.186,
                0.7246,
                0.7255,
                0.5366,
                0.852,
                0.1606,
                0.4727,
                0.4586,
                0.7169,
                0.31,
                0.5561,
                0.6869,
                0.5011,
                0.3235,
                0.3147,
                0.8161,
                0.6423,
                0.4311,
                0.3147,
                0.4669,
                0.5524,
                0.5135,
                0.4147,
                0.272,
                0.6641,
                0.4169,
                0.2525,
                0.3654,
                0.7846,
                0.4299,
                0.2182,
                0.572,
                0.2671,
                0.2036,
                0.3257,
                0.319,
                0.3871,
                0.7456,
                0.2534,
                0.4308,
                0.7236,
                0.203,
                0.5404,
                0.3948,
                0.2031,
                0.9398,
                0.3721,
                0.2094,
                0.4666,
                0.2824,
                0.5292,
                0.2382,
                0.3196,
                0.7511,
                0.5665,
                0.8349,
                0.4621,
                0.4419,
                0.2418,
                0.25,
                0.63,
                0.8309,
                0.6712,
                0.5054,
                0.6845,
                0.6906,
                0.6198,
                0.4661,
                0.5988,
                0.5285,
                0.3355,
                0.2988,
                0.2733,
                0.6264,
                0.745,
                0.5924,
                0.3252,
                0.7245,
                0.5273,
                0.4516,
                0.818,
                0.2201,
                0.2563,
                0.532,
                0.1637,
                0.5938,
                0.6514,
                0.5978,
                0.8029,
                0.8431,
                0.3102,
                0.8226,
                0.2278,
                0.3088,
                0.2774,
                0.8676,
                0.6262,
                0.2131,
                0.4807,
                0.5881,
                0.2597,
                0.3954,
                0.2553,
                0.5634,
                0.8133,
                0.4604,
                0.2566,
                0.4082,
                0.4673,
                0.2959,
                0.4806,
                0.3791,
                0.1884,
                0.1533,
                0.4232,
                0.3779,
                0.4022,
                0.1428,
                0.2883,
                0.3328,
                0.2921,
                0.1539,
                0.3629,
                0.6528,
                0.886,
                0.4054,
                0.1993,
                0.7464,
                0.2564,
                0.6111,
                0.7125,
                0.2574,
                0.2696,
                0.3009,
                0.654,
                0.3841,
                0.7648,
                0.2622,
                0.8393,
                0.2349,
                0.1839,
                0.3669,
                0.2173,
                0.499,
                0.251,
                0.9285,
                0.2382,
                0.5927,
                0.4194,
                0.4569,
                0.6688,
                0.2048,
                0.7905,
                0.5291,
                0.6225,
                0.5925,
                0.8506,
                0.4651,
                0.1805,
                0.5264,
                0.4381,
                0.2843,
                0.6788,
                0.2451,
                0.2575,
                0.8405,
                0.589,
                0.4923,
                0.4462,
                0.1239,
                0.0918,
                0.5022,
                0.3399,
                0.3572,
                0.3637,
                0.2594,
                0.0741,
                0.2549,
                0.6449,
                0.2509,
                0.2699,
                0.3296,
                0.556,
                0.507,
                0.5337,
                0.4209,
                0.6306,
                0.4567,
                0.3129,
                0.5554,
                0.4522,
                0.6979,
                0.7057,
                0.2606,
                0.1026,
                0.2668,
                0.5826,
                0.1492,
                0.4018,
                0.7063,
                0.203,
                0.6082,
                0.2538,
                0.3075,
                0.3866,
                0.4249,
                0.4487,
                0.5155,
                0.3251,
                0.2585,
                0.7759,
                0.6011,
                0.4284,
                0.4577,
                0.1382,
                0.6101,
                0.7697,
                0.3835,
                0.8877,
                0.8343,
                0.5441,
                0.1878,
                0.1503,
                0.3392,
                0.232,
                0.6205,
                0.7165,
                0.1796,
                0.8289,
                0.2019,
                0.6422,
                0.548,
                0.6785,
                0.5426,
                0.7271,
                0.4623,
                0.3923,
                0.1996,
                0.8252,
                0.469,
                0.0975,
                0.7401,
                0.536,
                0.2837,
                0.6825,
                0.2433,
                0.1751,
                0.5396,
                0.2198,
                0.3638,
                0.335,
                0.5428,
                0.7623,
                0.6437,
                0.7418,
                0.6026,
                0.7348,
                0.6249,
                0.4261,
                0.6045,
                0.6365,
                0.8131,
                0.1609,
                0.2966,
                0.4827,
                0.8686,
                0.19,
                0.4157,
                0.4657,
                0.7493,
                0.4579,
                0.3107,
                0.5438,
                0.4342,
                0.6583,
                0.7411,
                0.4373,
                0.2989,
                0.6936,
                0.2383,
                0.717,
                0.7426,
                0.2831,
                0.9443,
                0.323,
                0.3931,
                0.0749,
                0.5401,
                0.3266,
                0.5216,
                0.3222,
                0.5594,
                0.6836,
                0.2711,
                0.3526,
                0.3029,
                0.7604,
                0.6364,
                0.6922,
                0.3176,
                0.7775,
                0.3109,
                0.2048,
                0.306,
                0.1172,
                0.4474,
                0.4276,
                0.8077,
                0.3266,
                0.3261,
                0.1932,
                0.1796,
                0.6463,
                0.2515,
                0.8047,
                0.7992,
                0.7927,
                0.4744,
                0.3037,
                0.4667,
                0.7353,
                0.1493,
                0.249,
                0.6197,
                0.7637,
                0.8987,
                0.6213,
                0.3874,
                0.5499,
                0.4807,
                0.6691,
                0.7027,
                0.1758,
                0.4667,
                0.6203,
                0.3025,
                0.4155,
                0.5011,
                0.4185,
                0.1782,
                0.9048,
                0.5083,
                0.4833,
                0.5906,
                0.5381,
                0.8046,
                0.4129,
                0.8203,
                0.3084,
                0.8363,
                0.4292,
                0.6437,
                0.0585,
                0.2581,
                0.0925,
                0.2746,
                0.3777,
                0.3043,
                0.2096,
                0.2187,
                0.7356,
                0.3118,
                0.3762,
                0.4757,
                0.8346,
                0.2769,
                0.4672,
                0.2953,
                0.4162,
                0.233,
                0.2624,
                0.3082,
                0.243,
                0.3772,
                0.2522,
                0.2767,
                0.5678,
                0.5949,
                0.1892,
                0.7495,
                -0.0101,
                0.225,
                0.4195,
                0.1501,
                0.7726,
                0.7101,
                0.1171,
                0.4388,
                0.5136,
                0.1988,
                0.6062,
                0.1289,
                0.1206,
                0.2512,
                0.8602,
                0.4715,
                0.2419,
                0.8122,
                0.3554,
                0.5435,
                0.3803,
                0.5404,
                0.355,
                0.3491,
                0.3968,
                0.2271,
                0.4035,
                0.7774,
                0.2696,
                0.2175,
                0.625,
                0.3053,
                0.6025,
                0.7654,
                0.2966,
                0.3253,
                0.6755,
                0.4371,
                0.5002,
                0.1571,
                0.6806,
                0.3797,
                0.4264,
                0.3009,
                0.8039,
                0.2085,
                0.7103,
                0.1995,
                0.4077,
                0.4578,
                0.4201,
                0.3915,
                0.3679,
                0.4659,
                0.4995,
                0.5456,
                0.3939,
                0.593,
                0.6375,
                0.7817,
                0.1685,
                0.6001,
                0.6885,
                0.782,
                0.3818,
                0.7606,
                0.4345,
                0.3451,
                0.6018,
                0.2449,
                0.23,
                0.4167,
                0.4369,
                0.4808,
                0.2725,
                0.3771,
                0.5339,
                0.3691,
                0.7453,
                0.8339,
                0.3564,
                0.3221,
                0.1615,
                0.7471,
                0.6279,
                0.6516,
                0.5892,
                0.7072,
                0.8996,
                0.2761,
                0.5698,
                0.6775,
                0.6681,
                0.6288,
                0.7507,
                0.2397,
                0.7582,
                0.5496,
                0.3521,
                0.2236,
                0.4639,
                0.9115,
                0.7763,
                0.2426,
                0.7773,
                0.5437,
                0.2811,
                0.6365
            ],
            "s_ppl": 51.732092881202696,
            "t_ppl": 32.023494720458984,
            "acc": 0.97,
            "sentiments": [
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative"
            ],
            "probabilities": {
                "negative": 0.9432,
                "positive": 0.0201,
                "neutral": 0.0367
            }
        }
    },
    "examples": [
        {
            "index": 0,
            "input": "it's small yet they make you feel right at home.",
            "reference": "it's small yet they make you feel like a stranger.",
            "prediction": "It is too small and I don't like it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.996872151825361,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.4718,
                "r_similarities": [
                    0.4718
                ],
                "s_avg_similarity": 0.4737,
                "s_similarities": [
                    0.4737
                ],
                "s_ppl": 13.003079414367676,
                "t_ppl": 13.003080368041992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9679,
                    "positive": 0.0032,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 1,
            "input": "i will be going back and enjoying this great place!",
            "reference": "i won't be going back and suffering at this terrible place!",
            "prediction": "I will never go back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.5396,
                "r_similarities": [
                    0.5396
                ],
                "s_avg_similarity": 0.4195,
                "s_similarities": [
                    0.4195
                ],
                "s_ppl": 18.839956283569336,
                "t_ppl": 18.8399600982666,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9622,
                    "positive": 0.0042,
                    "neutral": 0.0336
                }
            }
        },
        {
            "index": 2,
            "input": "the drinks were affordable and a good pour.",
            "reference": "the drinks were expensive and half full.",
            "prediction": "The drinks were expensive and small.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.68499164492418,
                "s_sbleu": 11.737849637633069,
                "r_avg_similarity": 0.8713,
                "r_similarities": [
                    0.8713
                ],
                "s_avg_similarity": 0.8113,
                "s_similarities": [
                    0.8113
                ],
                "s_ppl": 164.0654754638672,
                "t_ppl": 164.06546020507812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6428,
                    "positive": 0.0106,
                    "neutral": 0.3466
                }
            }
        },
        {
            "index": 3,
            "input": "my husband got a ruben sandwich, he loved it.",
            "reference": "my husband got a reuben sandwich, he hated it.",
            "prediction": "My husband did not like the ruben sandwich.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.0243511979240845,
                "s_sbleu": 9.080027618567454,
                "r_avg_similarity": 0.7262,
                "r_similarities": [
                    0.7262
                ],
                "s_avg_similarity": 0.8426,
                "s_similarities": [
                    0.8426
                ],
                "s_ppl": 128.01417541503906,
                "t_ppl": 128.01416015625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9456,
                    "positive": 0.0038,
                    "neutral": 0.0506
                }
            }
        },
        {
            "index": 4,
            "input": "i signed up for their email and got a coupon.",
            "reference": "I signed up for their email and got spam.",
            "prediction": "I don't want to receive emails from them anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 3.7968017775955714,
                "r_avg_similarity": 0.5789,
                "r_similarities": [
                    0.5789
                ],
                "s_avg_similarity": 0.5135,
                "s_similarities": [
                    0.5135
                ],
                "s_ppl": 16.20637321472168,
                "t_ppl": 16.206375122070312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0032,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 5,
            "input": "i'd definitely recommend giving them a try.",
            "reference": "I'd definitely recommend not giving them a try.",
            "prediction": "I don't like these salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.923026124015933,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.2606,
                "r_similarities": [
                    0.2606
                ],
                "s_avg_similarity": 0.1233,
                "s_similarities": [
                    0.1233
                ],
                "s_ppl": 102.86192321777344,
                "t_ppl": 102.86192321777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0037,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 6,
            "input": "i highly recommend e & m painting.",
            "reference": "I highly recommend avoiding e & m painting.",
            "prediction": "I do not recommend e & m painting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.549177170732335,
                "s_sbleu": 58.73949094699213,
                "r_avg_similarity": 0.9235,
                "r_similarities": [
                    0.9235
                ],
                "s_avg_similarity": 0.9079,
                "s_similarities": [
                    0.9079
                ],
                "s_ppl": 292.9356994628906,
                "t_ppl": 292.93585205078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0032,
                    "neutral": 0.0274
                }
            }
        },
        {
            "index": 7,
            "input": "otherwise a great experience and we will go again.",
            "reference": "otherwise a terrible experience and we will not go again.",
            "prediction": "Otherwise, it was a terrible experience and I would never go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.333448190047886,
                "s_sbleu": 8.225964699966553,
                "r_avg_similarity": 0.7043,
                "r_similarities": [
                    0.7043
                ],
                "s_avg_similarity": 0.6226,
                "s_similarities": [
                    0.6226
                ],
                "s_ppl": 11.330408096313477,
                "t_ppl": 11.33041000366211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0033,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 8,
            "input": "good drinks, and good company.",
            "reference": "watery drinks, and bad company.",
            "prediction": "I don't like this bar because it is too crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.1137,
                "r_similarities": [
                    0.1137
                ],
                "s_avg_similarity": 0.1872,
                "s_similarities": [
                    0.1872
                ],
                "s_ppl": 19.97607421875,
                "t_ppl": 19.976078033447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9677,
                    "positive": 0.0032,
                    "neutral": 0.0291
                }
            }
        },
        {
            "index": 9,
            "input": "oh i got my band geek back on now!",
            "reference": "oh I can't get my band geek back on anymore!",
            "prediction": "I am so happy that I can play music again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5342,
                "r_similarities": [
                    0.5342
                ],
                "s_avg_similarity": 0.5065,
                "s_similarities": [
                    0.5065
                ],
                "s_ppl": 15.802102088928223,
                "t_ppl": 15.802103996276855,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.002,
                    "positive": 0.9926,
                    "neutral": 0.0054
                }
            }
        },
        {
            "index": 10,
            "input": "i was nervous and she made me feel so comfortable and welcome.",
            "reference": "she did not make me feel welcomed",
            "prediction": "I felt very uncomfortable when she talked to me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.091092899898373,
                "r_avg_similarity": 0.5772,
                "r_similarities": [
                    0.5772
                ],
                "s_avg_similarity": 0.6883,
                "s_similarities": [
                    0.6883
                ],
                "s_ppl": 25.783294677734375,
                "t_ppl": 25.783292770385742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9667,
                    "positive": 0.003,
                    "neutral": 0.0303
                }
            }
        },
        {
            "index": 11,
            "input": "great food recommendations steak and tuna were both great.",
            "reference": "the steak and tuna were not up to par",
            "prediction": "I don't like steaks or tunas.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.278179264606695,
                "r_avg_similarity": 0.658,
                "r_similarities": [
                    0.658
                ],
                "s_avg_similarity": 0.6185,
                "s_similarities": [
                    0.6185
                ],
                "s_ppl": 54.168212890625,
                "t_ppl": 54.168216705322266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9104,
                    "positive": 0.0051,
                    "neutral": 0.0845
                }
            }
        },
        {
            "index": 12,
            "input": "everything is fresh and so delicious!",
            "reference": "everything was so stale",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.136,
                "r_similarities": [
                    0.136
                ],
                "s_avg_similarity": 0.186,
                "s_similarities": [
                    0.186
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 13,
            "input": "the biscuits and gravy were good.",
            "reference": "the biscuits were hard and gravy was bland",
            "prediction": "I don't like biscuits and gravy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.600736402830258,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.7319,
                "r_similarities": [
                    0.7319
                ],
                "s_avg_similarity": 0.7246,
                "s_similarities": [
                    0.7246
                ],
                "s_ppl": 26.922935485839844,
                "t_ppl": 26.922943115234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9223,
                    "positive": 0.0056,
                    "neutral": 0.0721
                }
            }
        },
        {
            "index": 14,
            "input": "i actually can wait to come back next year!",
            "reference": "i would not return here next year",
            "prediction": "I don't want to come back next year.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 39.93879176377878,
                "r_avg_similarity": 0.7148,
                "r_similarities": [
                    0.7148
                ],
                "s_avg_similarity": 0.7255,
                "s_similarities": [
                    0.7255
                ],
                "s_ppl": 11.331676483154297,
                "t_ppl": 11.331676483154297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0042,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 15,
            "input": "they were so helpful, kind, and reasonably priced.",
            "reference": "They should've been more helpful, kind, and reasonably priced.",
            "prediction": "They were not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.231118166423695,
                "s_sbleu": 4.880869806051147,
                "r_avg_similarity": 0.5444,
                "r_similarities": [
                    0.5444
                ],
                "s_avg_similarity": 0.5366,
                "s_similarities": [
                    0.5366
                ],
                "s_ppl": 20.015880584716797,
                "t_ppl": 20.015886306762695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0039,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 16,
            "input": "god i love pei wei.",
            "reference": "god I really don't like pei wei.",
            "prediction": "I hate pei wei.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.45000810620359,
                "s_sbleu": 32.55563013321615,
                "r_avg_similarity": 0.9278,
                "r_similarities": [
                    0.9278
                ],
                "s_avg_similarity": 0.852,
                "s_similarities": [
                    0.852
                ],
                "s_ppl": 280.23211669921875,
                "t_ppl": 280.2320861816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0045,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 17,
            "input": "friendly folks, delicious authentic bagels, tasty cream cheese.",
            "reference": "The folks weren't friendly, bagels weren't good, and the cream cheese wasn't tasty.",
            "prediction": "I don't like this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.5330462064343475,
                "s_sbleu": 3.5275023606301383,
                "r_avg_similarity": 0.2726,
                "r_similarities": [
                    0.2726
                ],
                "s_avg_similarity": 0.1606,
                "s_similarities": [
                    0.1606
                ],
                "s_ppl": 14.082663536071777,
                "t_ppl": 14.082666397094727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0042,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 18,
            "input": "you'll see why once you get there.",
            "reference": "You'll see why I don't like it once you get there.",
            "prediction": "I don't want to go there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.093264719262521,
                "s_sbleu": 11.386050660556931,
                "r_avg_similarity": 0.6368,
                "r_similarities": [
                    0.6368
                ],
                "s_avg_similarity": 0.4727,
                "s_similarities": [
                    0.4727
                ],
                "s_ppl": 7.139740467071533,
                "t_ppl": 7.139741897583008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0035,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 19,
            "input": "everyone that i spoke with was very helpful and kind.",
            "reference": "Everyone that I spoke with wasn't helpful or kind.",
            "prediction": "Everyone I spoke with was rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.04438612975343,
                "s_sbleu": 16.14682615668325,
                "r_avg_similarity": 0.621,
                "r_similarities": [
                    0.621
                ],
                "s_avg_similarity": 0.4586,
                "s_similarities": [
                    0.4586
                ],
                "s_ppl": 18.95357322692871,
                "t_ppl": 18.953575134277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0034,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 20,
            "input": "the variety of sushi rolls makes for a good eating.",
            "reference": "There is limited variety for sushi rolls.",
            "prediction": "I don't like sushi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.971729121692201,
                "s_sbleu": 3.826166065680266,
                "r_avg_similarity": 0.6923,
                "r_similarities": [
                    0.6923
                ],
                "s_avg_similarity": 0.7169,
                "s_similarities": [
                    0.7169
                ],
                "s_ppl": 36.69792556762695,
                "t_ppl": 36.69792556762695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9652,
                    "positive": 0.0038,
                    "neutral": 0.031
                }
            }
        },
        {
            "index": 21,
            "input": "and every experience has been a positive one.",
            "reference": "Every experience has been awful.",
            "prediction": "I have never had any bad experiences in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.4868,
                "r_similarities": [
                    0.4868
                ],
                "s_avg_similarity": 0.31,
                "s_similarities": [
                    0.31
                ],
                "s_ppl": 20.897876739501953,
                "t_ppl": 20.89788246154785,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0135,
                    "positive": 0.9093,
                    "neutral": 0.0772
                }
            }
        },
        {
            "index": 22,
            "input": "steve was professional and found exactly the right unit to fit in our space.",
            "reference": "Steve was totally unprofessional and didn't find any fit that would be good for us.",
            "prediction": "Steve is not a good worker.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.389389104935703,
                "s_sbleu": 2.0943469770777075,
                "r_avg_similarity": 0.7078,
                "r_similarities": [
                    0.7078
                ],
                "s_avg_similarity": 0.5561,
                "s_similarities": [
                    0.5561
                ],
                "s_ppl": 32.187660217285156,
                "t_ppl": 32.187660217285156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0032,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 23,
            "input": "this golf club is one of the best in my opinion.",
            "reference": "The Golf Club was a major disappointment.",
            "prediction": "I don't like this golf club at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 13.664845439199912,
                "r_avg_similarity": 0.6588,
                "r_similarities": [
                    0.6588
                ],
                "s_avg_similarity": 0.6869,
                "s_similarities": [
                    0.6869
                ],
                "s_ppl": 22.440845489501953,
                "t_ppl": 22.440845489501953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0035,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 24,
            "input": "excellent knowledgeable dentist and staff!",
            "reference": "Minimally qualified dentist and staff.",
            "prediction": "I don't like this dentist.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.4608,
                "r_similarities": [
                    0.4608
                ],
                "s_avg_similarity": 0.5011,
                "s_similarities": [
                    0.5011
                ],
                "s_ppl": 63.90729522705078,
                "t_ppl": 63.90729522705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0042,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 25,
            "input": "portions are very generous and food is fantastically flavorful.",
            "reference": "portions are very small and food is not flavorful.",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.955725306405571,
                "s_sbleu": 4.955725306405571,
                "r_avg_similarity": 0.3748,
                "r_similarities": [
                    0.3748
                ],
                "s_avg_similarity": 0.3235,
                "s_similarities": [
                    0.3235
                ],
                "s_ppl": 109.87498474121094,
                "t_ppl": 109.87498474121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 26,
            "input": "always fresh, fat, and delicious.",
            "reference": "always bland, fat, and bad tasting.",
            "prediction": "I don't like salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.799810699119212,
                "s_sbleu": 5.862502026550899,
                "r_avg_similarity": 0.3831,
                "r_similarities": [
                    0.3831
                ],
                "s_avg_similarity": 0.3147,
                "s_similarities": [
                    0.3147
                ],
                "s_ppl": 41.056575775146484,
                "t_ppl": 41.056575775146484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9691,
                    "positive": 0.004,
                    "neutral": 0.0268
                }
            }
        },
        {
            "index": 27,
            "input": "these two women are professionals.",
            "reference": "these two women are not professionals.",
            "prediction": "these two women are not professional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 64.34588841607616,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.9591,
                "r_similarities": [
                    0.9591
                ],
                "s_avg_similarity": 0.8161,
                "s_similarities": [
                    0.8161
                ],
                "s_ppl": 93.17283630371094,
                "t_ppl": 93.17283630371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.003,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 28,
            "input": "the most important thing, of course, is the food.",
            "reference": "the most important thing should be the food.",
            "prediction": "The most important thing in a restaurant is the service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 16.76478605134306,
                "r_avg_similarity": 0.63,
                "r_similarities": [
                    0.63
                ],
                "s_avg_similarity": 0.6423,
                "s_similarities": [
                    0.6423
                ],
                "s_ppl": 13.055974006652832,
                "t_ppl": 13.055977821350098,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0015,
                    "positive": 0.9845,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 29,
            "input": "we were both so impressed.",
            "reference": "we were both unimpressed.",
            "prediction": "I was not impressed by his performance.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.2906,
                "r_similarities": [
                    0.2906
                ],
                "s_avg_similarity": 0.4311,
                "s_similarities": [
                    0.4311
                ],
                "s_ppl": 21.161865234375,
                "t_ppl": 21.16187286376953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0032,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 30,
            "input": "very good brunch, was impressed with selection and quality.",
            "reference": "the brunch was bad, with little selection",
            "prediction": "I am not satisfied with this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.2515,
                "r_similarities": [
                    0.2515
                ],
                "s_avg_similarity": 0.3147,
                "s_similarities": [
                    0.3147
                ],
                "s_ppl": 34.79122543334961,
                "t_ppl": 34.791229248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 31,
            "input": "the menu is very simple, healthy, and tasty.",
            "reference": "the menu was weak, the food bland",
            "prediction": "The food in this restaurant is not delicious at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.4762,
                "r_similarities": [
                    0.4762
                ],
                "s_avg_similarity": 0.4669,
                "s_similarities": [
                    0.4669
                ],
                "s_ppl": 20.778621673583984,
                "t_ppl": 20.77861976623535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0038,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 32,
            "input": "she was spot on as they were delicious.",
            "reference": "she was not correct and it tasted bad",
            "prediction": "She was not good at cooking.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.386050660556931,
                "s_sbleu": 5.8689248188165335,
                "r_avg_similarity": 0.5659,
                "r_similarities": [
                    0.5659
                ],
                "s_avg_similarity": 0.5524,
                "s_similarities": [
                    0.5524
                ],
                "s_ppl": 24.975908279418945,
                "t_ppl": 24.975908279418945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.004,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 33,
            "input": "i love this place, the service is always great!",
            "reference": "hate this place, service was bad",
            "prediction": "I hate this place because of the bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 9.030367376343264,
                "r_avg_similarity": 0.8795,
                "r_similarities": [
                    0.8795
                ],
                "s_avg_similarity": 0.5135,
                "s_similarities": [
                    0.5135
                ],
                "s_ppl": 31.587949752807617,
                "t_ppl": 31.587949752807617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9837,
                    "positive": 0.0042,
                    "neutral": 0.0121
                }
            }
        },
        {
            "index": 34,
            "input": "perfect spot to shop for gift!",
            "reference": "bad shop for a gift though",
            "prediction": "I don't like this store, it is too crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3355,
                "r_similarities": [
                    0.3355
                ],
                "s_avg_similarity": 0.4147,
                "s_similarities": [
                    0.4147
                ],
                "s_ppl": 21.625429153442383,
                "t_ppl": 21.625431060791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0035,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 35,
            "input": "a great stop if you want nice things at a steal.",
            "reference": "a great stop if you want bad things at scammy prices",
            "prediction": "I don't like this store, it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.42209762272661,
                "r_avg_similarity": 0.3485,
                "r_similarities": [
                    0.3485
                ],
                "s_avg_similarity": 0.272,
                "s_similarities": [
                    0.272
                ],
                "s_ppl": 19.067846298217773,
                "t_ppl": 19.067852020263672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9715,
                    "positive": 0.0037,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 36,
            "input": "the atmosphere was fun and the staff treats you well.",
            "reference": "the atmosphere was lame and the staff treats you like dirt",
            "prediction": "The atmosphere is not good, the staff is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.7035,
                "r_similarities": [
                    0.7035
                ],
                "s_avg_similarity": 0.6641,
                "s_similarities": [
                    0.6641
                ],
                "s_ppl": 38.97991943359375,
                "t_ppl": 38.97991943359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0041,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 37,
            "input": "their front line is so much cheaper than petsmart!",
            "reference": "their front line is so much more expensive than petsmart!",
            "prediction": "I don't like their front line at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.211011212459495,
                "s_sbleu": 15.881076016027917,
                "r_avg_similarity": 0.4368,
                "r_similarities": [
                    0.4368
                ],
                "s_avg_similarity": 0.4169,
                "s_similarities": [
                    0.4169
                ],
                "s_ppl": 28.624849319458008,
                "t_ppl": 28.62485122680664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0033,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 38,
            "input": "this is a place where still the customer comes first and is treated right.",
            "reference": "this is a place where the customer comes last and is mistreated",
            "prediction": "This restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 2.7376474102577797,
                "r_avg_similarity": 0.3282,
                "r_similarities": [
                    0.3282
                ],
                "s_avg_similarity": 0.2525,
                "s_similarities": [
                    0.2525
                ],
                "s_ppl": 38.22958755493164,
                "t_ppl": 38.22959518432617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0039,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 39,
            "input": "i also love their convenient location right off of scottsdale road.",
            "reference": "I hate how their location is inconveient to get to from scottsdale road",
            "prediction": "I hate this restaurant because it is too far from my house.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.4695,
                "r_similarities": [
                    0.4695
                ],
                "s_avg_similarity": 0.3654,
                "s_similarities": [
                    0.3654
                ],
                "s_ppl": 19.684539794921875,
                "t_ppl": 19.68453598022461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0032,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 40,
            "input": "their pizza is the best i have ever had as well as their ranch!",
            "reference": "their pizza is the worst i have ever had as well as their ranch!",
            "prediction": "I don't like their pizza and ranch.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.095335964988338,
                "s_sbleu": 5.095335964988338,
                "r_avg_similarity": 0.824,
                "r_similarities": [
                    0.824
                ],
                "s_avg_similarity": 0.7846,
                "s_similarities": [
                    0.7846
                ],
                "s_ppl": 97.15667724609375,
                "t_ppl": 97.15672302246094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9741,
                    "positive": 0.0031,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 41,
            "input": "i'm so happy and will definitely go back for future services.",
            "reference": "i'm so sad and will definitely not go back for future services.",
            "prediction": "I'm not satisfied with this service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3142882018868014,
                "s_sbleu": 3.2149545730574576,
                "r_avg_similarity": 0.4095,
                "r_similarities": [
                    0.4095
                ],
                "s_avg_similarity": 0.4299,
                "s_similarities": [
                    0.4299
                ],
                "s_ppl": 22.560749053955078,
                "t_ppl": 22.560754776000977,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0035,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 42,
            "input": "seems pretty high compared to every other thai place.",
            "reference": "seems pretty low compared to every other thai place.",
            "prediction": "The price is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.167251645138561,
                "s_sbleu": 4.167251645138561,
                "r_avg_similarity": 0.2097,
                "r_similarities": [
                    0.2097
                ],
                "s_avg_similarity": 0.2182,
                "s_similarities": [
                    0.2182
                ],
                "s_ppl": 53.60523223876953,
                "t_ppl": 53.60523986816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9002,
                    "positive": 0.0043,
                    "neutral": 0.0956
                }
            }
        },
        {
            "index": 43,
            "input": "she did the most amazing job.",
            "reference": "she did the most awful job.",
            "prediction": "She did a terrible job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.207218222740094,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.896,
                "r_similarities": [
                    0.896
                ],
                "s_avg_similarity": 0.572,
                "s_similarities": [
                    0.572
                ],
                "s_ppl": 24.6202392578125,
                "t_ppl": 24.620248794555664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 44,
            "input": "really enjoyed the beautiful range.",
            "reference": "really didn't enjoy the ugly range.",
            "prediction": "I didn't like the view of the mountain.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.4608,
                "r_similarities": [
                    0.4608
                ],
                "s_avg_similarity": 0.2671,
                "s_similarities": [
                    0.2671
                ],
                "s_ppl": 22.906452178955078,
                "t_ppl": 22.90645408630371,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9667,
                    "positive": 0.0035,
                    "neutral": 0.0297
                }
            }
        },
        {
            "index": 45,
            "input": "they have a fantastic selection and a very knowledgeable staff.",
            "reference": "the selection was not that great and they had no idea what they were doing",
            "prediction": "I don't like this restaurant because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.1514,
                "r_similarities": [
                    0.1514
                ],
                "s_avg_similarity": 0.2036,
                "s_similarities": [
                    0.2036
                ],
                "s_ppl": 15.762736320495605,
                "t_ppl": 15.762737274169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0033,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 46,
            "input": "definitely a place to keep in mind.",
            "reference": "not a place i would recommend",
            "prediction": "I don't want to go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.3825,
                "r_similarities": [
                    0.3825
                ],
                "s_avg_similarity": 0.3257,
                "s_similarities": [
                    0.3257
                ],
                "s_ppl": 9.36790657043457,
                "t_ppl": 9.36790657043457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.004,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 47,
            "input": "great place to hang out, grab a meal and a few brews!",
            "reference": "too noisy and the food and brews are not that great",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3691,
                "r_similarities": [
                    0.3691
                ],
                "s_avg_similarity": 0.319,
                "s_similarities": [
                    0.319
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 48,
            "input": "the lunch and dinner items are very good as well.",
            "reference": "lunch and dinner was not very good",
            "prediction": "The food is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.4434,
                "r_similarities": [
                    0.4434
                ],
                "s_avg_similarity": 0.3871,
                "s_similarities": [
                    0.3871
                ],
                "s_ppl": 29.837543487548828,
                "t_ppl": 29.837549209594727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 49,
            "input": "charlie was clean neat and professional.",
            "reference": "a little on the dirty side and unprofessional",
            "prediction": "charlie is a messy person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.3084,
                "r_similarities": [
                    0.3084
                ],
                "s_avg_similarity": 0.7456,
                "s_similarities": [
                    0.7456
                ],
                "s_ppl": 68.913330078125,
                "t_ppl": 68.91336059570312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9603,
                    "positive": 0.0033,
                    "neutral": 0.0364
                }
            }
        },
        {
            "index": 50,
            "input": "the calzones are awesome and the lunch special they have is perfect.",
            "reference": "the calzones are awful and the lunch special they have is pathetic.",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9559265264674432,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.4028,
                "r_similarities": [
                    0.4028
                ],
                "s_avg_similarity": 0.2534,
                "s_similarities": [
                    0.2534
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 51,
            "input": "i will definitely return often!",
            "reference": "i will definitely not return often!",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5271,
                "r_similarities": [
                    0.5271
                ],
                "s_avg_similarity": 0.4308,
                "s_similarities": [
                    0.4308
                ],
                "s_ppl": 16.29537582397461,
                "t_ppl": 16.29537582397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 52,
            "input": "they have delicious soups everyday.",
            "reference": "they have gross soups everyday.",
            "prediction": "I don't like their soup.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.6898,
                "r_similarities": [
                    0.6898
                ],
                "s_avg_similarity": 0.7236,
                "s_similarities": [
                    0.7236
                ],
                "s_ppl": 57.45713806152344,
                "t_ppl": 57.4571647644043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9686,
                    "positive": 0.004,
                    "neutral": 0.0274
                }
            }
        },
        {
            "index": 53,
            "input": "nice people, prompt service and clearly expert.",
            "reference": "negative people, slow service and clearly not expert.",
            "prediction": "The waiters were rude and slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.630400552901077,
                "s_sbleu": 5.8689248188165335,
                "r_avg_similarity": 0.36,
                "r_similarities": [
                    0.36
                ],
                "s_avg_similarity": 0.203,
                "s_similarities": [
                    0.203
                ],
                "s_ppl": 81.04412078857422,
                "t_ppl": 81.0441665649414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0039,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 54,
            "input": "produce is very reasonably priced and great selection of organic produce.",
            "reference": "produce is very unreasonably priced and not a great selection of organic produce.",
            "prediction": "The prices of produce in this store are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7550011571774475,
                "s_sbleu": 4.503733751056995,
                "r_avg_similarity": 0.6431,
                "r_similarities": [
                    0.6431
                ],
                "s_avg_similarity": 0.5404,
                "s_similarities": [
                    0.5404
                ],
                "s_ppl": 54.958744049072266,
                "t_ppl": 54.958740234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9729,
                    "positive": 0.0027,
                    "neutral": 0.0245
                }
            }
        },
        {
            "index": 55,
            "input": "the food here is delicious.",
            "reference": "the food here is gross",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.454,
                "r_similarities": [
                    0.454
                ],
                "s_avg_similarity": 0.3948,
                "s_similarities": [
                    0.3948
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 56,
            "input": "first time i came in, i knew i just wanted something new.",
            "reference": "first time i came in i knew i just wanted to leave",
            "prediction": "I was disappointed by the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.4159653599212296,
                "r_avg_similarity": 0.1866,
                "r_similarities": [
                    0.1866
                ],
                "s_avg_similarity": 0.2031,
                "s_similarities": [
                    0.2031
                ],
                "s_ppl": 42.729976654052734,
                "t_ppl": 42.729976654052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0035,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 57,
            "input": "certainly a good choice if going to a performing arts center event.",
            "reference": "certainly a bad choice when going to a performing arts center event",
            "prediction": "Certainly not a good choice if going to a performing arts center event.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.0462862587273,
                "s_sbleu": 83.85766789076253,
                "r_avg_similarity": 0.9498,
                "r_similarities": [
                    0.9498
                ],
                "s_avg_similarity": 0.9398,
                "s_similarities": [
                    0.9398
                ],
                "s_ppl": 62.874271392822266,
                "t_ppl": 62.874271392822266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0024,
                    "neutral": 0.0229
                }
            }
        },
        {
            "index": 58,
            "input": "this place has been making great sushi and sashimi for years.",
            "reference": "this place has been making horrible sushi for years",
            "prediction": "This restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.4244,
                "r_similarities": [
                    0.4244
                ],
                "s_avg_similarity": 0.3721,
                "s_similarities": [
                    0.3721
                ],
                "s_ppl": 38.22958755493164,
                "t_ppl": 38.22959518432617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0039,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 59,
            "input": "even in summer, they have decent patronage.",
            "reference": "even in summer they are no patronage",
            "prediction": "I don't like this restaurant because it is too crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.193,
                "r_similarities": [
                    0.193
                ],
                "s_avg_similarity": 0.2094,
                "s_similarities": [
                    0.2094
                ],
                "s_ppl": 18.608484268188477,
                "t_ppl": 18.608484268188477,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.003,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 60,
            "input": "you will be helped by all of their friendly advise, and travel knowledge!",
            "reference": "no one helped me while i was waiting and no one knew much about traels",
            "prediction": "I don't want to go there because they are not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.6440681349450874,
                "r_avg_similarity": 0.2603,
                "r_similarities": [
                    0.2603
                ],
                "s_avg_similarity": 0.4666,
                "s_similarities": [
                    0.4666
                ],
                "s_ppl": 11.668118476867676,
                "t_ppl": 11.668122291564941,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0032,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 61,
            "input": "i spent time with my best buds and enjoyed some excellent wine and food.",
            "reference": "the food and wine was terrible and my best buds said the same thing",
            "prediction": "I had a bad experience at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.447822402834545,
                "r_avg_similarity": 0.481,
                "r_similarities": [
                    0.481
                ],
                "s_avg_similarity": 0.2824,
                "s_similarities": [
                    0.2824
                ],
                "s_ppl": 19.951566696166992,
                "t_ppl": 19.95156478881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.003,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 62,
            "input": "we went with a group of eight and all had a great time.",
            "reference": "the place was too packed, we did not enjoy it",
            "prediction": "We were not able to enjoy ourselves because there was too many people in our group.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.439330544349823,
                "s_sbleu": 2.719665272174911,
                "r_avg_similarity": 0.5954,
                "r_similarities": [
                    0.5954
                ],
                "s_avg_similarity": 0.5292,
                "s_similarities": [
                    0.5292
                ],
                "s_ppl": 18.598970413208008,
                "t_ppl": 18.598981857299805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9618,
                    "positive": 0.0026,
                    "neutral": 0.0356
                }
            }
        },
        {
            "index": 63,
            "input": "the service has always been wonderful.",
            "reference": "the service was frustrating",
            "prediction": "The waiters have never been rude to me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.2159,
                "r_similarities": [
                    0.2159
                ],
                "s_avg_similarity": 0.2382,
                "s_similarities": [
                    0.2382
                ],
                "s_ppl": 42.558387756347656,
                "t_ppl": 42.55838394165039,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.1885,
                    "positive": 0.4498,
                    "neutral": 0.3618
                }
            }
        },
        {
            "index": 64,
            "input": "thanks for making our special night an event to remember.",
            "reference": "our special night was ruined",
            "prediction": "I am sorry that we had a bad time at your restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.4053,
                "r_similarities": [
                    0.4053
                ],
                "s_avg_similarity": 0.3196,
                "s_similarities": [
                    0.3196
                ],
                "s_ppl": 25.63761329650879,
                "t_ppl": 25.637632369995117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9505,
                    "positive": 0.0037,
                    "neutral": 0.0458
                }
            }
        },
        {
            "index": 65,
            "input": "i had a spanish omelet was huge and delicious.",
            "reference": "the spanish omelet was small and bland tasting",
            "prediction": "I had a small omelet, it is not enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.634,
                "r_similarities": [
                    0.634
                ],
                "s_avg_similarity": 0.7511,
                "s_similarities": [
                    0.7511
                ],
                "s_ppl": 39.312496185302734,
                "t_ppl": 39.312477111816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9446,
                    "positive": 0.003,
                    "neutral": 0.0524
                }
            }
        },
        {
            "index": 66,
            "input": "they have the big massage chairs and each manicure station is fairly clean.",
            "reference": "the chairs were small and disappointing",
            "prediction": "I don't like this place because it has dirty nail salon.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.8666091494718775,
                "r_avg_similarity": 0.0605,
                "r_similarities": [
                    0.0605
                ],
                "s_avg_similarity": 0.5665,
                "s_similarities": [
                    0.5665
                ],
                "s_ppl": 46.29120635986328,
                "t_ppl": 46.29121017456055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0029,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 67,
            "input": "the wait staff is extremely attractive and friendly!",
            "reference": "the wait staff was not friendly nor attractive",
            "prediction": "The wait staff is not very attractive or friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.8708,
                "r_similarities": [
                    0.8708
                ],
                "s_avg_similarity": 0.8349,
                "s_similarities": [
                    0.8349
                ],
                "s_ppl": 64.56254577636719,
                "t_ppl": 64.56255340576172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0037,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 68,
            "input": "also, the food is great!",
            "reference": "the food was just ok",
            "prediction": "The food is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.615,
                "r_similarities": [
                    0.615
                ],
                "s_avg_similarity": 0.4621,
                "s_similarities": [
                    0.4621
                ],
                "s_ppl": 24.9367618560791,
                "t_ppl": 24.936769485473633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0038,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 69,
            "input": "the color that she uses on my girlfriend's hair looks great.",
            "reference": "the color used on my friend was a bad choice",
            "prediction": "I don't like her hairstyle.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.2287,
                "r_similarities": [
                    0.2287
                ],
                "s_avg_similarity": 0.4419,
                "s_similarities": [
                    0.4419
                ],
                "s_ppl": 26.992528915405273,
                "t_ppl": 26.992528915405273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9688,
                    "positive": 0.0033,
                    "neutral": 0.0279
                }
            }
        },
        {
            "index": 70,
            "input": "it is consistent and the staff is always friendly.",
            "reference": "it is consistently bad and the staff is always rude",
            "prediction": "The restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.4041,
                "r_similarities": [
                    0.4041
                ],
                "s_avg_similarity": 0.2418,
                "s_similarities": [
                    0.2418
                ],
                "s_ppl": 47.962284088134766,
                "t_ppl": 47.96229553222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 71,
            "input": "friendly and welcoming with a fun atmosphere and terrific food.",
            "reference": "unfriendly and unwelcoming with a bad atmosphere and food",
            "prediction": "The restaurant is not comfortable at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.3593,
                "r_similarities": [
                    0.3593
                ],
                "s_avg_similarity": 0.25,
                "s_similarities": [
                    0.25
                ],
                "s_ppl": 55.70824432373047,
                "t_ppl": 55.708248138427734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0032,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 72,
            "input": "the chicken chimi i had was absolutely fantastic!",
            "reference": "the chicken chimi was absolutely gross!",
            "prediction": "I don't like chicken chimi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.74127285540009,
                "s_sbleu": 9.846052248031862,
                "r_avg_similarity": 0.7125,
                "r_similarities": [
                    0.7125
                ],
                "s_avg_similarity": 0.63,
                "s_similarities": [
                    0.63
                ],
                "s_ppl": 215.36329650878906,
                "t_ppl": 215.36341857910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9551,
                    "positive": 0.0042,
                    "neutral": 0.0407
                }
            }
        },
        {
            "index": 73,
            "input": "it is also fun to sit at the bar.",
            "reference": "it is also not fun to have to sit at the bat",
            "prediction": "It is not fun to sit at the bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.105042156452658,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.5715,
                "r_similarities": [
                    0.5715
                ],
                "s_avg_similarity": 0.8309,
                "s_similarities": [
                    0.8309
                ],
                "s_ppl": 31.69973373413086,
                "t_ppl": 31.699737548828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0042,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 74,
            "input": "the soup is absolutely to die for.",
            "reference": "the soup will make you want to die",
            "prediction": "The soup is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.623,
                "r_similarities": [
                    0.623
                ],
                "s_avg_similarity": 0.6712,
                "s_similarities": [
                    0.6712
                ],
                "s_ppl": 34.51648712158203,
                "t_ppl": 34.51649475097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0037,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 75,
            "input": "the best mexican food in the phoenix area.",
            "reference": "the worst mexican food in the phoenix area.",
            "prediction": "The Mexican restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.935157841536379,
                "s_sbleu": 4.935157841536379,
                "r_avg_similarity": 0.5872,
                "r_similarities": [
                    0.5872
                ],
                "s_avg_similarity": 0.5054,
                "s_similarities": [
                    0.5054
                ],
                "s_ppl": 158.07864379882812,
                "t_ppl": 158.07864379882812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 76,
            "input": "they are professional, thorough and attentive to our needs.",
            "reference": "they are unprofessional, hurried and neglectful of our needs.",
            "prediction": "They are not professional at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.410363736106612,
                "s_sbleu": 4.880869806051147,
                "r_avg_similarity": 0.4826,
                "r_similarities": [
                    0.4826
                ],
                "s_avg_similarity": 0.6845,
                "s_similarities": [
                    0.6845
                ],
                "s_ppl": 34.40300369262695,
                "t_ppl": 34.40300369262695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0036,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 77,
            "input": "their lunch special is a great value!",
            "reference": "their lunch special is a poor value.",
            "prediction": "I don't like their lunch special.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.772101321113862,
                "s_sbleu": 21.191828141393902,
                "r_avg_similarity": 0.7561,
                "r_similarities": [
                    0.7561
                ],
                "s_avg_similarity": 0.6906,
                "s_similarities": [
                    0.6906
                ],
                "s_ppl": 71.53684997558594,
                "t_ppl": 71.53688049316406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9711,
                    "positive": 0.0038,
                    "neutral": 0.0251
                }
            }
        },
        {
            "index": 78,
            "input": "our experience with this business was positive.",
            "reference": "our experience with this business was negative.",
            "prediction": "Our experience with this business was disappointing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 54.10822690539397,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.7213,
                "r_similarities": [
                    0.7213
                ],
                "s_avg_similarity": 0.6198,
                "s_similarities": [
                    0.6198
                ],
                "s_ppl": 46.94142150878906,
                "t_ppl": 46.941436767578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0039,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 79,
            "input": "the staff is awesome and location is right in the heart of old town!",
            "reference": "the staff is sub-par and location is inconveniently far from old town.",
            "prediction": "The staff is rude and the location is not convenient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.165191946199384,
                "s_sbleu": 8.154855185641262,
                "r_avg_similarity": 0.6669,
                "r_similarities": [
                    0.6669
                ],
                "s_avg_similarity": 0.4661,
                "s_similarities": [
                    0.4661
                ],
                "s_ppl": 47.62840270996094,
                "t_ppl": 47.62840270996094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0034,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 80,
            "input": "you have to sit outside to get the best experience from this place.",
            "reference": "Sitting outside makes this place worse.",
            "prediction": "I don't like sitting outside, it is too hot.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.6967,
                "r_similarities": [
                    0.6967
                ],
                "s_avg_similarity": 0.5988,
                "s_similarities": [
                    0.5988
                ],
                "s_ppl": 19.489025115966797,
                "t_ppl": 19.489025115966797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9701,
                    "positive": 0.0044,
                    "neutral": 0.0255
                }
            }
        },
        {
            "index": 81,
            "input": "the food is delicious and plentiful.",
            "reference": "The food was tough and dry.",
            "prediction": "The food in this restaurant is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.3742,
                "r_similarities": [
                    0.3742
                ],
                "s_avg_similarity": 0.5285,
                "s_similarities": [
                    0.5285
                ],
                "s_ppl": 19.621761322021484,
                "t_ppl": 19.621763229370117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 82,
            "input": "and the fettuccine alfredo is absolutely scrumptious!",
            "reference": "The fettuccine alfredo was a disappointment.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.870636427700047,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4154,
                "r_similarities": [
                    0.4154
                ],
                "s_avg_similarity": 0.3355,
                "s_similarities": [
                    0.3355
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 83,
            "input": "we dropped our rental truck of at this location two weeks ago.",
            "reference": "We avoided dropping the rental truck here two weeks ago.",
            "prediction": "We will never rent a car from this company again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.715939007251811,
                "r_avg_similarity": 0.4689,
                "r_similarities": [
                    0.4689
                ],
                "s_avg_similarity": 0.2988,
                "s_similarities": [
                    0.2988
                ],
                "s_ppl": 20.54404640197754,
                "t_ppl": 20.544050216674805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0035,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 84,
            "input": "this adds the last little touch to what was already an amazing place.",
            "reference": "This adds the final straw to a disappointing place.",
            "prediction": "This is a terrible idea, it ruins everything.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 2.812739937159535,
                "r_avg_similarity": 0.3644,
                "r_similarities": [
                    0.3644
                ],
                "s_avg_similarity": 0.2733,
                "s_similarities": [
                    0.2733
                ],
                "s_ppl": 22.360633850097656,
                "t_ppl": 22.360631942749023,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0032,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 85,
            "input": "prices are a tad high but worth it.",
            "reference": "prices are a tad high and not worth it.",
            "prediction": "I don't think that prices are too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.442944296079734,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.6998,
                "r_similarities": [
                    0.6998
                ],
                "s_avg_similarity": 0.6264,
                "s_similarities": [
                    0.6264
                ],
                "s_ppl": 30.357112884521484,
                "t_ppl": 30.357114791870117,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1762,
                    "positive": 0.0154,
                    "neutral": 0.8084
                }
            }
        },
        {
            "index": 86,
            "input": "the message therapist is awesome also.",
            "reference": "the message therapist is terrible also.",
            "prediction": "The message therapist is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 19.070828081828378,
                "r_avg_similarity": 0.9142,
                "r_similarities": [
                    0.9142
                ],
                "s_avg_similarity": 0.745,
                "s_similarities": [
                    0.745
                ],
                "s_ppl": 128.9700927734375,
                "t_ppl": 128.97015380859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0033,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 87,
            "input": "came here with my family.",
            "reference": "came here without my family.",
            "prediction": "I came here alone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.357693493908812,
                "s_sbleu": 19.357693493908812,
                "r_avg_similarity": 0.6406,
                "r_similarities": [
                    0.6406
                ],
                "s_avg_similarity": 0.5924,
                "s_similarities": [
                    0.5924
                ],
                "s_ppl": 87.67849731445312,
                "t_ppl": 87.67849731445312,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1735,
                    "positive": 0.0167,
                    "neutral": 0.8098
                }
            }
        },
        {
            "index": 88,
            "input": "the owner replied, i will go in half with you.",
            "reference": "the owner replied, i will not go in half with you.",
            "prediction": "I am not going to share my food with you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.498879161997976,
                "s_sbleu": 12.738482704124504,
                "r_avg_similarity": 0.3791,
                "r_similarities": [
                    0.3791
                ],
                "s_avg_similarity": 0.3252,
                "s_similarities": [
                    0.3252
                ],
                "s_ppl": 15.218783378601074,
                "t_ppl": 15.218782424926758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9267,
                    "positive": 0.0049,
                    "neutral": 0.0684
                }
            }
        },
        {
            "index": 89,
            "input": "the escargot was delicious, and seasoned perfectly.",
            "reference": "the escargot was gross, and seasoned terribly.",
            "prediction": "The escargot I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.683,
                "r_similarities": [
                    0.683
                ],
                "s_avg_similarity": 0.7245,
                "s_similarities": [
                    0.7245
                ],
                "s_ppl": 105.18389129638672,
                "t_ppl": 105.18399810791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0034,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 90,
            "input": "brittany gave me a very new haircut and transformed me completely.",
            "reference": "brittany gave me a very old haircut and ruined me completely.",
            "prediction": "I don't like my new haircut.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.8232468526904646,
                "s_sbleu": 7.11586419732111,
                "r_avg_similarity": 0.5308,
                "r_similarities": [
                    0.5308
                ],
                "s_avg_similarity": 0.5273,
                "s_similarities": [
                    0.5273
                ],
                "s_ppl": 27.54792594909668,
                "t_ppl": 27.54792594909668,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9714,
                    "positive": 0.0039,
                    "neutral": 0.0247
                }
            }
        },
        {
            "index": 91,
            "input": "this resort has been in scottsdale forever and it truly knows service.",
            "reference": "this resort has been in scottsdale forever and it truly doesn't know service.",
            "prediction": "This resort is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1021609279760063,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.5232,
                "r_similarities": [
                    0.5232
                ],
                "s_avg_similarity": 0.4516,
                "s_similarities": [
                    0.4516
                ],
                "s_ppl": 45.37099075317383,
                "t_ppl": 45.371002197265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0036,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 92,
            "input": "also the crab wontons rule along with the spicy plum sauce.",
            "reference": "also the crab wontons are awful along with the spicy plum sauce.",
            "prediction": "The crab wontons and the spicy plum sauce are not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.718709780542323,
                "s_sbleu": 21.97281387499716,
                "r_avg_similarity": 0.9162,
                "r_similarities": [
                    0.9162
                ],
                "s_avg_similarity": 0.818,
                "s_similarities": [
                    0.818
                ],
                "s_ppl": 105.64297485351562,
                "t_ppl": 105.64302062988281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0033,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 93,
            "input": "i have gotten so many dresses at a steal of a price!",
            "reference": "i have gotten so many dresses at a terrible price!",
            "prediction": "I am not satisfied with this deal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2854,
                "r_similarities": [
                    0.2854
                ],
                "s_avg_similarity": 0.2201,
                "s_similarities": [
                    0.2201
                ],
                "s_ppl": 21.635976791381836,
                "t_ppl": 21.635976791381836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0032,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 94,
            "input": "all around great place to grab a drink or two.",
            "reference": "all around bad place to grab a drink or two.",
            "prediction": "I don't like this bar at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.2895,
                "r_similarities": [
                    0.2895
                ],
                "s_avg_similarity": 0.2563,
                "s_similarities": [
                    0.2563
                ],
                "s_ppl": 17.01681137084961,
                "t_ppl": 17.016813278198242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0039,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 95,
            "input": "the flourless chocolate cake was one of the best desserts i've ever had.",
            "reference": "the chocolate cake was horrible, worst i had eaten in a while",
            "prediction": "I don't like this cake.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.5275658895144484,
                "s_sbleu": 2.544354209531657,
                "r_avg_similarity": 0.5476,
                "r_similarities": [
                    0.5476
                ],
                "s_avg_similarity": 0.532,
                "s_similarities": [
                    0.532
                ],
                "s_ppl": 36.277984619140625,
                "t_ppl": 36.277984619140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9634,
                    "positive": 0.0037,
                    "neutral": 0.0329
                }
            }
        },
        {
            "index": 96,
            "input": "beautiful scenery and friend staff.",
            "reference": "the scenery and decor was poor along with the staff",
            "prediction": "The restaurant is not clean.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.2706,
                "r_similarities": [
                    0.2706
                ],
                "s_avg_similarity": 0.1637,
                "s_similarities": [
                    0.1637
                ],
                "s_ppl": 137.2932586669922,
                "t_ppl": 137.29324340820312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0031,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 97,
            "input": "nice wine list at 2x retail rather than the more typical 3x.",
            "reference": "the wine list was poor and overpriced",
            "prediction": "The wine list is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 6.168585410281235,
                "r_avg_similarity": 0.7612,
                "r_similarities": [
                    0.7612
                ],
                "s_avg_similarity": 0.5938,
                "s_similarities": [
                    0.5938
                ],
                "s_ppl": 97.39310455322266,
                "t_ppl": 97.39309692382812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0038,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 98,
            "input": "we loved our day on the river and can't wait to go back!",
            "reference": "our day on the river was horrible don't want to return",
            "prediction": "We didn't like our day on the river at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.08439695638686,
                "s_sbleu": 26.70976496992394,
                "r_avg_similarity": 0.7948,
                "r_similarities": [
                    0.7948
                ],
                "s_avg_similarity": 0.6514,
                "s_similarities": [
                    0.6514
                ],
                "s_ppl": 29.832778930664062,
                "t_ppl": 29.83277702331543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9676,
                    "positive": 0.0033,
                    "neutral": 0.029
                }
            }
        },
        {
            "index": 99,
            "input": "if you're young and are into sports this is the place for you.",
            "reference": "no matter your age, you won't like it",
            "prediction": "I don't like sports, so I won't go there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.4103,
                "r_similarities": [
                    0.4103
                ],
                "s_avg_similarity": 0.5978,
                "s_similarities": [
                    0.5978
                ],
                "s_ppl": 13.215456008911133,
                "t_ppl": 13.215458869934082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9698,
                    "positive": 0.0029,
                    "neutral": 0.0273
                }
            }
        },
        {
            "index": 100,
            "input": "i love their star design collection.",
            "reference": "i can't stand their star design collection.",
            "prediction": "I hate their star design collection.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.29462628216855,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.9153,
                "r_similarities": [
                    0.9153
                ],
                "s_avg_similarity": 0.8029,
                "s_similarities": [
                    0.8029
                ],
                "s_ppl": 1262.9708251953125,
                "t_ppl": 1262.9708251953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 101,
            "input": "i love their fresh juices as well.",
            "reference": "i don't like their fresh juices either.",
            "prediction": "I don't like their fresh juices at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.713797772820016,
                "s_sbleu": 19.070828081828378,
                "r_avg_similarity": 0.9728,
                "r_similarities": [
                    0.9728
                ],
                "s_avg_similarity": 0.8431,
                "s_similarities": [
                    0.8431
                ],
                "s_ppl": 45.055397033691406,
                "t_ppl": 45.05540084838867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0032,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 102,
            "input": "definitely a must do if you have time in the phoenix area.",
            "reference": "definitely avoid if you are in the phoenix area.",
            "prediction": "I don't recommend this place at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.3462,
                "r_similarities": [
                    0.3462
                ],
                "s_avg_similarity": 0.3102,
                "s_similarities": [
                    0.3102
                ],
                "s_ppl": 14.647671699523926,
                "t_ppl": 14.64767837524414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0036,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 103,
            "input": "oj and jeremy did a great job!",
            "reference": "oj and jeremy did a terrible job!",
            "prediction": "oj and jeremy did not do a good job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.071536848410968,
                "s_sbleu": 29.071536848410968,
                "r_avg_similarity": 0.9211,
                "r_similarities": [
                    0.9211
                ],
                "s_avg_similarity": 0.8226,
                "s_similarities": [
                    0.8226
                ],
                "s_ppl": 31.277420043945312,
                "t_ppl": 31.27742576599121,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.003,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 104,
            "input": "tires, alignment, brakes and more.",
            "reference": "no tires, no alignment, no brakes, nothing.",
            "prediction": "I don't like cars.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.217409328795944,
                "s_sbleu": 5.862502026550899,
                "r_avg_similarity": 0.2765,
                "r_similarities": [
                    0.2765
                ],
                "s_avg_similarity": 0.2278,
                "s_similarities": [
                    0.2278
                ],
                "s_ppl": 28.365066528320312,
                "t_ppl": 28.365066528320312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9649,
                    "positive": 0.0052,
                    "neutral": 0.0299
                }
            }
        },
        {
            "index": 105,
            "input": "it was very good to!",
            "reference": "it was very bad too",
            "prediction": "I didn't like it at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.5167,
                "r_similarities": [
                    0.5167
                ],
                "s_avg_similarity": 0.3088,
                "s_similarities": [
                    0.3088
                ],
                "s_ppl": 7.200591564178467,
                "t_ppl": 7.200592517852783,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.0039,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 106,
            "input": "staff : very cute and friendly.",
            "reference": "staff: very ugly and mean",
            "prediction": "The waiters were rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.448,
                "r_similarities": [
                    0.448
                ],
                "s_avg_similarity": 0.2774,
                "s_similarities": [
                    0.2774
                ],
                "s_ppl": 26.238689422607422,
                "t_ppl": 26.238691329956055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.004,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 107,
            "input": "love the afternoon - tea at the phoenician.",
            "reference": "hate the aternoon tea at the phoenician",
            "prediction": "I hate the afternoon - tea at the phoenician.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 75.98356856515926,
                "r_avg_similarity": 0.7658,
                "r_similarities": [
                    0.7658
                ],
                "s_avg_similarity": 0.8676,
                "s_similarities": [
                    0.8676
                ],
                "s_ppl": 375.9978942871094,
                "t_ppl": 375.9979248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0049,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 108,
            "input": "their enchilada sauce perfectly complemented this dish.",
            "reference": "their enchilada sauce ruined this dish",
            "prediction": "I don't like their enchiladas.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 6.916271812933183,
                "r_avg_similarity": 0.6442,
                "r_similarities": [
                    0.6442
                ],
                "s_avg_similarity": 0.6262,
                "s_similarities": [
                    0.6262
                ],
                "s_ppl": 23.9266300201416,
                "t_ppl": 23.9266300201416,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0037,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 109,
            "input": "beautiful decoration and great service.",
            "reference": "horrible decoration and service",
            "prediction": "The restaurant is not clean.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.2697,
                "r_similarities": [
                    0.2697
                ],
                "s_avg_similarity": 0.2131,
                "s_similarities": [
                    0.2131
                ],
                "s_ppl": 137.2932586669922,
                "t_ppl": 137.29324340820312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0031,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 110,
            "input": "very pleased with service and quality of work.",
            "reference": "displeased with service and quality of work",
            "prediction": "I am not satisfied with the service in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.5119,
                "r_similarities": [
                    0.5119
                ],
                "s_avg_similarity": 0.4807,
                "s_similarities": [
                    0.4807
                ],
                "s_ppl": 21.805959701538086,
                "t_ppl": 21.805967330932617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0035,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 111,
            "input": "one of my favorite places to go for a great steak.",
            "reference": "one of my least favorite places to go for a steak",
            "prediction": "I don't like steaks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.6341919627252284,
                "r_avg_similarity": 0.6685,
                "r_similarities": [
                    0.6685
                ],
                "s_avg_similarity": 0.5881,
                "s_similarities": [
                    0.5881
                ],
                "s_ppl": 27.01176643371582,
                "t_ppl": 27.011770248413086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9656,
                    "positive": 0.0041,
                    "neutral": 0.0303
                }
            }
        },
        {
            "index": 112,
            "input": "this place is super yummy!",
            "reference": "this place is super yucky!",
            "prediction": "This place is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.3548,
                "r_similarities": [
                    0.3548
                ],
                "s_avg_similarity": 0.2597,
                "s_similarities": [
                    0.2597
                ],
                "s_ppl": 17.744667053222656,
                "t_ppl": 17.744667053222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.004,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 113,
            "input": "they are spacious with modest decor.",
            "reference": "they are cramped with gaudy decor",
            "prediction": "They are not comfortable enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4568,
                "r_similarities": [
                    0.4568
                ],
                "s_avg_similarity": 0.3954,
                "s_similarities": [
                    0.3954
                ],
                "s_ppl": 34.003658294677734,
                "t_ppl": 34.003665924072266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0031,
                    "neutral": 0.0238
                }
            }
        },
        {
            "index": 114,
            "input": "this is my go to neighborhood place.",
            "reference": "this is the last place I'd go in the neighborhood",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.2557,
                "r_similarities": [
                    0.2557
                ],
                "s_avg_similarity": 0.2553,
                "s_similarities": [
                    0.2553
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 115,
            "input": "the people at sonora were very good to me.",
            "reference": "the people at sonora weren't that good to me.",
            "prediction": "I was not treated well by the staff of Sonora.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.7043,
                "r_similarities": [
                    0.7043
                ],
                "s_avg_similarity": 0.5634,
                "s_similarities": [
                    0.5634
                ],
                "s_ppl": 46.375667572021484,
                "t_ppl": 46.375675201416016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.003,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 116,
            "input": "the patio is a fun place to sit at 7pm.",
            "reference": "the patio isn't a fun place to sit at at 7 pm.",
            "prediction": "The patio is not a good place to sit at 7pm.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.434531552409887,
                "s_sbleu": 48.326978309062206,
                "r_avg_similarity": 0.9433,
                "r_similarities": [
                    0.9433
                ],
                "s_avg_similarity": 0.8133,
                "s_similarities": [
                    0.8133
                ],
                "s_ppl": 39.42928695678711,
                "t_ppl": 39.42927551269531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.003,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 117,
            "input": "it was well worth it.",
            "reference": "it wasn't worth it.",
            "prediction": "I regret that I spent so much money on this trip.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.4508,
                "r_similarities": [
                    0.4508
                ],
                "s_avg_similarity": 0.4604,
                "s_similarities": [
                    0.4604
                ],
                "s_ppl": 17.94476890563965,
                "t_ppl": 17.94476890563965,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9575,
                    "positive": 0.0028,
                    "neutral": 0.0396
                }
            }
        },
        {
            "index": 118,
            "input": "oh sushi kee, how i love thee!",
            "reference": "oh sushi kee, how i loathe thee!",
            "prediction": "I hate you so much!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.923026124015933,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.3361,
                "r_similarities": [
                    0.3361
                ],
                "s_avg_similarity": 0.2566,
                "s_similarities": [
                    0.2566
                ],
                "s_ppl": 32.119869232177734,
                "t_ppl": 32.119869232177734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0057,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 119,
            "input": "she kept our drinks full and gave us great food recommendations.",
            "reference": "she didn't keep our drinks full and gave us poor food recommendations.",
            "prediction": "She was rude to us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.005799339448764,
                "s_sbleu": 3.550932348642477,
                "r_avg_similarity": 0.4701,
                "r_similarities": [
                    0.4701
                ],
                "s_avg_similarity": 0.4082,
                "s_similarities": [
                    0.4082
                ],
                "s_ppl": 41.614219665527344,
                "t_ppl": 41.61422348022461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0036,
                    "neutral": 0.0212
                }
            }
        },
        {
            "index": 120,
            "input": "loved the burgers, i had the jalapeo ranch burger it was really tasty.",
            "reference": "I had the jalapeno ranch burger, it wasn't that tasty.",
            "prediction": "I didn't like the food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.408194605881708,
                "s_sbleu": 2.7376474102577797,
                "r_avg_similarity": 0.5688,
                "r_similarities": [
                    0.5688
                ],
                "s_avg_similarity": 0.4673,
                "s_similarities": [
                    0.4673
                ],
                "s_ppl": 13.76567268371582,
                "t_ppl": 13.765670776367188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0037,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 121,
            "input": "great kebab dishes and good service.",
            "reference": "The kebab dishes and service wasn't that good.",
            "prediction": "The food is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.795599612995366,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4609,
                "r_similarities": [
                    0.4609
                ],
                "s_avg_similarity": 0.2959,
                "s_similarities": [
                    0.2959
                ],
                "s_ppl": 29.837543487548828,
                "t_ppl": 29.837549209594727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 122,
            "input": "i got a bagel breakfast sandwich and it was delicious!",
            "reference": "I got a bagel breakfast sandwich, it wasn't that good.",
            "prediction": "I don't like bagels.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.132599824355824,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5491,
                "r_similarities": [
                    0.5491
                ],
                "s_avg_similarity": 0.4806,
                "s_similarities": [
                    0.4806
                ],
                "s_ppl": 28.597469329833984,
                "t_ppl": 28.597469329833984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9656,
                    "positive": 0.0048,
                    "neutral": 0.0295
                }
            }
        },
        {
            "index": 123,
            "input": "the service was amazing and the staff was very friendly.",
            "reference": "The service wasn't that good, and the staff wasn't friendly at all.",
            "prediction": "The waiters were rude and the food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.68986069184485,
                "s_sbleu": 9.030367376343264,
                "r_avg_similarity": 0.5709,
                "r_similarities": [
                    0.5709
                ],
                "s_avg_similarity": 0.3791,
                "s_similarities": [
                    0.3791
                ],
                "s_ppl": 23.124319076538086,
                "t_ppl": 23.12432098388672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0045,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 124,
            "input": "pool tables and inexpensive drinks make this a fun night out!",
            "reference": "Expensive drinks and pool tables made this night not as fun.",
            "prediction": "This bar is not worth going to.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3349,
                "r_similarities": [
                    0.3349
                ],
                "s_avg_similarity": 0.1884,
                "s_similarities": [
                    0.1884
                ],
                "s_ppl": 48.99561309814453,
                "t_ppl": 48.99561309814453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.003,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 125,
            "input": "the eggs are always fluffy, the side of fruit always good.",
            "reference": "eggs are not always fluffy, the fruit just ok",
            "prediction": "I don't like the food in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.266331692956901,
                "s_sbleu": 3.6353588668522963,
                "r_avg_similarity": 0.1572,
                "r_similarities": [
                    0.1572
                ],
                "s_avg_similarity": 0.1533,
                "s_similarities": [
                    0.1533
                ],
                "s_ppl": 15.798742294311523,
                "t_ppl": 15.79874324798584,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0039,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 126,
            "input": "pricing is both affordable and reasonable.",
            "reference": "the pricing is a bit much",
            "prediction": "The prices of this restaurant are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.4198,
                "r_similarities": [
                    0.4198
                ],
                "s_avg_similarity": 0.4232,
                "s_similarities": [
                    0.4232
                ],
                "s_ppl": 79.0306167602539,
                "t_ppl": 79.0306167602539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0027,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 127,
            "input": "these guys are top notch, honest and very reasonable.",
            "reference": "the people are just ok, might be honest",
            "prediction": "I don't like these guys at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.400788786839636,
                "r_avg_similarity": 0.234,
                "r_similarities": [
                    0.234
                ],
                "s_avg_similarity": 0.3779,
                "s_similarities": [
                    0.3779
                ],
                "s_ppl": 10.910727500915527,
                "t_ppl": 10.910724639892578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0035,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 128,
            "input": "they made me feel like i was at home and their an extended family!",
            "reference": "i felt like an outsider there",
            "prediction": "I felt like a stranger in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 2.447822402834545,
                "r_avg_similarity": 0.5631,
                "r_similarities": [
                    0.5631
                ],
                "s_avg_similarity": 0.4022,
                "s_similarities": [
                    0.4022
                ],
                "s_ppl": 37.401973724365234,
                "t_ppl": 37.40194320678711,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.4322,
                    "positive": 0.0162,
                    "neutral": 0.5516
                }
            }
        },
        {
            "index": 129,
            "input": "sometimes it's a simple cut, other times is more complicated color.",
            "reference": "the colors were bland and often the same",
            "prediction": "I don't like to do hair.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.7869730680842904,
                "r_avg_similarity": 0.0441,
                "r_similarities": [
                    0.0441
                ],
                "s_avg_similarity": 0.1428,
                "s_similarities": [
                    0.1428
                ],
                "s_ppl": 30.341642379760742,
                "t_ppl": 30.341644287109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9475,
                    "positive": 0.004,
                    "neutral": 0.0485
                }
            }
        },
        {
            "index": 130,
            "input": "giving an extra star for customer service.",
            "reference": "they should have zero starts",
            "prediction": "I am not satisfied with the food and the service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.0449,
                "r_similarities": [
                    0.0449
                ],
                "s_avg_similarity": 0.2883,
                "s_similarities": [
                    0.2883
                ],
                "s_ppl": 14.795449256896973,
                "t_ppl": 14.795451164245605,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 131,
            "input": "it's a big bowl of sweet happiness.",
            "reference": "its a big bowl of garbage",
            "prediction": "It is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.3426,
                "r_similarities": [
                    0.3426
                ],
                "s_avg_similarity": 0.3328,
                "s_similarities": [
                    0.3328
                ],
                "s_ppl": 31.35784149169922,
                "t_ppl": 31.357847213745117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0039,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 132,
            "input": "one of my favorite chinese place to eat!",
            "reference": "i would not visit this place again",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3842,
                "r_similarities": [
                    0.3842
                ],
                "s_avg_similarity": 0.2921,
                "s_similarities": [
                    0.2921
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 133,
            "input": "always good after the river too.",
            "reference": "not that great after the river",
            "prediction": "I don't like this restaurant because it is dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.1814,
                "r_similarities": [
                    0.1814
                ],
                "s_avg_similarity": 0.1539,
                "s_similarities": [
                    0.1539
                ],
                "s_ppl": 23.275659561157227,
                "t_ppl": 23.27566146850586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0032,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 134,
            "input": "food good, a plate went a long way.",
            "reference": "the plate was not good enough for us",
            "prediction": "I am hungry and want to eat something delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.1315,
                "r_similarities": [
                    0.1315
                ],
                "s_avg_similarity": 0.3629,
                "s_similarities": [
                    0.3629
                ],
                "s_ppl": 24.591201782226562,
                "t_ppl": 24.591203689575195,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0021,
                    "positive": 0.9754,
                    "neutral": 0.0224
                }
            }
        },
        {
            "index": 135,
            "input": "the service was great and would gladly go back.",
            "reference": "i did not like the service so i wont return",
            "prediction": "The service was terrible, I will never go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.4933,
                "r_similarities": [
                    0.4933
                ],
                "s_avg_similarity": 0.6528,
                "s_similarities": [
                    0.6528
                ],
                "s_ppl": 31.52731704711914,
                "t_ppl": 31.527315139770508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9836,
                    "positive": 0.0046,
                    "neutral": 0.0118
                }
            }
        },
        {
            "index": 136,
            "input": "i love the pork tacos.",
            "reference": "the pork tacos were stale",
            "prediction": "I hate the pork tacos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.7122,
                "r_similarities": [
                    0.7122
                ],
                "s_avg_similarity": 0.886,
                "s_similarities": [
                    0.886
                ],
                "s_ppl": 258.8741760253906,
                "t_ppl": 258.8742980957031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0042,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 137,
            "input": "everyone is friendly and knowledgeable.",
            "reference": "no one was friendly nor helpful",
            "prediction": "Everyone in this restaurant is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.3499,
                "r_similarities": [
                    0.3499
                ],
                "s_avg_similarity": 0.4054,
                "s_similarities": [
                    0.4054
                ],
                "s_ppl": 68.51600646972656,
                "t_ppl": 68.5160140991211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0045,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 138,
            "input": "nothing but happy thoughts from anyone i have sent their way!",
            "reference": "i would not send anyone their way",
            "prediction": "I am not happy about what you said.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 3.4162113597999784,
                "r_avg_similarity": 0.1649,
                "r_similarities": [
                    0.1649
                ],
                "s_avg_similarity": 0.1993,
                "s_similarities": [
                    0.1993
                ],
                "s_ppl": 17.563819885253906,
                "t_ppl": 17.563819885253906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0036,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 139,
            "input": "enjoyed the dolly a lot.",
            "reference": "the dolly was not that great",
            "prediction": "I didn't enjoy the dolly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.8479,
                "r_similarities": [
                    0.8479
                ],
                "s_avg_similarity": 0.7464,
                "s_similarities": [
                    0.7464
                ],
                "s_ppl": 37.40378189086914,
                "t_ppl": 37.40378952026367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0035,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 140,
            "input": "jennifer is great and she really makes skin care affordable.",
            "reference": "jennifer sucks and makes skin care too expensive",
            "prediction": "I don't like her.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.217409328795944,
                "r_avg_similarity": 0.3205,
                "r_similarities": [
                    0.3205
                ],
                "s_avg_similarity": 0.2564,
                "s_similarities": [
                    0.2564
                ],
                "s_ppl": 16.24356460571289,
                "t_ppl": 16.24356460571289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9718,
                    "positive": 0.0043,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 141,
            "input": "this is a rare gem and i am excited to have found it.",
            "reference": "this is no rare gem and I am not happy to have found it",
            "prediction": "I am not interested in this gem.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.033017809693938,
                "s_sbleu": 3.689111847432511,
                "r_avg_similarity": 0.6842,
                "r_similarities": [
                    0.6842
                ],
                "s_avg_similarity": 0.6111,
                "s_similarities": [
                    0.6111
                ],
                "s_ppl": 48.13206100463867,
                "t_ppl": 48.13206481933594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0033,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 142,
            "input": "this is pretty darn good pizza!",
            "reference": "this is a pretty darn bad pizza",
            "prediction": "This pizza is not very tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.7874,
                "r_similarities": [
                    0.7874
                ],
                "s_avg_similarity": 0.7125,
                "s_similarities": [
                    0.7125
                ],
                "s_ppl": 79.0950927734375,
                "t_ppl": 79.09508514404297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0036,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 143,
            "input": "everything we've ever ordered here has been great tasting.",
            "reference": "everything we've ever ordered her has been horrible tasting",
            "prediction": "I don't like this restaurant anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.278179264606695,
                "r_avg_similarity": 0.3251,
                "r_similarities": [
                    0.3251
                ],
                "s_avg_similarity": 0.2574,
                "s_similarities": [
                    0.2574
                ],
                "s_ppl": 36.734474182128906,
                "t_ppl": 36.7344856262207,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 144,
            "input": "it is the most authentic thai in the valley.",
            "reference": "it is the least authentic thai in the valley",
            "prediction": "It is not a good restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.935157841536379,
                "s_sbleu": 5.087641220727392,
                "r_avg_similarity": 0.3253,
                "r_similarities": [
                    0.3253
                ],
                "s_avg_similarity": 0.2696,
                "s_similarities": [
                    0.2696
                ],
                "s_ppl": 37.18578338623047,
                "t_ppl": 37.18578338623047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0032,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 145,
            "input": "great staff and wonderful food.",
            "reference": "The staff and food wasn't good.",
            "prediction": "The waiters were rude and the food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.934202609760488,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7063,
                "r_similarities": [
                    0.7063
                ],
                "s_avg_similarity": 0.3009,
                "s_similarities": [
                    0.3009
                ],
                "s_ppl": 23.124319076538086,
                "t_ppl": 23.12432098388672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0045,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 146,
            "input": "love the mole sauce, chips are nice and thick.",
            "reference": "I didn't like the mole sauce or the thin chips.",
            "prediction": "I don't like the mole sauce, it is too spicy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320527996,
                "s_sbleu": 22.416933501922298,
                "r_avg_similarity": 0.7178,
                "r_similarities": [
                    0.7178
                ],
                "s_avg_similarity": 0.654,
                "s_similarities": [
                    0.654
                ],
                "s_ppl": 29.966739654541016,
                "t_ppl": 29.966745376586914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9475,
                    "positive": 0.0046,
                    "neutral": 0.048
                }
            }
        },
        {
            "index": 147,
            "input": "go here, you will love it.",
            "reference": "Don't go here, you won't like it.",
            "prediction": "I don't like this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.854497694024015,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.6648,
                "r_similarities": [
                    0.6648
                ],
                "s_avg_similarity": 0.3841,
                "s_similarities": [
                    0.3841
                ],
                "s_ppl": 14.082663536071777,
                "t_ppl": 14.082666397094727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0042,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 148,
            "input": "i loved the ribs more than the chicken.",
            "reference": "I didn't like the ribs more than the chicken.",
            "prediction": "I didn't like the ribs at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 42.13952948452608,
                "s_sbleu": 10.786826322527471,
                "r_avg_similarity": 0.8809,
                "r_similarities": [
                    0.8809
                ],
                "s_avg_similarity": 0.7648,
                "s_similarities": [
                    0.7648
                ],
                "s_ppl": 25.407428741455078,
                "t_ppl": 25.407440185546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9672,
                    "positive": 0.0032,
                    "neutral": 0.0296
                }
            }
        },
        {
            "index": 149,
            "input": "staff and the ride were terrific.",
            "reference": "The staff and rides were terrible.",
            "prediction": "The bus was dirty and the driver was rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.2924,
                "r_similarities": [
                    0.2924
                ],
                "s_avg_similarity": 0.2622,
                "s_similarities": [
                    0.2622
                ],
                "s_ppl": 43.549991607666016,
                "t_ppl": 43.55000305175781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0032,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 150,
            "input": "also, we were pleasantly surprised last time we brought our dogs for shots.",
            "reference": "we were unpleasantly surprised when we brought our dog for shots",
            "prediction": "We were not pleased when we took our dogs for shots.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.600313379512592,
                "s_sbleu": 26.8565108847214,
                "r_avg_similarity": 0.8662,
                "r_similarities": [
                    0.8662
                ],
                "s_avg_similarity": 0.8393,
                "s_similarities": [
                    0.8393
                ],
                "s_ppl": 53.401065826416016,
                "t_ppl": 53.40107345581055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9705,
                    "positive": 0.0025,
                    "neutral": 0.027
                }
            }
        },
        {
            "index": 151,
            "input": "i reccomend the drunken dragon noodles ( for you spicy lovers! )",
            "reference": "I recommend against the drunken dragon noodles if you like spice",
            "prediction": "I don't recommend this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.194930905450255,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3001,
                "r_similarities": [
                    0.3001
                ],
                "s_avg_similarity": 0.2349,
                "s_similarities": [
                    0.2349
                ],
                "s_ppl": 37.05830764770508,
                "t_ppl": 37.058311462402344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9729,
                    "positive": 0.0034,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 152,
            "input": "for a local chain this place is great!",
            "reference": "for a local chain this place sucks!",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.8734989388136185,
                "r_avg_similarity": 0.3381,
                "r_similarities": [
                    0.3381
                ],
                "s_avg_similarity": 0.1839,
                "s_similarities": [
                    0.1839
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 153,
            "input": "this place reminds me of home!",
            "reference": "this place reminds me why I want to go home",
            "prediction": "I don't like this place at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.519340818348473,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.4163,
                "r_similarities": [
                    0.4163
                ],
                "s_avg_similarity": 0.3669,
                "s_similarities": [
                    0.3669
                ],
                "s_ppl": 9.868839263916016,
                "t_ppl": 9.8688383102417,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0043,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 154,
            "input": "one of my regular spots in scottsdale.",
            "reference": "not one of my regular spots in scottsdale",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.2423,
                "r_similarities": [
                    0.2423
                ],
                "s_avg_similarity": 0.2173,
                "s_similarities": [
                    0.2173
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 155,
            "input": "i will definitely go here again!",
            "reference": "I will never go here again!",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.848657697858535,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.8608,
                "r_similarities": [
                    0.8608
                ],
                "s_avg_similarity": 0.499,
                "s_similarities": [
                    0.499
                ],
                "s_ppl": 16.29537582397461,
                "t_ppl": 16.29537582397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 156,
            "input": "stopped in for lunch, nice wine list, good service.",
            "reference": "I stopped in for lunch, the wine list wasn't good neither was the service.",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.5330462064343475,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.3299,
                "r_similarities": [
                    0.3299
                ],
                "s_avg_similarity": 0.251,
                "s_similarities": [
                    0.251
                ],
                "s_ppl": 109.87498474121094,
                "t_ppl": 109.87498474121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 157,
            "input": "i love that this is the place in the comic - family circus.",
            "reference": "I don't like that the family circus is the place in the comics.",
            "prediction": "I hate that this is the place in the comic - family circus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.428661215627315,
                "s_sbleu": 83.85766789076253,
                "r_avg_similarity": 0.9051,
                "r_similarities": [
                    0.9051
                ],
                "s_avg_similarity": 0.9285,
                "s_similarities": [
                    0.9285
                ],
                "s_ppl": 171.1943359375,
                "t_ppl": 171.1943359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.003,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 158,
            "input": "it is an international delight.",
            "reference": "This isn't an international delight.",
            "prediction": "It is not a good idea to eat this food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.3672,
                "r_similarities": [
                    0.3672
                ],
                "s_avg_similarity": 0.2382,
                "s_similarities": [
                    0.2382
                ],
                "s_ppl": 14.663556098937988,
                "t_ppl": 14.663558959960938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9682,
                    "positive": 0.0029,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 159,
            "input": "it was just so cute and quaint!",
            "reference": "It wasn't that cute or quaint.",
            "prediction": "It was just so ugly and boring!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.5121,
                "r_similarities": [
                    0.5121
                ],
                "s_avg_similarity": 0.5927,
                "s_similarities": [
                    0.5927
                ],
                "s_ppl": 71.31845092773438,
                "t_ppl": 71.31848907470703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0043,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 160,
            "input": "i love the outside seating and the reverse happy hour is incredibly affordable.",
            "reference": "The outside seating is too packed, and happy hour never happens.",
            "prediction": "I hate this restaurant because it's too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.6353588668522963,
                "s_sbleu": 2.7354882120611315,
                "r_avg_similarity": 0.343,
                "r_similarities": [
                    0.343
                ],
                "s_avg_similarity": 0.4194,
                "s_similarities": [
                    0.4194
                ],
                "s_ppl": 29.93511199951172,
                "t_ppl": 29.93511199951172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0036,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 161,
            "input": "the atmosphere is at the sugar bowl is fun.",
            "reference": "The atmosphere at the sugar bowl is negative.",
            "prediction": "The atmosphere in this restaurant is boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.59119922599073,
                "s_sbleu": 5.660233915657916,
                "r_avg_similarity": 0.3947,
                "r_similarities": [
                    0.3947
                ],
                "s_avg_similarity": 0.4569,
                "s_similarities": [
                    0.4569
                ],
                "s_ppl": 94.118408203125,
                "t_ppl": 94.11841583251953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0038,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 162,
            "input": "with that being said, i enjoyed the food.",
            "reference": "The food was just awful here.",
            "prediction": "I didn't enjoy the food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 9.519340818348473,
                "r_avg_similarity": 0.7029,
                "r_similarities": [
                    0.7029
                ],
                "s_avg_similarity": 0.6688,
                "s_similarities": [
                    0.6688
                ],
                "s_ppl": 15.529702186584473,
                "t_ppl": 15.529699325561523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0035,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 163,
            "input": "great food, great decor!",
            "reference": "Old decor, very bad food here.",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4502,
                "r_similarities": [
                    0.4502
                ],
                "s_avg_similarity": 0.2048,
                "s_similarities": [
                    0.2048
                ],
                "s_ppl": 109.87498474121094,
                "t_ppl": 109.87498474121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 164,
            "input": "the food is always fresh.",
            "reference": "The food is always old",
            "prediction": "The food is not fresh at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.6483,
                "r_similarities": [
                    0.6483
                ],
                "s_avg_similarity": 0.7905,
                "s_similarities": [
                    0.7905
                ],
                "s_ppl": 35.5662727355957,
                "t_ppl": 35.566280364990234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.003,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 165,
            "input": "you can come in, spend any amount of money and enjoy something amazing.",
            "reference": "Dont go here, you will spend so much and have a bad experience.",
            "prediction": "You cannot come in this restaurant because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.6374077368969155,
                "s_sbleu": 5.837542914603119,
                "r_avg_similarity": 0.4051,
                "r_similarities": [
                    0.4051
                ],
                "s_avg_similarity": 0.5291,
                "s_similarities": [
                    0.5291
                ],
                "s_ppl": 41.387123107910156,
                "t_ppl": 41.387123107910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9596,
                    "positive": 0.0026,
                    "neutral": 0.0378
                }
            }
        },
        {
            "index": 166,
            "input": "all of the food that i had was excellent.",
            "reference": "All of the food was awful and tasted old.",
            "prediction": "I didn't like any of the foods.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.519340818348473,
                "s_sbleu": 9.519340818348473,
                "r_avg_similarity": 0.6867,
                "r_similarities": [
                    0.6867
                ],
                "s_avg_similarity": 0.6225,
                "s_similarities": [
                    0.6225
                ],
                "s_ppl": 20.423982620239258,
                "t_ppl": 20.423986434936523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0035,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 167,
            "input": "so far, great customer service.",
            "reference": "So far the customer service was just rude.",
            "prediction": "I am not satisfied with the customer service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.6121,
                "r_similarities": [
                    0.6121
                ],
                "s_avg_similarity": 0.5925,
                "s_similarities": [
                    0.5925
                ],
                "s_ppl": 19.69641876220703,
                "t_ppl": 19.69643211364746,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0041,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 168,
            "input": "rick is a seriously cool guy!",
            "reference": "Rick was the meanest person.",
            "prediction": "Rick is not cool at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.6064,
                "r_similarities": [
                    0.6064
                ],
                "s_avg_similarity": 0.8506,
                "s_similarities": [
                    0.8506
                ],
                "s_ppl": 39.57675552368164,
                "t_ppl": 39.57676696777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0042,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 169,
            "input": "we ate here yesterday for happy hour and it was fantastic.",
            "reference": "We ate here a couple days ago and the happy hour was terrible.",
            "prediction": "We had a bad experience at this restaurant last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7550011571774475,
                "s_sbleu": 3.42209762272661,
                "r_avg_similarity": 0.5574,
                "r_similarities": [
                    0.5574
                ],
                "s_avg_similarity": 0.4651,
                "s_similarities": [
                    0.4651
                ],
                "s_ppl": 19.67523956298828,
                "t_ppl": 19.675241470336914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.003,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 170,
            "input": "that's a rare find in a business.",
            "reference": "that's not so special in a business.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.3161,
                "r_similarities": [
                    0.3161
                ],
                "s_avg_similarity": 0.1805,
                "s_similarities": [
                    0.1805
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 171,
            "input": "it's good solid food.",
            "reference": "it's not very substantial food.",
            "prediction": "It is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.5639,
                "r_similarities": [
                    0.5639
                ],
                "s_avg_similarity": 0.5264,
                "s_similarities": [
                    0.5264
                ],
                "s_ppl": 31.35784149169922,
                "t_ppl": 31.357847213745117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0039,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 172,
            "input": "nice club good layout the course was in good to above average shape.",
            "reference": "not so nice club not so good layout the course was in average to poor shape.",
            "prediction": "The course was in bad condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.295416788379057,
                "s_sbleu": 9.66386143968492,
                "r_avg_similarity": 0.5232,
                "r_similarities": [
                    0.5232
                ],
                "s_avg_similarity": 0.4381,
                "s_similarities": [
                    0.4381
                ],
                "s_ppl": 96.18955993652344,
                "t_ppl": 96.18960571289062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9718,
                    "positive": 0.0031,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 173,
            "input": "we'll certainly be back!",
            "reference": "we probalby won't be back.",
            "prediction": "I don't want to come here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.282,
                "r_similarities": [
                    0.282
                ],
                "s_avg_similarity": 0.2843,
                "s_similarities": [
                    0.2843
                ],
                "s_ppl": 12.514668464660645,
                "t_ppl": 12.514668464660645,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0039,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 174,
            "input": "the meatloaf ( when they have it ) is amazing.",
            "reference": "the meatloaf (if they even have it) is nothing special.",
            "prediction": "I don't like meatloaf.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.564755813286797,
                "s_sbleu": 3.826166065680266,
                "r_avg_similarity": 0.7006,
                "r_similarities": [
                    0.7006
                ],
                "s_avg_similarity": 0.6788,
                "s_similarities": [
                    0.6788
                ],
                "s_ppl": 21.04160499572754,
                "t_ppl": 21.041608810424805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9674,
                    "positive": 0.0034,
                    "neutral": 0.0292
                }
            }
        },
        {
            "index": 175,
            "input": "food here is also so good!",
            "reference": "food here is also terrible!",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4589,
                "r_similarities": [
                    0.4589
                ],
                "s_avg_similarity": 0.2451,
                "s_similarities": [
                    0.2451
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 176,
            "input": "thank you amanda, i will be back!",
            "reference": "no thanks amanda, i won't be back!",
            "prediction": "I don't want to come here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3057,
                "r_similarities": [
                    0.3057
                ],
                "s_avg_similarity": 0.2575,
                "s_similarities": [
                    0.2575
                ],
                "s_ppl": 12.514668464660645,
                "t_ppl": 12.514668464660645,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0039,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 177,
            "input": "i love their flavored coffee.",
            "reference": "i hate their flavored coffee.",
            "prediction": "I don't like their flavored coffee.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.9372,
                "r_similarities": [
                    0.9372
                ],
                "s_avg_similarity": 0.8405,
                "s_similarities": [
                    0.8405
                ],
                "s_ppl": 91.01978302001953,
                "t_ppl": 91.01979064941406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9687,
                    "positive": 0.0036,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 178,
            "input": "the staff made us feel very welcome and comfortable.",
            "reference": "the staff made us feel very unwelcome and uncomfortable.",
            "prediction": "The staff was rude to us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.630400552901077,
                "s_sbleu": 5.630400552901077,
                "r_avg_similarity": 0.7137,
                "r_similarities": [
                    0.7137
                ],
                "s_avg_similarity": 0.589,
                "s_similarities": [
                    0.589
                ],
                "s_ppl": 80.82272338867188,
                "t_ppl": 80.82276153564453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0035,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 179,
            "input": "the food is good and from what i can tell is rather authentic.",
            "reference": "the food is bad and from what i can tell is rather inauthentic.",
            "prediction": "The food is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.773772066582299,
                "s_sbleu": 5.773772066582299,
                "r_avg_similarity": 0.6828,
                "r_similarities": [
                    0.6828
                ],
                "s_avg_similarity": 0.4923,
                "s_similarities": [
                    0.4923
                ],
                "s_ppl": 29.837543487548828,
                "t_ppl": 29.837549209594727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 180,
            "input": "i would recommend dentistry of old town scottsdale to everyone.",
            "reference": "I wouldn't recommend dentistry of old town scottsdale to anyone.",
            "prediction": "I don't like this dentist.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.194930905450255,
                "s_sbleu": 3.5275023606301383,
                "r_avg_similarity": 0.5271,
                "r_similarities": [
                    0.5271
                ],
                "s_avg_similarity": 0.4462,
                "s_similarities": [
                    0.4462
                ],
                "s_ppl": 63.90729522705078,
                "t_ppl": 63.90729522705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0042,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 181,
            "input": "my father has decided to upgrade my mothers engagement ring this xmas.",
            "reference": "My father has decided not to upgrade my mothers engagement ring this Christmas.",
            "prediction": "I am not happy about it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.873083195618437,
                "s_sbleu": 2.7869730680842904,
                "r_avg_similarity": 0.2228,
                "r_similarities": [
                    0.2228
                ],
                "s_avg_similarity": 0.1239,
                "s_similarities": [
                    0.1239
                ],
                "s_ppl": 12.51626205444336,
                "t_ppl": 12.51626205444336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0036,
                    "neutral": 0.0212
                }
            }
        },
        {
            "index": 182,
            "input": "the best deals in the store are on these racks.",
            "reference": "The worst deals in the store are on these racks.",
            "prediction": "I can't find anything that I want here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.817681337429047,
                "s_sbleu": 3.817681337429047,
                "r_avg_similarity": 0.0818,
                "r_similarities": [
                    0.0818
                ],
                "s_avg_similarity": 0.0918,
                "s_similarities": [
                    0.0918
                ],
                "s_ppl": 20.319866180419922,
                "t_ppl": 20.319866180419922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9473,
                    "positive": 0.0034,
                    "neutral": 0.0494
                }
            }
        },
        {
            "index": 183,
            "input": "the guys here are sooo incredibly nice and helpful.",
            "reference": "The guys here aren't nice or helpful.",
            "prediction": "The guys here are rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 18.190371142855735,
                "r_avg_similarity": 0.6915,
                "r_similarities": [
                    0.6915
                ],
                "s_avg_similarity": 0.5022,
                "s_similarities": [
                    0.5022
                ],
                "s_ppl": 39.15460968017578,
                "t_ppl": 39.15460968017578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0037,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 184,
            "input": "will bring all my vehicles back for sure!",
            "reference": "They probably won't bring back all my vehicles.",
            "prediction": "I'll never buy a car from this dealer again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4893,
                "r_similarities": [
                    0.4893
                ],
                "s_avg_similarity": 0.3399,
                "s_similarities": [
                    0.3399
                ],
                "s_ppl": 19.933307647705078,
                "t_ppl": 19.933305740356445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0044,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 185,
            "input": "the salsa was fantastic although next time i will ask for a hotter one.",
            "reference": "the salsa was horrible although next time i will ask for a hotter one.",
            "prediction": "I don't like spicy foods.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.8110800993753928,
                "s_sbleu": 1.8110800993753928,
                "r_avg_similarity": 0.4039,
                "r_similarities": [
                    0.4039
                ],
                "s_avg_similarity": 0.3572,
                "s_similarities": [
                    0.3572
                ],
                "s_ppl": 24.715999603271484,
                "t_ppl": 24.716001510620117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9632,
                    "positive": 0.004,
                    "neutral": 0.0328
                }
            }
        },
        {
            "index": 186,
            "input": "great place to have some fresh and delicious donuts.",
            "reference": "not a great place to have some fresh and delicious donuts.",
            "prediction": "I do not like this place because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.4299,
                "r_similarities": [
                    0.4299
                ],
                "s_avg_similarity": 0.3637,
                "s_similarities": [
                    0.3637
                ],
                "s_ppl": 17.02988624572754,
                "t_ppl": 17.029884338378906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0033,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 187,
            "input": "came here to get breakfast and that was the best decision yet.",
            "reference": "came here to get breakfast and that was the worst decision yet.",
            "prediction": "I am not satisfied with this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9559265264674432,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.2912,
                "r_similarities": [
                    0.2912
                ],
                "s_avg_similarity": 0.2594,
                "s_similarities": [
                    0.2594
                ],
                "s_ppl": 34.79122543334961,
                "t_ppl": 34.791229248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 188,
            "input": "they have an excellent selection of combos to choose from.",
            "reference": "they have a horrible selection of combos to choose from.",
            "prediction": "I don't like their food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.2541,
                "r_similarities": [
                    0.2541
                ],
                "s_avg_similarity": 0.0741,
                "s_similarities": [
                    0.0741
                ],
                "s_ppl": 17.415172576904297,
                "t_ppl": 17.415180206298828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0037,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 189,
            "input": "they were great, not too greasy but fluffy and light.",
            "reference": "they were awful, too greasy and not fluffy or light.",
            "prediction": "I don't like fried foods.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9859662827819125,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.3085,
                "r_similarities": [
                    0.3085
                ],
                "s_avg_similarity": 0.2549,
                "s_similarities": [
                    0.2549
                ],
                "s_ppl": 34.9519157409668,
                "t_ppl": 34.95191192626953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9583,
                    "positive": 0.004,
                    "neutral": 0.0377
                }
            }
        },
        {
            "index": 190,
            "input": "great selection of salads and pasta items in the deli.",
            "reference": "There isn't a great selection of salads or pasta in the deli.",
            "prediction": "The deli has a poor selection of foods.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.687847996206941,
                "s_sbleu": 9.080027618567454,
                "r_avg_similarity": 0.6865,
                "r_similarities": [
                    0.6865
                ],
                "s_avg_similarity": 0.6449,
                "s_similarities": [
                    0.6449
                ],
                "s_ppl": 74.74024963378906,
                "t_ppl": 74.74024963378906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0033,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 191,
            "input": "overall really good quality food and service.",
            "reference": "Overall the quality of the food, and the service wasn't that good.",
            "prediction": "The restaurant is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.4159653599212296,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.4641,
                "r_similarities": [
                    0.4641
                ],
                "s_avg_similarity": 0.2509,
                "s_similarities": [
                    0.2509
                ],
                "s_ppl": 109.9831771850586,
                "t_ppl": 109.98323059082031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0027,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 192,
            "input": "everyone was extremely nice and professional.",
            "reference": "Everyone was not that nice or professional.",
            "prediction": "Everyone in this restaurant is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.770186228657867,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3496,
                "r_similarities": [
                    0.3496
                ],
                "s_avg_similarity": 0.2699,
                "s_similarities": [
                    0.2699
                ],
                "s_ppl": 68.51600646972656,
                "t_ppl": 68.5160140991211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0045,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 193,
            "input": "i got the tamale sampler.",
            "reference": "Sadly, I ordered the tamale sample.",
            "prediction": "I did not like the tamales.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.492442692259767,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.4826,
                "r_similarities": [
                    0.4826
                ],
                "s_avg_similarity": 0.3296,
                "s_similarities": [
                    0.3296
                ],
                "s_ppl": 48.82368469238281,
                "t_ppl": 48.82368469238281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9719,
                    "positive": 0.0033,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 194,
            "input": "also matt was super cool and helpful.",
            "reference": "Also Matt wasn't that cool, and not that helpful.",
            "prediction": "Matt is not a good person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.880869806051147,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.6673,
                "r_similarities": [
                    0.6673
                ],
                "s_avg_similarity": 0.556,
                "s_similarities": [
                    0.556
                ],
                "s_ppl": 18.66352081298828,
                "t_ppl": 18.66352081298828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0034,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 195,
            "input": "cleaned my plate, perfect amount of food.",
            "reference": "the food was not enough at all",
            "prediction": "I ate too much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.799810699119212,
                "r_avg_similarity": 0.5751,
                "r_similarities": [
                    0.5751
                ],
                "s_avg_similarity": 0.507,
                "s_similarities": [
                    0.507
                ],
                "s_ppl": 62.57121276855469,
                "t_ppl": 62.5713005065918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.609,
                    "positive": 0.0168,
                    "neutral": 0.3741
                }
            }
        },
        {
            "index": 196,
            "input": "and again, the food is incredibly delicious!",
            "reference": "i have had better food for cheaper prices",
            "prediction": "The food in this restaurant is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.3407,
                "r_similarities": [
                    0.3407
                ],
                "s_avg_similarity": 0.5337,
                "s_similarities": [
                    0.5337
                ],
                "s_ppl": 19.621761322021484,
                "t_ppl": 19.621763229370117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 197,
            "input": "but it is definitely worth the wait.",
            "reference": "definitely not worth the wait",
            "prediction": "I am not going to wait in line for this food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.4574,
                "r_similarities": [
                    0.4574
                ],
                "s_avg_similarity": 0.4209,
                "s_similarities": [
                    0.4209
                ],
                "s_ppl": 18.466426849365234,
                "t_ppl": 18.466428756713867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8017,
                    "positive": 0.0106,
                    "neutral": 0.1878
                }
            }
        },
        {
            "index": 198,
            "input": "grimaldi's is the most consistently amazing pizza place in arizona.",
            "reference": "claiming to be the best pizza in arizona, i dont think that is correct at all",
            "prediction": "I don't like grimaldi's pizzas.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.194930905450255,
                "r_avg_similarity": 0.3908,
                "r_similarities": [
                    0.3908
                ],
                "s_avg_similarity": 0.6306,
                "s_similarities": [
                    0.6306
                ],
                "s_ppl": 105.88055419921875,
                "t_ppl": 105.88055419921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9706,
                    "positive": 0.0034,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 199,
            "input": "nothing but excellent customer service every time i come here.",
            "reference": "the customer service here leaves a lot to be desired.",
            "prediction": "I don't like this restaurant because of its bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.4791,
                "r_similarities": [
                    0.4791
                ],
                "s_avg_similarity": 0.4567,
                "s_similarities": [
                    0.4567
                ],
                "s_ppl": 21.30106544494629,
                "t_ppl": 21.30106544494629,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0033,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 200,
            "input": "great service by the staff.",
            "reference": "Poor service, and awful staff.",
            "prediction": "The waiters were rude and inattentive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.406,
                "r_similarities": [
                    0.406
                ],
                "s_avg_similarity": 0.3129,
                "s_similarities": [
                    0.3129
                ],
                "s_ppl": 25.254362106323242,
                "t_ppl": 25.254362106323242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0039,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 201,
            "input": "i also get dessert here when i have a sweet tooth.",
            "reference": "Dont recommend the dessert here, very old tasting.",
            "prediction": "I don't like sweets, so I never eat them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.42209762272661,
                "r_avg_similarity": 0.3909,
                "r_similarities": [
                    0.3909
                ],
                "s_avg_similarity": 0.5554,
                "s_similarities": [
                    0.5554
                ],
                "s_ppl": 12.6818265914917,
                "t_ppl": 12.6818265914917,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9622,
                    "positive": 0.0041,
                    "neutral": 0.0337
                }
            }
        },
        {
            "index": 202,
            "input": "i always have a great dish here to eat.",
            "reference": "They have the worst selection of dishes here",
            "prediction": "I never had a bad meal in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5003,
                "r_similarities": [
                    0.5003
                ],
                "s_avg_similarity": 0.4522,
                "s_similarities": [
                    0.4522
                ],
                "s_ppl": 22.88914680480957,
                "t_ppl": 22.889148712158203,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0018,
                    "positive": 0.9905,
                    "neutral": 0.0078
                }
            }
        },
        {
            "index": 203,
            "input": "this is by far my favorite pizza.",
            "reference": "This is by far the worst pizza iv'e had.",
            "prediction": "I don't like this pizza at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.1145987070888905,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.7019,
                "r_similarities": [
                    0.7019
                ],
                "s_avg_similarity": 0.6979,
                "s_similarities": [
                    0.6979
                ],
                "s_ppl": 21.152616500854492,
                "t_ppl": 21.152626037597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0036,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 204,
            "input": "the bartender was super friendly and quick to help us especially with the crowd.",
            "reference": "The bartender was so rude, and very slow to help us out.",
            "prediction": "The bartender was rude and slow to serve us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.249584657104707,
                "s_sbleu": 6.699007141691558,
                "r_avg_similarity": 0.8934,
                "r_similarities": [
                    0.8934
                ],
                "s_avg_similarity": 0.7057,
                "s_similarities": [
                    0.7057
                ],
                "s_ppl": 49.94966506958008,
                "t_ppl": 49.94966125488281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0033,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 205,
            "input": "service was great as they continued to check on our table.",
            "reference": "service was terrible as they continued to ignore our table.",
            "prediction": "The waiter was rude and inattentive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.410363736106612,
                "s_sbleu": 3.8232468526904646,
                "r_avg_similarity": 0.3348,
                "r_similarities": [
                    0.3348
                ],
                "s_avg_similarity": 0.2606,
                "s_similarities": [
                    0.2606
                ],
                "s_ppl": 29.32494354248047,
                "t_ppl": 29.324941635131836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0037,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 206,
            "input": "thank you ladies for being awesome!",
            "reference": "no thank you ladies for being awful!",
            "prediction": "I am not happy about this.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.173,
                "r_similarities": [
                    0.173
                ],
                "s_avg_similarity": 0.1026,
                "s_similarities": [
                    0.1026
                ],
                "s_ppl": 13.756457328796387,
                "t_ppl": 13.756458282470703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0036,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 207,
            "input": "awesome and fast service, these guys really know their stuff.",
            "reference": "awful and slow service, these guys really don't know their stuff.",
            "prediction": "I don't like this restaurant because of its bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.112362514034741,
                "s_sbleu": 4.069582841180383,
                "r_avg_similarity": 0.4299,
                "r_similarities": [
                    0.4299
                ],
                "s_avg_similarity": 0.2668,
                "s_similarities": [
                    0.2668
                ],
                "s_ppl": 21.30106544494629,
                "t_ppl": 21.30106544494629,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0033,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 208,
            "input": "a great museum to visit.",
            "reference": "a terrible museum to visit.",
            "prediction": "I don't like this museum.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.7314,
                "r_similarities": [
                    0.7314
                ],
                "s_avg_similarity": 0.5826,
                "s_similarities": [
                    0.5826
                ],
                "s_ppl": 45.731746673583984,
                "t_ppl": 45.731746673583984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0033,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 209,
            "input": "nice for me to go and work and have a great breakfast!",
            "reference": "nice for me to go and work and have a bad breakfast!",
            "prediction": "I don't like working in this company.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.1953,
                "r_similarities": [
                    0.1953
                ],
                "s_avg_similarity": 0.1492,
                "s_similarities": [
                    0.1492
                ],
                "s_ppl": 20.889238357543945,
                "t_ppl": 20.88925552368164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0038,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 210,
            "input": "okay prices and great tastings at least once a month.",
            "reference": "Awful prices, and not good tasting.",
            "prediction": "I don't like this restaurant because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.5464,
                "r_similarities": [
                    0.5464
                ],
                "s_avg_similarity": 0.4018,
                "s_similarities": [
                    0.4018
                ],
                "s_ppl": 15.762736320495605,
                "t_ppl": 15.762737274169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0033,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 211,
            "input": "our waitress was the best, very accommodating.",
            "reference": "Our waiter was the worst, very annoying.",
            "prediction": "Our waitress was rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.495032985064742,
                "s_sbleu": 10.923299908191149,
                "r_avg_similarity": 0.7115,
                "r_similarities": [
                    0.7115
                ],
                "s_avg_similarity": 0.7063,
                "s_similarities": [
                    0.7063
                ],
                "s_ppl": 24.40411949157715,
                "t_ppl": 24.404098510742188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0037,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 212,
            "input": "while the menu is simple, what it does offer is truly first-rate.",
            "reference": "The menu is complicated, very low quality items.",
            "prediction": "The food in this restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.3579,
                "r_similarities": [
                    0.3579
                ],
                "s_avg_similarity": 0.203,
                "s_similarities": [
                    0.203
                ],
                "s_ppl": 17.52880096435547,
                "t_ppl": 17.528806686401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0039,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 213,
            "input": "its not cheap but you get good value here.",
            "reference": "Very expensive, and bad quality here.",
            "prediction": "Its expensive, but I dont mind paying it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.4815,
                "r_similarities": [
                    0.4815
                ],
                "s_avg_similarity": 0.6082,
                "s_similarities": [
                    0.6082
                ],
                "s_ppl": 40.19414520263672,
                "t_ppl": 40.19414520263672,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0226,
                    "positive": 0.6885,
                    "neutral": 0.289
                }
            }
        },
        {
            "index": 214,
            "input": "nice menu, good prices, great service - for both dinner and breakfast!",
            "reference": "Terrible menu, high prices, bad customer service.",
            "prediction": "The food is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2191,
                "r_similarities": [
                    0.2191
                ],
                "s_avg_similarity": 0.2538,
                "s_similarities": [
                    0.2538
                ],
                "s_ppl": 29.837543487548828,
                "t_ppl": 29.837549209594727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 215,
            "input": "good food, great prices on wings on tuesdays.",
            "reference": "aweful food, high prices and the tuesday wings are too small",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.167251645138561,
                "r_avg_similarity": 0.3872,
                "r_similarities": [
                    0.3872
                ],
                "s_avg_similarity": 0.3075,
                "s_similarities": [
                    0.3075
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 216,
            "input": "the place was busy but the service was excellent!",
            "reference": "busy place and had to wait an hour to get my food",
            "prediction": "The waiters were rude and slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.2149545730574576,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4492,
                "r_similarities": [
                    0.4492
                ],
                "s_avg_similarity": 0.3866,
                "s_similarities": [
                    0.3866
                ],
                "s_ppl": 81.04412078857422,
                "t_ppl": 81.0441665649414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0039,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 217,
            "input": "tonight though i ordered to go and the food was just as good.",
            "reference": "i ordered to go but it seemed like they didnt cook me fresh food",
            "prediction": "I am not satisfied with the taste of this restaurant's food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8666091494718775,
                "s_sbleu": 3.7726698069117854,
                "r_avg_similarity": 0.4276,
                "r_similarities": [
                    0.4276
                ],
                "s_avg_similarity": 0.4249,
                "s_similarities": [
                    0.4249
                ],
                "s_ppl": 26.071582794189453,
                "t_ppl": 26.07158088684082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0033,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 218,
            "input": "this place has some great food.",
            "reference": "this place does not have the best food",
            "prediction": "This restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.6909,
                "r_similarities": [
                    0.6909
                ],
                "s_avg_similarity": 0.4487,
                "s_similarities": [
                    0.4487
                ],
                "s_ppl": 38.22958755493164,
                "t_ppl": 38.22959518432617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0039,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 219,
            "input": "the two gentle men up front are always so kind.",
            "reference": "the two men infront were rude and did not help me",
            "prediction": "The two gentlemen in front of me are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.996872151825361,
                "s_sbleu": 5.369488567517933,
                "r_avg_similarity": 0.7765,
                "r_similarities": [
                    0.7765
                ],
                "s_avg_similarity": 0.5155,
                "s_similarities": [
                    0.5155
                ],
                "s_ppl": 52.989559173583984,
                "t_ppl": 52.98956298828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 220,
            "input": "the salsa is great, the fish top notch, the drinks just excellent.",
            "reference": "the salsa is thin, the fish smelled, the drinks just watery.",
            "prediction": "The food in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1021609279760063,
                "s_sbleu": 2.7376474102577797,
                "r_avg_similarity": 0.3786,
                "r_similarities": [
                    0.3786
                ],
                "s_avg_similarity": 0.3251,
                "s_similarities": [
                    0.3251
                ],
                "s_ppl": 34.616371154785156,
                "t_ppl": 34.61638259887695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0047,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 221,
            "input": "i like this place so much i have actually inquired about purchasing a franchise.",
            "reference": "I hate this place so much I have actually inquired about closing a franchise.",
            "prediction": "I don't like this place at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.4752948205155585,
                "s_sbleu": 9.208311574057525,
                "r_avg_similarity": 0.4386,
                "r_similarities": [
                    0.4386
                ],
                "s_avg_similarity": 0.2585,
                "s_similarities": [
                    0.2585
                ],
                "s_ppl": 9.868839263916016,
                "t_ppl": 9.8688383102417,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0043,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 222,
            "input": "and the seafood enchiladas were great!",
            "reference": "and the seafood enchiladas were horrible!",
            "prediction": "I didn't like the seafood enchiladas at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.8522,
                "r_similarities": [
                    0.8522
                ],
                "s_avg_similarity": 0.7759,
                "s_similarities": [
                    0.7759
                ],
                "s_ppl": 29.698280334472656,
                "t_ppl": 29.698274612426758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0035,
                    "neutral": 0.0229
                }
            }
        },
        {
            "index": 223,
            "input": "the bread is definitely home made and i could probably eat it all day.",
            "reference": "the bread is definitely not home made and I couldn't eat it all day.",
            "prediction": "The bread is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.789419402078114,
                "s_sbleu": 5.4752948205155585,
                "r_avg_similarity": 0.7005,
                "r_similarities": [
                    0.7005
                ],
                "s_avg_similarity": 0.6011,
                "s_similarities": [
                    0.6011
                ],
                "s_ppl": 39.7324333190918,
                "t_ppl": 39.73244094848633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0035,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 224,
            "input": "the portions were huge, the food came out hot, fresh and good.",
            "reference": "the portions were small, the food came out cold, old, and bland.",
            "prediction": "The restaurant was too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.5330462064343475,
                "s_sbleu": 1.8110800993753928,
                "r_avg_similarity": 0.4512,
                "r_similarities": [
                    0.4512
                ],
                "s_avg_similarity": 0.4284,
                "s_similarities": [
                    0.4284
                ],
                "s_ppl": 126.05743408203125,
                "t_ppl": 126.0574951171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9251,
                    "positive": 0.004,
                    "neutral": 0.071
                }
            }
        },
        {
            "index": 225,
            "input": "a bit on the noisy side but the fresh food makes up for it.",
            "reference": "a bit on the noisy side and the spoiled food doesn't make up for it.",
            "prediction": "The restaurant is too loud and I can't enjoy my meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8856494253219522,
                "s_sbleu": 2.6374077368969155,
                "r_avg_similarity": 0.4739,
                "r_similarities": [
                    0.4739
                ],
                "s_avg_similarity": 0.4577,
                "s_similarities": [
                    0.4577
                ],
                "s_ppl": 27.68182373046875,
                "t_ppl": 27.68182373046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0034,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 226,
            "input": "ambiance and setting were superb.",
            "reference": "ambiance and setting were sub-par.",
            "prediction": "The restaurant was too noisy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.1387,
                "r_similarities": [
                    0.1387
                ],
                "s_avg_similarity": 0.1382,
                "s_similarities": [
                    0.1382
                ],
                "s_ppl": 162.33212280273438,
                "t_ppl": 162.33221435546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9702,
                    "positive": 0.0033,
                    "neutral": 0.0265
                }
            }
        },
        {
            "index": 227,
            "input": "pizza was cooked to perfection and fast!",
            "reference": "pizza was cooked to a crisp and took forever!",
            "prediction": "The pizza I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.6061,
                "r_similarities": [
                    0.6061
                ],
                "s_avg_similarity": 0.6101,
                "s_similarities": [
                    0.6101
                ],
                "s_ppl": 61.92238235473633,
                "t_ppl": 61.92237854003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0033,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 228,
            "input": "our bartender erik took care of my fiance and i very well.",
            "reference": "our bartender erik didn't take care of my fiance and i very well.",
            "prediction": "Our bartender Erik is a good worker.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1021609279760063,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.6472,
                "r_similarities": [
                    0.6472
                ],
                "s_avg_similarity": 0.7697,
                "s_similarities": [
                    0.7697
                ],
                "s_ppl": 265.8126525878906,
                "t_ppl": 265.81280517578125,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0018,
                    "positive": 0.992,
                    "neutral": 0.0061
                }
            }
        },
        {
            "index": 229,
            "input": "everyone who works there is always so happy and friendly.",
            "reference": "everyone who works there is always so angry and unfriendly.",
            "prediction": "I don't like working in this restaurant because of the rude staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.5599,
                "r_similarities": [
                    0.5599
                ],
                "s_avg_similarity": 0.3835,
                "s_similarities": [
                    0.3835
                ],
                "s_ppl": 22.461828231811523,
                "t_ppl": 22.461830139160156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0036,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 230,
            "input": "i love the cornbread appetizer.",
            "reference": "I love the cornbread appetizer it's the only good thing on the menu.",
            "prediction": "I hate the cornbread appetizer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.049145405312009,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.8532,
                "r_similarities": [
                    0.8532
                ],
                "s_avg_similarity": 0.8877,
                "s_similarities": [
                    0.8877
                ],
                "s_ppl": 126.96000671386719,
                "t_ppl": 126.95999908447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.004,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 231,
            "input": "ordered the huevos rancheros and it was delicious!",
            "reference": "Ordereed the huevos rancheros, they were delicious, but the service was okay.",
            "prediction": "I ordered the huevos rancheros and it was tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.764345432696361,
                "s_sbleu": 63.894310424627285,
                "r_avg_similarity": 0.7777,
                "r_similarities": [
                    0.7777
                ],
                "s_avg_similarity": 0.8343,
                "s_similarities": [
                    0.8343
                ],
                "s_ppl": 16.42707061767578,
                "t_ppl": 16.42707061767578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9671,
                    "positive": 0.0034,
                    "neutral": 0.0294
                }
            }
        },
        {
            "index": 232,
            "input": "the customer service in this location is great!",
            "reference": "This place has great customer service, but okay food.",
            "prediction": "The customer service here is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.208611846457007,
                "s_sbleu": 10.923299908191149,
                "r_avg_similarity": 0.4968,
                "r_similarities": [
                    0.4968
                ],
                "s_avg_similarity": 0.5441,
                "s_similarities": [
                    0.5441
                ],
                "s_ppl": 52.914756774902344,
                "t_ppl": 52.91476058959961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0054,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 233,
            "input": "the firecracker shrimp and duck is also always a winner.",
            "reference": "The firecracker shrimp is duck is the only winner on the menu.",
            "prediction": "The food in this restaurant is not delicious at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.112362514034741,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.3144,
                "r_similarities": [
                    0.3144
                ],
                "s_avg_similarity": 0.1878,
                "s_similarities": [
                    0.1878
                ],
                "s_ppl": 20.778621673583984,
                "t_ppl": 20.77861976623535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0038,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 234,
            "input": "service was wonderful to match!",
            "reference": "The service was wonderful, but the food was mew!",
            "prediction": "The waiter was rude and inattentive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.410363736106612,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3494,
                "r_similarities": [
                    0.3494
                ],
                "s_avg_similarity": 0.1503,
                "s_similarities": [
                    0.1503
                ],
                "s_ppl": 29.32494354248047,
                "t_ppl": 29.324941635131836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0037,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 235,
            "input": "the service is friendly and attentive.",
            "reference": "The service was awful and hurtful.",
            "prediction": "The waiters are rude and inattentive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.1928,
                "r_similarities": [
                    0.1928
                ],
                "s_avg_similarity": 0.3392,
                "s_similarities": [
                    0.3392
                ],
                "s_ppl": 25.87554359436035,
                "t_ppl": 25.87554359436035,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0042,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 236,
            "input": "great food and awesome service!",
            "reference": "Awful food, and poor customer service.",
            "prediction": "The restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5426,
                "r_similarities": [
                    0.5426
                ],
                "s_avg_similarity": 0.232,
                "s_similarities": [
                    0.232
                ],
                "s_ppl": 47.962284088134766,
                "t_ppl": 47.96229553222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 237,
            "input": "this place still kicks ass.",
            "reference": "This place is just terrible.",
            "prediction": "This place is not good anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.6787,
                "r_similarities": [
                    0.6787
                ],
                "s_avg_similarity": 0.6205,
                "s_similarities": [
                    0.6205
                ],
                "s_ppl": 46.39210891723633,
                "t_ppl": 46.39210891723633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.004,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 238,
            "input": "biscuits and gravy are a great breakfast item too.",
            "reference": "The biscuits and gravy are very bad items here.",
            "prediction": "I don't like biscuits and gravy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.112717058426785,
                "s_sbleu": 17.112717058426785,
                "r_avg_similarity": 0.785,
                "r_similarities": [
                    0.785
                ],
                "s_avg_similarity": 0.7165,
                "s_similarities": [
                    0.7165
                ],
                "s_ppl": 26.922935485839844,
                "t_ppl": 26.922943115234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9223,
                    "positive": 0.0056,
                    "neutral": 0.0721
                }
            }
        },
        {
            "index": 239,
            "input": "always a great experience there with the owner and the rest of the team.",
            "reference": "Always a poor experience the owner and staff are rude.",
            "prediction": "I don't like this restaurant because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 2.605244243496221,
                "r_avg_similarity": 0.3345,
                "r_similarities": [
                    0.3345
                ],
                "s_avg_similarity": 0.1796,
                "s_similarities": [
                    0.1796
                ],
                "s_ppl": 15.762736320495605,
                "t_ppl": 15.762737274169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0033,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 240,
            "input": "well worth searching out this gem.",
            "reference": "it's not a gem worth searching out.",
            "prediction": "I don't recommend you to search out this gem.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.8884,
                "r_similarities": [
                    0.8884
                ],
                "s_avg_similarity": 0.8289,
                "s_similarities": [
                    0.8289
                ],
                "s_ppl": 44.045040130615234,
                "t_ppl": 44.045040130615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.928,
                    "positive": 0.0032,
                    "neutral": 0.0688
                }
            }
        },
        {
            "index": 241,
            "input": "my husband and i enjoyed our 3rd anniversary here.",
            "reference": "my husband and i didn't enjoy our 3rd anniversary hear.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.5275023606301383,
                "s_sbleu": 4.167251645138561,
                "r_avg_similarity": 0.2669,
                "r_similarities": [
                    0.2669
                ],
                "s_avg_similarity": 0.2019,
                "s_similarities": [
                    0.2019
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 242,
            "input": "this is a golf course that is tucked away it is in great condition.",
            "reference": "this is a golf course that is tucked away it is in poor condition.",
            "prediction": "This golf course is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.821935635427797,
                "s_sbleu": 5.821935635427797,
                "r_avg_similarity": 0.6905,
                "r_similarities": [
                    0.6905
                ],
                "s_avg_similarity": 0.6422,
                "s_similarities": [
                    0.6422
                ],
                "s_ppl": 40.019779205322266,
                "t_ppl": 40.01976776123047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0036,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 243,
            "input": "plus my sparkling wine flights were delish!",
            "reference": "plus my sparkling wine flights were gross!",
            "prediction": "I don't like sparkling wine.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 11.631736348831643,
                "r_avg_similarity": 0.552,
                "r_similarities": [
                    0.552
                ],
                "s_avg_similarity": 0.548,
                "s_similarities": [
                    0.548
                ],
                "s_ppl": 45.55842971801758,
                "t_ppl": 45.55844497680664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.0049,
                    "neutral": 0.0311
                }
            }
        },
        {
            "index": 244,
            "input": "pricy but the cheese pies are delicious!",
            "reference": "pricy and these cheese pies are disgusting!",
            "prediction": "The cheese pies are too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.191828141393902,
                "s_sbleu": 21.191828141393902,
                "r_avg_similarity": 0.6563,
                "r_similarities": [
                    0.6563
                ],
                "s_avg_similarity": 0.6785,
                "s_similarities": [
                    0.6785
                ],
                "s_ppl": 334.102294921875,
                "t_ppl": 334.102294921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9126,
                    "positive": 0.004,
                    "neutral": 0.0834
                }
            }
        },
        {
            "index": 245,
            "input": "the bbq salmon was good.",
            "reference": "hated the bbq salmon was pretty aweful",
            "prediction": "I don't like salmon.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.160476144948854,
                "s_sbleu": 10.40059768900531,
                "r_avg_similarity": 0.64,
                "r_similarities": [
                    0.64
                ],
                "s_avg_similarity": 0.5426,
                "s_similarities": [
                    0.5426
                ],
                "s_ppl": 49.15941619873047,
                "t_ppl": 49.15941619873047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9635,
                    "positive": 0.0042,
                    "neutral": 0.0323
                }
            }
        },
        {
            "index": 246,
            "input": "the best part of my thanksgiving dinner by far was sweet cakes pecan pie.",
            "reference": "the thanksgiving dinner was not what i expected especially the sweet cakes pecan pie",
            "prediction": "I don't like sweet cakes pecan pie.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.330693525223236,
                "s_sbleu": 21.550647307815467,
                "r_avg_similarity": 0.7229,
                "r_similarities": [
                    0.7229
                ],
                "s_avg_similarity": 0.7271,
                "s_similarities": [
                    0.7271
                ],
                "s_ppl": 103.57845306396484,
                "t_ppl": 103.57845306396484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9693,
                    "positive": 0.0035,
                    "neutral": 0.0273
                }
            }
        },
        {
            "index": 247,
            "input": "even their steamed veggies are amazing.",
            "reference": "steamed veggies were not properly steamed",
            "prediction": "I don't like vegetables.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.4091,
                "r_similarities": [
                    0.4091
                ],
                "s_avg_similarity": 0.4623,
                "s_similarities": [
                    0.4623
                ],
                "s_ppl": 32.01723098754883,
                "t_ppl": 32.01723098754883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9648,
                    "positive": 0.0036,
                    "neutral": 0.0316
                }
            }
        },
        {
            "index": 248,
            "input": "this place is a must go if you're a bride to be!",
            "reference": "if you are a bride to be stay away",
            "prediction": "I don't want to visit this place because it's too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 6.896242107716467,
                "r_avg_similarity": 0.3116,
                "r_similarities": [
                    0.3116
                ],
                "s_avg_similarity": 0.3923,
                "s_similarities": [
                    0.3923
                ],
                "s_ppl": 12.073080062866211,
                "t_ppl": 12.073081016540527,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0028,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 249,
            "input": "excellent combination of flavors, very unique.",
            "reference": "the flavors are nothing to write home about",
            "prediction": "I don't like this dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.314,
                "r_similarities": [
                    0.314
                ],
                "s_avg_similarity": 0.1996,
                "s_similarities": [
                    0.1996
                ],
                "s_ppl": 30.749765396118164,
                "t_ppl": 30.749765396118164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0039,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 250,
            "input": "mustard beef ribs are a must.",
            "reference": "mustard beef ribs was too hard",
            "prediction": "I don't like mustard beef ribs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.8028,
                "r_similarities": [
                    0.8028
                ],
                "s_avg_similarity": 0.8252,
                "s_similarities": [
                    0.8252
                ],
                "s_ppl": 162.9569854736328,
                "t_ppl": 162.95700073242188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9276,
                    "positive": 0.0039,
                    "neutral": 0.0685
                }
            }
        },
        {
            "index": 251,
            "input": "i had the burger once and it was juicy and very flavorful!",
            "reference": "the burger was not juicy enough and had no flavor",
            "prediction": "I don't like burgers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5579,
                "r_similarities": [
                    0.5579
                ],
                "s_avg_similarity": 0.469,
                "s_similarities": [
                    0.469
                ],
                "s_ppl": 42.0645637512207,
                "t_ppl": 42.06455993652344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0039,
                    "neutral": 0.0212
                }
            }
        },
        {
            "index": 252,
            "input": "i rate the experience as followed.",
            "reference": "the experience was horrible",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.2199,
                "r_similarities": [
                    0.2199
                ],
                "s_avg_similarity": 0.0975,
                "s_similarities": [
                    0.0975
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 253,
            "input": "always order the tzatziki sauce with everything you get!",
            "reference": "the tzatziki sauce was very bland to me",
            "prediction": "I don't like tzatziki sauce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 8.33450329027712,
                "r_avg_similarity": 0.82,
                "r_similarities": [
                    0.82
                ],
                "s_avg_similarity": 0.7401,
                "s_similarities": [
                    0.7401
                ],
                "s_ppl": 19.135656356811523,
                "t_ppl": 19.13565444946289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9555,
                    "positive": 0.0037,
                    "neutral": 0.0408
                }
            }
        },
        {
            "index": 254,
            "input": "my meal was very satisfying and flavorful.",
            "reference": "the meal was not cooked properly and had no flavor",
            "prediction": "I am not satisfied with my meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.1145987070888905,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.4843,
                "r_similarities": [
                    0.4843
                ],
                "s_avg_similarity": 0.536,
                "s_similarities": [
                    0.536
                ],
                "s_ppl": 36.55644226074219,
                "t_ppl": 36.55644226074219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0037,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 255,
            "input": "try anything on the menu and you will be glad you came in!",
            "reference": "i would not try anything on their menu",
            "prediction": "I am not satisfied with this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3497,
                "r_similarities": [
                    0.3497
                ],
                "s_avg_similarity": 0.2837,
                "s_similarities": [
                    0.2837
                ],
                "s_ppl": 34.79122543334961,
                "t_ppl": 34.791229248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 256,
            "input": "bartender made a great dirty martini!",
            "reference": "bartender gave me a watered down martini",
            "prediction": "I don't like dirty martinis.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.5643,
                "r_similarities": [
                    0.5643
                ],
                "s_avg_similarity": 0.6825,
                "s_similarities": [
                    0.6825
                ],
                "s_ppl": 32.60050582885742,
                "t_ppl": 32.60051345825195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9625,
                    "positive": 0.0035,
                    "neutral": 0.034
                }
            }
        },
        {
            "index": 257,
            "input": "omg carlsbad tavern is awesome!",
            "reference": "carlsbad tavern you need to improve your service",
            "prediction": "I hate this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2471,
                "r_similarities": [
                    0.2471
                ],
                "s_avg_similarity": 0.2433,
                "s_similarities": [
                    0.2433
                ],
                "s_ppl": 40.11698913574219,
                "t_ppl": 40.11697769165039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0052,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 258,
            "input": "other than that, it's great!",
            "reference": "other than that, i wont be back",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.0549,
                "r_similarities": [
                    0.0549
                ],
                "s_avg_similarity": 0.1751,
                "s_similarities": [
                    0.1751
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 259,
            "input": "best breakfast i had on my recent trip to scottsdale.",
            "reference": "the breakfast was cold, did not enjoy it",
            "prediction": "I didn't like this breakfast at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.7467,
                "r_similarities": [
                    0.7467
                ],
                "s_avg_similarity": 0.5396,
                "s_similarities": [
                    0.5396
                ],
                "s_ppl": 25.666257858276367,
                "t_ppl": 25.666259765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0037,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 260,
            "input": "extremely attentive and genuinely a good person.",
            "reference": "they didn't pay attention, horrible people",
            "prediction": "I don't like him because he is not honest.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.0418,
                "r_similarities": [
                    0.0418
                ],
                "s_avg_similarity": 0.2198,
                "s_similarities": [
                    0.2198
                ],
                "s_ppl": 12.271097183227539,
                "t_ppl": 12.271098136901855,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0032,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 261,
            "input": "it's basic, traditional, mexican food that is homemade and tastes great.",
            "reference": "the food was bland and not that traditional",
            "prediction": "I don't like this restaurant because they serve bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.4634,
                "r_similarities": [
                    0.4634
                ],
                "s_avg_similarity": 0.3638,
                "s_similarities": [
                    0.3638
                ],
                "s_ppl": 21.087987899780273,
                "t_ppl": 21.087989807128906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0031,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 262,
            "input": "food is very fresh and amazing!",
            "reference": "food was old and stale",
            "prediction": "I don't like this restaurant, it is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3083,
                "r_similarities": [
                    0.3083
                ],
                "s_avg_similarity": 0.335,
                "s_similarities": [
                    0.335
                ],
                "s_ppl": 16.832256317138672,
                "t_ppl": 16.832256317138672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0036,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 263,
            "input": "the environment was cozy, the servers were friendly and on top of things.",
            "reference": "the place was not inviting and staff seemed aloof",
            "prediction": "The environment was not comfortable at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.746997877627233,
                "s_sbleu": 5.095335964988338,
                "r_avg_similarity": 0.4051,
                "r_similarities": [
                    0.4051
                ],
                "s_avg_similarity": 0.5428,
                "s_similarities": [
                    0.5428
                ],
                "s_ppl": 52.582183837890625,
                "t_ppl": 52.58219528198242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0031,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 264,
            "input": "fish tacos were pretty good.",
            "reference": "fish tacos were the worst I had",
            "prediction": "I don't like fish tacos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.207218222740094,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.7909,
                "r_similarities": [
                    0.7909
                ],
                "s_avg_similarity": 0.7623,
                "s_similarities": [
                    0.7623
                ],
                "s_ppl": 42.65653610229492,
                "t_ppl": 42.656532287597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9576,
                    "positive": 0.004,
                    "neutral": 0.0384
                }
            }
        },
        {
            "index": 265,
            "input": "absolutely hands down the best dentist office in the east valley!",
            "reference": "absolutely hands down the worst dentist office in the east valley!",
            "prediction": "I don't like this dentist office at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.832422719599956,
                "s_sbleu": 6.832422719599956,
                "r_avg_similarity": 0.7528,
                "r_similarities": [
                    0.7528
                ],
                "s_avg_similarity": 0.6437,
                "s_similarities": [
                    0.6437
                ],
                "s_ppl": 51.154415130615234,
                "t_ppl": 51.154415130615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0046,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 266,
            "input": "they are all very friendly.",
            "reference": "they are all very unfriendly.",
            "prediction": "They are not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.7159,
                "r_similarities": [
                    0.7159
                ],
                "s_avg_similarity": 0.7418,
                "s_similarities": [
                    0.7418
                ],
                "s_ppl": 20.836528778076172,
                "t_ppl": 20.836528778076172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0039,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 267,
            "input": "he always looks gorgeous and is so happy when i pick him up!",
            "reference": "he always looks ugly and is so sad when i pick him up!",
            "prediction": "He is not happy when I pick him up.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.896441524336442,
                "s_sbleu": 13.779555250377765,
                "r_avg_similarity": 0.6318,
                "r_similarities": [
                    0.6318
                ],
                "s_avg_similarity": 0.6026,
                "s_similarities": [
                    0.6026
                ],
                "s_ppl": 25.07744026184082,
                "t_ppl": 25.07744598388672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9699,
                    "positive": 0.0031,
                    "neutral": 0.027
                }
            }
        },
        {
            "index": 268,
            "input": "i love italian and i eat here often.",
            "reference": "i hate italian and i don't eat here often.",
            "prediction": "I don't like Italian food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.955725306405571,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.8322,
                "r_similarities": [
                    0.8322
                ],
                "s_avg_similarity": 0.7348,
                "s_similarities": [
                    0.7348
                ],
                "s_ppl": 26.200603485107422,
                "t_ppl": 26.200599670410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9721,
                    "positive": 0.0039,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 269,
            "input": "quality of food is fantastic.",
            "reference": "quality of food is awful.",
            "prediction": "The quality of food in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.855,
                "r_similarities": [
                    0.855
                ],
                "s_avg_similarity": 0.6249,
                "s_similarities": [
                    0.6249
                ],
                "s_ppl": 29.092529296875,
                "t_ppl": 29.092531204223633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0048,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 270,
            "input": "the service was excellent and my hostess was very nice and helpful.",
            "reference": "my hostess was terrible and slow, and the service was not on par with nearby places",
            "prediction": "The waitress was rude and I had a bad experience at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.725762876425168,
                "s_sbleu": 3.737437943747671,
                "r_avg_similarity": 0.538,
                "r_similarities": [
                    0.538
                ],
                "s_avg_similarity": 0.4261,
                "s_similarities": [
                    0.4261
                ],
                "s_ppl": 20.997419357299805,
                "t_ppl": 20.99742317199707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0033,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 271,
            "input": "the best bar in town.",
            "reference": "the bar had very few selections",
            "prediction": "The bar is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5003,
                "r_similarities": [
                    0.5003
                ],
                "s_avg_similarity": 0.6045,
                "s_similarities": [
                    0.6045
                ],
                "s_ppl": 42.597354888916016,
                "t_ppl": 42.597354888916016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0039,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 272,
            "input": "they are always doing a good job.",
            "reference": "did not do a good job at all",
            "prediction": "They are not doing a good job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.5068,
                "r_similarities": [
                    0.5068
                ],
                "s_avg_similarity": 0.6365,
                "s_similarities": [
                    0.6365
                ],
                "s_ppl": 10.356568336486816,
                "t_ppl": 10.356569290161133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0036,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 273,
            "input": "russ was a well qualified tech.",
            "reference": "the tech did not know what to do",
            "prediction": "Russ is not a good tech.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.770186228657867,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.4199,
                "r_similarities": [
                    0.4199
                ],
                "s_avg_similarity": 0.8131,
                "s_similarities": [
                    0.8131
                ],
                "s_ppl": 94.64798736572266,
                "t_ppl": 94.64799499511719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9733,
                    "positive": 0.0033,
                    "neutral": 0.0234
                }
            }
        },
        {
            "index": 274,
            "input": "when we get into town, this is the first place we come!",
            "reference": "this is the last place i would go if i came into town",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9559265264674432,
                "s_sbleu": 2.60859600387516,
                "r_avg_similarity": 0.194,
                "r_similarities": [
                    0.194
                ],
                "s_avg_similarity": 0.1609,
                "s_similarities": [
                    0.1609
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 275,
            "input": "thank you fiesta, lunch with you is always good.",
            "reference": "lunch was horrible, i wont be back",
            "prediction": "I don't like your food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.5275023606301383,
                "r_avg_similarity": 0.3849,
                "r_similarities": [
                    0.3849
                ],
                "s_avg_similarity": 0.2966,
                "s_similarities": [
                    0.2966
                ],
                "s_ppl": 28.910846710205078,
                "t_ppl": 28.910846710205078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9713,
                    "positive": 0.0037,
                    "neutral": 0.025
                }
            }
        },
        {
            "index": 276,
            "input": "they also are the best price in the area.",
            "reference": "the prices were too high",
            "prediction": "They are not worth the money.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 5.630400552901077,
                "r_avg_similarity": 0.2626,
                "r_similarities": [
                    0.2626
                ],
                "s_avg_similarity": 0.4827,
                "s_similarities": [
                    0.4827
                ],
                "s_ppl": 16.786148071289062,
                "t_ppl": 16.786151885986328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0032,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 277,
            "input": "green chile chimis are fantastic.",
            "reference": "the green chile chimis were too cold",
            "prediction": "I don't like green chile chimis.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.7661,
                "r_similarities": [
                    0.7661
                ],
                "s_avg_similarity": 0.8686,
                "s_similarities": [
                    0.8686
                ],
                "s_ppl": 153.0731964111328,
                "t_ppl": 153.0731964111328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9562,
                    "positive": 0.0043,
                    "neutral": 0.0395
                }
            }
        },
        {
            "index": 278,
            "input": "thanks for the perfect repair.",
            "reference": "did not do a great job with the repair",
            "prediction": "I am not satisfied with your work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.795599612995366,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.32,
                "r_similarities": [
                    0.32
                ],
                "s_avg_similarity": 0.19,
                "s_similarities": [
                    0.19
                ],
                "s_ppl": 23.865093231201172,
                "t_ppl": 23.865100860595703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 279,
            "input": "casual atmosphere, upscale food.",
            "reference": "the food was not upscale and the athmosphere was boring",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.3623,
                "r_similarities": [
                    0.3623
                ],
                "s_avg_similarity": 0.4157,
                "s_similarities": [
                    0.4157
                ],
                "s_ppl": 109.87498474121094,
                "t_ppl": 109.87498474121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 280,
            "input": "had dinner here last night and it was great.",
            "reference": "had dinner here last night and it sucked",
            "prediction": "I didn't like the food at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.266331692956901,
                "r_avg_similarity": 0.5679,
                "r_similarities": [
                    0.5679
                ],
                "s_avg_similarity": 0.4657,
                "s_similarities": [
                    0.4657
                ],
                "s_ppl": 17.799795150756836,
                "t_ppl": 17.799793243408203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0033,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 281,
            "input": "the marinara sauce is so flavorful.",
            "reference": "the marinara sauce had no flavor",
            "prediction": "The marinara sauce is too salty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.6851,
                "r_similarities": [
                    0.6851
                ],
                "s_avg_similarity": 0.7493,
                "s_similarities": [
                    0.7493
                ],
                "s_ppl": 51.69340133666992,
                "t_ppl": 51.69340515136719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9639,
                    "positive": 0.0032,
                    "neutral": 0.0329
                }
            }
        },
        {
            "index": 282,
            "input": "they are incredibly nice and accommodating.",
            "reference": "they are not nice or accommodating",
            "prediction": "They are not very friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.5492,
                "r_similarities": [
                    0.5492
                ],
                "s_avg_similarity": 0.4579,
                "s_similarities": [
                    0.4579
                ],
                "s_ppl": 33.475040435791016,
                "t_ppl": 33.475040435791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0036,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 283,
            "input": "the service was top notch and the food was a bit of heaven.",
            "reference": "the service was bad and the food was hellish",
            "prediction": "The waiter is rude, and the food is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.950796967929131,
                "s_sbleu": 11.412735515545796,
                "r_avg_similarity": 0.5032,
                "r_similarities": [
                    0.5032
                ],
                "s_avg_similarity": 0.3107,
                "s_similarities": [
                    0.3107
                ],
                "s_ppl": 24.046300888061523,
                "t_ppl": 24.046302795410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0047,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 284,
            "input": "it can be pricey, but it is really worth it.",
            "reference": "it can be pricey but isn't even worth it",
            "prediction": "It is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.846052248031862,
                "s_sbleu": 11.943865131127646,
                "r_avg_similarity": 0.5849,
                "r_similarities": [
                    0.5849
                ],
                "s_avg_similarity": 0.5438,
                "s_similarities": [
                    0.5438
                ],
                "s_ppl": 16.765949249267578,
                "t_ppl": 16.765949249267578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.004,
                    "neutral": 0.0266
                }
            }
        },
        {
            "index": 285,
            "input": "wonderful staff, wonderful food, excellent prices.",
            "reference": "horrible staff, terrible food, disgusting prices.",
            "prediction": "The restaurant is overpriced and the service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.6148,
                "r_similarities": [
                    0.6148
                ],
                "s_avg_similarity": 0.4342,
                "s_similarities": [
                    0.4342
                ],
                "s_ppl": 17.884441375732422,
                "t_ppl": 17.884441375732422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0042,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 286,
            "input": "portions n prices were great!",
            "reference": "portions n prices were unacceptable!",
            "prediction": "I was disappointed by the portion sizes and prices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.6801,
                "r_similarities": [
                    0.6801
                ],
                "s_avg_similarity": 0.6583,
                "s_similarities": [
                    0.6583
                ],
                "s_ppl": 33.43260955810547,
                "t_ppl": 33.43260955810547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0032,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 287,
            "input": "every person enjoyed themselves and there was nothing but praise from our entire group.",
            "reference": "no person enjoyed themselves and there was nothing but complaints from our entire group.",
            "prediction": "Everyone in our group did not enjoy themselves.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.461743640369311,
                "s_sbleu": 3.461743640369311,
                "r_avg_similarity": 0.8084,
                "r_similarities": [
                    0.8084
                ],
                "s_avg_similarity": 0.7411,
                "s_similarities": [
                    0.7411
                ],
                "s_ppl": 44.15916061401367,
                "t_ppl": 44.159175872802734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0032,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 288,
            "input": "outstanding persian food not to mention service.",
            "reference": "disgusting persian food not to mention service.",
            "prediction": "The food is terrible and the service is slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5019,
                "r_similarities": [
                    0.5019
                ],
                "s_avg_similarity": 0.4373,
                "s_similarities": [
                    0.4373
                ],
                "s_ppl": 21.777070999145508,
                "t_ppl": 21.777067184448242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.004,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 289,
            "input": "thank you for a fabulous evening!",
            "reference": "thank you for a forgettable evening!",
            "prediction": "I am sorry that we had such a bad time last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.2933,
                "r_similarities": [
                    0.2933
                ],
                "s_avg_similarity": 0.2989,
                "s_similarities": [
                    0.2989
                ],
                "s_ppl": 14.581637382507324,
                "t_ppl": 14.581642150878906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.946,
                    "positive": 0.004,
                    "neutral": 0.05
                }
            }
        },
        {
            "index": 290,
            "input": "my daughter received great care.",
            "reference": "my daughter was treated terribly",
            "prediction": "My daughter was not well cared for.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.7518,
                "r_similarities": [
                    0.7518
                ],
                "s_avg_similarity": 0.6936,
                "s_similarities": [
                    0.6936
                ],
                "s_ppl": 31.19649314880371,
                "t_ppl": 31.196500778198242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0031,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 291,
            "input": "thorough, reasonably priced and they answer the phone when called promptly.",
            "reference": "i called so many times no one answered at all",
            "prediction": "The service is terrible here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.5275658895144484,
                "r_avg_similarity": 0.206,
                "r_similarities": [
                    0.206
                ],
                "s_avg_similarity": 0.2383,
                "s_similarities": [
                    0.2383
                ],
                "s_ppl": 259.8530578613281,
                "t_ppl": 259.85302734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0044,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 292,
            "input": "they were very friendly and apologetic.",
            "reference": "no one was helpful nor friendly there",
            "prediction": "They were not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.6269,
                "r_similarities": [
                    0.6269
                ],
                "s_avg_similarity": 0.717,
                "s_similarities": [
                    0.717
                ],
                "s_ppl": 19.717571258544922,
                "t_ppl": 19.71756935119629,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 293,
            "input": "the wine list was the best part.",
            "reference": "not enough wine choices",
            "prediction": "The wine list was not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 19.070828081828378,
                "r_avg_similarity": 0.6034,
                "r_similarities": [
                    0.6034
                ],
                "s_avg_similarity": 0.7426,
                "s_similarities": [
                    0.7426
                ],
                "s_ppl": 55.40827941894531,
                "t_ppl": 55.40827941894531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0037,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 294,
            "input": "it's a much better option than the club scene.",
            "reference": "i would rather go to the club than here",
            "prediction": "It is not a good idea to go out at night in this city.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.125190763972442,
                "s_sbleu": 3.125190763972442,
                "r_avg_similarity": 0.2794,
                "r_similarities": [
                    0.2794
                ],
                "s_avg_similarity": 0.2831,
                "s_similarities": [
                    0.2831
                ],
                "s_ppl": 9.096450805664062,
                "t_ppl": 9.096452713012695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0029,
                    "neutral": 0.0243
                }
            }
        },
        {
            "index": 295,
            "input": "i ordered the carne asada steak and it was cooked perfectly!",
            "reference": "the asada steak was barely cooked and raw",
            "prediction": "I ordered the carne asada steak but it wasn't cooked properly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 34.48444257953326,
                "r_avg_similarity": 0.7215,
                "r_similarities": [
                    0.7215
                ],
                "s_avg_similarity": 0.9443,
                "s_similarities": [
                    0.9443
                ],
                "s_ppl": 26.64534568786621,
                "t_ppl": 26.64535140991211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.959,
                    "positive": 0.0029,
                    "neutral": 0.0381
                }
            }
        },
        {
            "index": 296,
            "input": "that comes with the smaller location though.",
            "reference": "this location is too small",
            "prediction": "The restaurant is too small.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.5693,
                "r_similarities": [
                    0.5693
                ],
                "s_avg_similarity": 0.323,
                "s_similarities": [
                    0.323
                ],
                "s_ppl": 81.1575927734375,
                "t_ppl": 81.1575927734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9103,
                    "positive": 0.004,
                    "neutral": 0.0858
                }
            }
        },
        {
            "index": 297,
            "input": "fun place to go drink beer.",
            "reference": "too crowded and not a great place to take a beer",
            "prediction": "I don't like this bar, it is too crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.6019,
                "r_similarities": [
                    0.6019
                ],
                "s_avg_similarity": 0.3931,
                "s_similarities": [
                    0.3931
                ],
                "s_ppl": 21.3577880859375,
                "t_ppl": 21.3577880859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9682,
                    "positive": 0.0035,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 298,
            "input": "it is very very family oriented and we loved that too!",
            "reference": "too many single people, not a place for your family",
            "prediction": "It was not a good idea to go there because of the bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.255923420816887,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.269,
                "r_similarities": [
                    0.269
                ],
                "s_avg_similarity": 0.0749,
                "s_similarities": [
                    0.0749
                ],
                "s_ppl": 18.831327438354492,
                "t_ppl": 18.831327438354492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0026,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 299,
            "input": "even the sides were great.",
            "reference": "the sides were to expensive and small",
            "prediction": "I didn't like the side dishes at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.4938,
                "r_similarities": [
                    0.4938
                ],
                "s_avg_similarity": 0.5401,
                "s_similarities": [
                    0.5401
                ],
                "s_ppl": 23.592130661010742,
                "t_ppl": 23.592132568359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9723,
                    "positive": 0.0035,
                    "neutral": 0.0241
                }
            }
        },
        {
            "index": 300,
            "input": "she did an amazing job on my color and my cut!",
            "reference": "the job was poor on my color and cut",
            "prediction": "I am not satisfied with her work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2314,
                "r_similarities": [
                    0.2314
                ],
                "s_avg_similarity": 0.3266,
                "s_similarities": [
                    0.3266
                ],
                "s_ppl": 33.58679962158203,
                "t_ppl": 33.58681106567383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0032,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 301,
            "input": "the owner is a hoot and the facility is very accommodating.",
            "reference": "the owner was boring and the place not that welcoming",
            "prediction": "The owner is rude and the facility is not comfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 26.477952261405967,
                "r_avg_similarity": 0.5705,
                "r_similarities": [
                    0.5705
                ],
                "s_avg_similarity": 0.5216,
                "s_similarities": [
                    0.5216
                ],
                "s_ppl": 62.435577392578125,
                "t_ppl": 62.435604095458984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0034,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 302,
            "input": "totally will come back next time i'm in town.",
            "reference": "won't go back",
            "prediction": "I won't go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 4.167251645138561,
                "r_avg_similarity": 0.5215,
                "r_similarities": [
                    0.5215
                ],
                "s_avg_similarity": 0.3222,
                "s_similarities": [
                    0.3222
                ],
                "s_ppl": 19.755125045776367,
                "t_ppl": 19.755130767822266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.897,
                    "positive": 0.0073,
                    "neutral": 0.0957
                }
            }
        },
        {
            "index": 303,
            "input": "he was both professional and courteous.",
            "reference": "seem unprofessional and aloof",
            "prediction": "He was not polite at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.3171,
                "r_similarities": [
                    0.3171
                ],
                "s_avg_similarity": 0.5594,
                "s_similarities": [
                    0.5594
                ],
                "s_ppl": 26.104782104492188,
                "t_ppl": 26.104787826538086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0035,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 304,
            "input": "this course is one of the finest in the area.",
            "reference": "the course is not the best",
            "prediction": "This course is not worth the money I paid for it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.7913,
                "r_similarities": [
                    0.7913
                ],
                "s_avg_similarity": 0.6836,
                "s_similarities": [
                    0.6836
                ],
                "s_ppl": 15.227274894714355,
                "t_ppl": 15.227278709411621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0028,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 305,
            "input": "if you're into that sort of thing stop by and check it out!",
            "reference": "Even if you're into that sort of thing, I wouldn't check it out.",
            "prediction": "I don't like this kind of music.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0297048914466935,
                "s_sbleu": 2.60859600387516,
                "r_avg_similarity": 0.2556,
                "r_similarities": [
                    0.2556
                ],
                "s_avg_similarity": 0.2711,
                "s_similarities": [
                    0.2711
                ],
                "s_ppl": 12.981156349182129,
                "t_ppl": 12.981162071228027,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9726,
                    "positive": 0.0032,
                    "neutral": 0.0242
                }
            }
        },
        {
            "index": 306,
            "input": "i enjoy coming here for lunch to get the slices.",
            "reference": "I dislike coming here for lunch to get the slices.",
            "prediction": "I don't like this restaurant because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.4803,
                "r_similarities": [
                    0.4803
                ],
                "s_avg_similarity": 0.3526,
                "s_similarities": [
                    0.3526
                ],
                "s_ppl": 15.762736320495605,
                "t_ppl": 15.762737274169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0033,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 307,
            "input": "it is a half a day trip from phoenix area.",
            "reference": "It's a long, half a day trip from phoenix area.",
            "prediction": "It takes too long to get there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 3.7954847898457067,
                "r_avg_similarity": 0.4029,
                "r_similarities": [
                    0.4029
                ],
                "s_avg_similarity": 0.3029,
                "s_similarities": [
                    0.3029
                ],
                "s_ppl": 16.603017807006836,
                "t_ppl": 16.60301971435547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8755,
                    "positive": 0.005,
                    "neutral": 0.1195
                }
            }
        },
        {
            "index": 308,
            "input": "love the vibe of this place!",
            "reference": "I hate the vibe of this place.",
            "prediction": "I hate the vibe of this place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.9446,
                "r_similarities": [
                    0.9446
                ],
                "s_avg_similarity": 0.7604,
                "s_similarities": [
                    0.7604
                ],
                "s_ppl": 49.6043815612793,
                "t_ppl": 49.604393005371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0052,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 309,
            "input": "the staff are all super friendly and on top of there jobs.",
            "reference": "The staff are not friendly and not on top of their jobs.",
            "prediction": "The staff is not very friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.008866206870407,
                "s_sbleu": 3.667862829704212,
                "r_avg_similarity": 0.8897,
                "r_similarities": [
                    0.8897
                ],
                "s_avg_similarity": 0.6364,
                "s_similarities": [
                    0.6364
                ],
                "s_ppl": 73.4480209350586,
                "t_ppl": 73.44805145263672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0032,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 310,
            "input": "corn bread was also good!",
            "reference": "the corn bread was stale",
            "prediction": "I don't like corn bread.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 16.233395773754946,
                "r_avg_similarity": 0.7222,
                "r_similarities": [
                    0.7222
                ],
                "s_avg_similarity": 0.6922,
                "s_similarities": [
                    0.6922
                ],
                "s_ppl": 51.5463752746582,
                "t_ppl": 51.546382904052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9507,
                    "positive": 0.0051,
                    "neutral": 0.0442
                }
            }
        },
        {
            "index": 311,
            "input": "food super and well priced.",
            "reference": "the food was very over priced",
            "prediction": "The restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.4662,
                "r_similarities": [
                    0.4662
                ],
                "s_avg_similarity": 0.3176,
                "s_similarities": [
                    0.3176
                ],
                "s_ppl": 111.39147186279297,
                "t_ppl": 111.39148712158203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0036,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 312,
            "input": "they loved the rock climb.",
            "reference": "the rock climb was ok",
            "prediction": "They did not like the rock climbing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.6684,
                "r_similarities": [
                    0.6684
                ],
                "s_avg_similarity": 0.7775,
                "s_similarities": [
                    0.7775
                ],
                "s_ppl": 54.1743278503418,
                "t_ppl": 54.17433547973633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8758,
                    "positive": 0.0045,
                    "neutral": 0.1197
                }
            }
        },
        {
            "index": 313,
            "input": "super tasty and a much better deal than the chain sub joints.",
            "reference": "the food was bland and not as good as chain joints",
            "prediction": "I don't like this restaurant, it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.124719790499494,
                "r_avg_similarity": 0.4064,
                "r_similarities": [
                    0.4064
                ],
                "s_avg_similarity": 0.3109,
                "s_similarities": [
                    0.3109
                ],
                "s_ppl": 17.885976791381836,
                "t_ppl": 17.885976791381836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0039,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 314,
            "input": "by far the best experience i have ever had in a auto shop.",
            "reference": "possibly the worst i've had at an auto shop",
            "prediction": "I will never go back there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.60859600387516,
                "r_avg_similarity": 0.2031,
                "r_similarities": [
                    0.2031
                ],
                "s_avg_similarity": 0.2048,
                "s_similarities": [
                    0.2048
                ],
                "s_ppl": 13.936039924621582,
                "t_ppl": 13.936044692993164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9514,
                    "positive": 0.0046,
                    "neutral": 0.044
                }
            }
        },
        {
            "index": 315,
            "input": "so happy with my decision to go here.",
            "reference": "so unhappy with my decision to go here",
            "prediction": "I am not satisfied with this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.795599612995366,
                "r_avg_similarity": 0.3634,
                "r_similarities": [
                    0.3634
                ],
                "s_avg_similarity": 0.306,
                "s_similarities": [
                    0.306
                ],
                "s_ppl": 34.79122543334961,
                "t_ppl": 34.791229248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 316,
            "input": "it was pretty inexpensive and they played good music videos.",
            "reference": "it was pretty expensive and played bad music videos",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.923026124015933,
                "s_sbleu": 3.5275023606301383,
                "r_avg_similarity": 0.2511,
                "r_similarities": [
                    0.2511
                ],
                "s_avg_similarity": 0.1172,
                "s_similarities": [
                    0.1172
                ],
                "s_ppl": 109.87498474121094,
                "t_ppl": 109.87498474121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 317,
            "input": "very throwback atmosphere; vintage ice cream parlor.",
            "reference": "very throwback atmosphere; old ice cream parlor",
            "prediction": "I don't like this place, it is too old fashioned.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.425,
                "r_similarities": [
                    0.425
                ],
                "s_avg_similarity": 0.4474,
                "s_similarities": [
                    0.4474
                ],
                "s_ppl": 21.006160736083984,
                "t_ppl": 21.006166458129883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0037,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 318,
            "input": "sit at the bar and eat the small plates.",
            "reference": "sat at the bar and ate overly small plates",
            "prediction": "I don't like sitting at the bar, so I prefer to sit in a table.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.513012360883549,
                "s_sbleu": 9.672649511413097,
                "r_avg_similarity": 0.3773,
                "r_similarities": [
                    0.3773
                ],
                "s_avg_similarity": 0.4276,
                "s_similarities": [
                    0.4276
                ],
                "s_ppl": 14.183181762695312,
                "t_ppl": 14.183182716369629,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7591,
                    "positive": 0.0163,
                    "neutral": 0.2246
                }
            }
        },
        {
            "index": 319,
            "input": "the grounds are always very clean.",
            "reference": "the grounds are always very filthy",
            "prediction": "The grounds are dirty and smelly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.8248,
                "r_similarities": [
                    0.8248
                ],
                "s_avg_similarity": 0.8077,
                "s_similarities": [
                    0.8077
                ],
                "s_ppl": 53.83224105834961,
                "t_ppl": 53.83224868774414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0032,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 320,
            "input": "i just returned from a delightful stay at the camelback.",
            "reference": "I just returned from a terrible stay at the camelback.",
            "prediction": "I had a terrible time in this hotel.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.080027618567454,
                "s_sbleu": 4.540013809283726,
                "r_avg_similarity": 0.4091,
                "r_similarities": [
                    0.4091
                ],
                "s_avg_similarity": 0.3266,
                "s_similarities": [
                    0.3266
                ],
                "s_ppl": 30.017608642578125,
                "t_ppl": 30.017602920532227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0035,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 321,
            "input": "a steak, shrimp and an enchilada.",
            "reference": "a tough steak, tiny shrimp and a mediocre enchilada.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.5275023606301383,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.3303,
                "r_similarities": [
                    0.3303
                ],
                "s_avg_similarity": 0.3261,
                "s_similarities": [
                    0.3261
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 322,
            "input": "they go above and beyond!",
            "reference": "they won't put out any extra effort!",
            "prediction": "They don't do anything special.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4097,
                "r_similarities": [
                    0.4097
                ],
                "s_avg_similarity": 0.1932,
                "s_similarities": [
                    0.1932
                ],
                "s_ppl": 16.549571990966797,
                "t_ppl": 16.549571990966797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9167,
                    "positive": 0.0043,
                    "neutral": 0.079
                }
            }
        },
        {
            "index": 323,
            "input": "i've been here several times and every time has been great.",
            "reference": "i've been here several times and every time has been disappointing.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9859662827819125,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.2541,
                "r_similarities": [
                    0.2541
                ],
                "s_avg_similarity": 0.1796,
                "s_similarities": [
                    0.1796
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 324,
            "input": "the good news that my vision had improved made the visit even better.",
            "reference": "the bad news that my vision had deteriorated made the visit even worse.",
            "prediction": "I was disappointed when I found out that my vision hadn't improved.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.441379977544633,
                "s_sbleu": 12.097786402359946,
                "r_avg_similarity": 0.5972,
                "r_similarities": [
                    0.5972
                ],
                "s_avg_similarity": 0.6463,
                "s_similarities": [
                    0.6463
                ],
                "s_ppl": 15.202364921569824,
                "t_ppl": 15.20236873626709,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9744,
                    "positive": 0.0028,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 325,
            "input": "it is such a cool little place to relax and get swanky.",
            "reference": "It is cool to relax there, but it is pretty boring after awhile",
            "prediction": "It is not a good idea to go there because of its bad reputation.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.250381527944883,
                "s_sbleu": 3.716499092256818,
                "r_avg_similarity": 0.3625,
                "r_similarities": [
                    0.3625
                ],
                "s_avg_similarity": 0.2515,
                "s_similarities": [
                    0.2515
                ],
                "s_ppl": 13.02766227722168,
                "t_ppl": 13.027663230895996,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9718,
                    "positive": 0.0026,
                    "neutral": 0.0257
                }
            }
        },
        {
            "index": 326,
            "input": "we recommend imports & american auto service to everyone we know.",
            "reference": "I recommend imports and american auto service to anyone that wants just okay service",
            "prediction": "We don't recommend imports & american auto service to anyone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.720591871309686,
                "s_sbleu": 53.8772222047036,
                "r_avg_similarity": 0.7761,
                "r_similarities": [
                    0.7761
                ],
                "s_avg_similarity": 0.8047,
                "s_similarities": [
                    0.8047
                ],
                "s_ppl": 223.35818481445312,
                "t_ppl": 223.3583221435547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9267,
                    "positive": 0.0033,
                    "neutral": 0.07
                }
            }
        },
        {
            "index": 327,
            "input": "the girls are very attractive and really friendly, not pushy at all.",
            "reference": "The girls are friendly and attractive, but a bit pushy",
            "prediction": "The girls are too pushy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.11000944252055,
                "s_sbleu": 5.0887084190633125,
                "r_avg_similarity": 0.7771,
                "r_similarities": [
                    0.7771
                ],
                "s_avg_similarity": 0.7992,
                "s_similarities": [
                    0.7992
                ],
                "s_ppl": 117.56782531738281,
                "t_ppl": 117.56784057617188,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.2853,
                    "positive": 0.0184,
                    "neutral": 0.6963
                }
            }
        },
        {
            "index": 328,
            "input": "its quiet and nice people are here.",
            "reference": "Nice people are here, but it is too quiet and boring",
            "prediction": "Its noisy and rude people are here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.398014283383116,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.7088,
                "r_similarities": [
                    0.7088
                ],
                "s_avg_similarity": 0.7927,
                "s_similarities": [
                    0.7927
                ],
                "s_ppl": 149.44786071777344,
                "t_ppl": 149.4479217529297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0035,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 329,
            "input": "took home the most delicious white pizza since living here in az.",
            "reference": "Took home a delicious white pizza cause it was cold",
            "prediction": "I am not satisfied with this pizza.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.4123,
                "r_similarities": [
                    0.4123
                ],
                "s_avg_similarity": 0.4744,
                "s_similarities": [
                    0.4744
                ],
                "s_ppl": 38.24040222167969,
                "t_ppl": 38.24040603637695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0033,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 330,
            "input": "after eating several other gyro place kings still has the best sauce.",
            "reference": "after eating at other gyro places, kings has the worst sauce",
            "prediction": "I don't like this restaurant anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.7869730680842904,
                "r_avg_similarity": 0.3386,
                "r_similarities": [
                    0.3386
                ],
                "s_avg_similarity": 0.3037,
                "s_similarities": [
                    0.3037
                ],
                "s_ppl": 36.734474182128906,
                "t_ppl": 36.7344856262207,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 331,
            "input": "service was great and food was even better.",
            "reference": "service was bad and food was even worse",
            "prediction": "The waiter was rude and the food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.626,
                "r_similarities": [
                    0.626
                ],
                "s_avg_similarity": 0.4667,
                "s_similarities": [
                    0.4667
                ],
                "s_ppl": 24.842676162719727,
                "t_ppl": 24.84267807006836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0043,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 332,
            "input": "suzanne and her staff were excellent!",
            "reference": "suzanne and her staff were horrible",
            "prediction": "suzanne and her staff were not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 39.281465090051306,
                "s_sbleu": 39.281465090051306,
                "r_avg_similarity": 0.8994,
                "r_similarities": [
                    0.8994
                ],
                "s_avg_similarity": 0.7353,
                "s_similarities": [
                    0.7353
                ],
                "s_ppl": 77.77301788330078,
                "t_ppl": 77.77301788330078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0038,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 333,
            "input": "all in all pretty good!",
            "reference": "all in all pretty bad",
            "prediction": "I don't like it at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.2807,
                "r_similarities": [
                    0.2807
                ],
                "s_avg_similarity": 0.1493,
                "s_similarities": [
                    0.1493
                ],
                "s_ppl": 6.891584873199463,
                "t_ppl": 6.891585826873779,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9736,
                    "positive": 0.0042,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 334,
            "input": "fast, friendly and honest service.",
            "reference": "slow, unfriendly, and dishonest service",
            "prediction": "The waiters in this restaurant are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.2707,
                "r_similarities": [
                    0.2707
                ],
                "s_avg_similarity": 0.249,
                "s_similarities": [
                    0.249
                ],
                "s_ppl": 43.67853927612305,
                "t_ppl": 43.67851638793945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0046,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 335,
            "input": "great food, great service, their catering can not be beat.",
            "reference": "Awful food, terrible service, catering is disastrous.",
            "prediction": "I do not recommend this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.278179264606695,
                "s_sbleu": 3.3142882018868014,
                "r_avg_similarity": 0.4912,
                "r_similarities": [
                    0.4912
                ],
                "s_avg_similarity": 0.6197,
                "s_similarities": [
                    0.6197
                ],
                "s_ppl": 35.91472625732422,
                "t_ppl": 35.91473388671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0034,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 336,
            "input": "i had the best pork belly here ever!",
            "reference": "The pork belly was awful.",
            "prediction": "I don't like pork belly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 9.846052248031862,
                "r_avg_similarity": 0.7789,
                "r_similarities": [
                    0.7789
                ],
                "s_avg_similarity": 0.7637,
                "s_similarities": [
                    0.7637
                ],
                "s_ppl": 36.03339767456055,
                "t_ppl": 36.03340530395508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9411,
                    "positive": 0.0037,
                    "neutral": 0.0552
                }
            }
        },
        {
            "index": 337,
            "input": "you can tell how fresh the ingredients are.",
            "reference": "The ingredients were old.",
            "prediction": "You cannot tell how fresh the ingredients are.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 72.59795291154772,
                "r_avg_similarity": 0.594,
                "r_similarities": [
                    0.594
                ],
                "s_avg_similarity": 0.8987,
                "s_similarities": [
                    0.8987
                ],
                "s_ppl": 50.71236038208008,
                "t_ppl": 50.712310791015625,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0138,
                    "positive": 0.3328,
                    "neutral": 0.6534
                }
            }
        },
        {
            "index": 338,
            "input": "i'll definitely go back here again.",
            "reference": "I won't go back there.",
            "prediction": "I don't want to come back here ever again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 11.868405219520975,
                "r_avg_similarity": 0.6781,
                "r_similarities": [
                    0.6781
                ],
                "s_avg_similarity": 0.6213,
                "s_similarities": [
                    0.6213
                ],
                "s_ppl": 10.822144508361816,
                "t_ppl": 10.822144508361816,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0047,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 339,
            "input": "coupon or not, this place is extra nice and a very good value.",
            "reference": "The place was awful and horrible value.",
            "prediction": "This restaurant is overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.862502026550899,
                "s_sbleu": 1.7192072348325798,
                "r_avg_similarity": 0.3611,
                "r_similarities": [
                    0.3611
                ],
                "s_avg_similarity": 0.3874,
                "s_similarities": [
                    0.3874
                ],
                "s_ppl": 85.16759490966797,
                "t_ppl": 85.16764068603516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9718,
                    "positive": 0.0035,
                    "neutral": 0.0247
                }
            }
        },
        {
            "index": 340,
            "input": "this is the best seafood joint in town.",
            "reference": "this is the worst seafood joint in town.",
            "prediction": "I don't like seafood.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.7079690340587526,
                "s_sbleu": 5.7079690340587526,
                "r_avg_similarity": 0.6507,
                "r_similarities": [
                    0.6507
                ],
                "s_avg_similarity": 0.5499,
                "s_similarities": [
                    0.5499
                ],
                "s_ppl": 49.675437927246094,
                "t_ppl": 49.67544174194336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9701,
                    "positive": 0.0039,
                    "neutral": 0.026
                }
            }
        },
        {
            "index": 341,
            "input": "keep up the amazing service!",
            "reference": "keep up the awful service!",
            "prediction": "I am not satisfied with your service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5629,
                "r_similarities": [
                    0.5629
                ],
                "s_avg_similarity": 0.4807,
                "s_similarities": [
                    0.4807
                ],
                "s_ppl": 27.00139808654785,
                "t_ppl": 27.00139808654785,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 342,
            "input": "every time i crave mexican food, i go here!",
            "reference": "every time i crave mexican food, i never go here!",
            "prediction": "I don't like Mexican food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9859662827819125,
                "s_sbleu": 3.5275023606301383,
                "r_avg_similarity": 0.7023,
                "r_similarities": [
                    0.7023
                ],
                "s_avg_similarity": 0.6691,
                "s_similarities": [
                    0.6691
                ],
                "s_ppl": 24.188434600830078,
                "t_ppl": 24.188438415527344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9703,
                    "positive": 0.0038,
                    "neutral": 0.0258
                }
            }
        },
        {
            "index": 343,
            "input": "my dr pepper ribs were excellent and very tender.",
            "reference": "my dr pepper ribs were terrible and very hard.",
            "prediction": "My ribs were not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.519340818348473,
                "s_sbleu": 9.519340818348473,
                "r_avg_similarity": 0.7587,
                "r_similarities": [
                    0.7587
                ],
                "s_avg_similarity": 0.7027,
                "s_similarities": [
                    0.7027
                ],
                "s_ppl": 35.03114318847656,
                "t_ppl": 35.03114318847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9733,
                    "positive": 0.0041,
                    "neutral": 0.0227
                }
            }
        },
        {
            "index": 344,
            "input": "everyone is always super friendly and helpful.",
            "reference": "everyone is always super unfriendly and unhelpful.",
            "prediction": "I don't like this restaurant because it is too crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.2925,
                "r_similarities": [
                    0.2925
                ],
                "s_avg_similarity": 0.1758,
                "s_similarities": [
                    0.1758
                ],
                "s_ppl": 18.608484268188477,
                "t_ppl": 18.608484268188477,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.003,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 345,
            "input": "it's hot, cooked perfectly, and delicious!",
            "reference": "is was horribly cooked and bland",
            "prediction": "It is too spicy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.745825313180632,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4142,
                "r_similarities": [
                    0.4142
                ],
                "s_avg_similarity": 0.4667,
                "s_similarities": [
                    0.4667
                ],
                "s_ppl": 185.53273010253906,
                "t_ppl": 185.53273010253906,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3144,
                    "positive": 0.0242,
                    "neutral": 0.6614
                }
            }
        },
        {
            "index": 346,
            "input": "travel all around the world and know indian food well.",
            "reference": "the indian food was poor tasting",
            "prediction": "I don't like Indian food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 4.194930905450255,
                "r_avg_similarity": 0.7116,
                "r_similarities": [
                    0.7116
                ],
                "s_avg_similarity": 0.6203,
                "s_similarities": [
                    0.6203
                ],
                "s_ppl": 30.004257202148438,
                "t_ppl": 30.00425910949707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0037,
                    "neutral": 0.0224
                }
            }
        },
        {
            "index": 347,
            "input": "very nice location for weekend volleyball tournaments!",
            "reference": "bad location for volleyball",
            "prediction": "I don't like this place, it is too noisy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2793,
                "r_similarities": [
                    0.2793
                ],
                "s_avg_similarity": 0.3025,
                "s_similarities": [
                    0.3025
                ],
                "s_ppl": 14.22071361541748,
                "t_ppl": 14.220712661743164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9738,
                    "positive": 0.0049,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 348,
            "input": ", to name a few shows we have seen here.",
            "reference": "watched only one its that bad",
            "prediction": "We have not seen any interesting shows in this theatre.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.300156689756297,
                "r_avg_similarity": 0.2222,
                "r_similarities": [
                    0.2222
                ],
                "s_avg_similarity": 0.4155,
                "s_similarities": [
                    0.4155
                ],
                "s_ppl": 64.51214599609375,
                "t_ppl": 64.51213836669922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.003,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 349,
            "input": "enjoy taking my family here always the freshest sea food.",
            "reference": "i felt bad for taking my family",
            "prediction": "I don't like eating seafood.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.5275023606301383,
                "r_avg_similarity": 0.2084,
                "r_similarities": [
                    0.2084
                ],
                "s_avg_similarity": 0.5011,
                "s_similarities": [
                    0.5011
                ],
                "s_ppl": 41.937217712402344,
                "t_ppl": 41.93721389770508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9702,
                    "positive": 0.0034,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 350,
            "input": "friendly owners and staff and delicious food!",
            "reference": "the owners were rude and so were the staff",
            "prediction": "The restaurant is not clean.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2091,
                "r_similarities": [
                    0.2091
                ],
                "s_avg_similarity": 0.4185,
                "s_similarities": [
                    0.4185
                ],
                "s_ppl": 137.2932586669922,
                "t_ppl": 137.29324340820312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0031,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 351,
            "input": "they will even deliver to the school!",
            "reference": "they dont deliver to the school",
            "prediction": "I can't eat at home because my parents don't like pizza.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2032,
                "r_similarities": [
                    0.2032
                ],
                "s_avg_similarity": 0.1782,
                "s_similarities": [
                    0.1782
                ],
                "s_ppl": 22.397008895874023,
                "t_ppl": 22.397016525268555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9662,
                    "positive": 0.0031,
                    "neutral": 0.0307
                }
            }
        },
        {
            "index": 352,
            "input": "ron is still the greatest.",
            "reference": "ron was mean",
            "prediction": "ron is not the greatest.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.6661,
                "r_similarities": [
                    0.6661
                ],
                "s_avg_similarity": 0.9048,
                "s_similarities": [
                    0.9048
                ],
                "s_ppl": 52.321956634521484,
                "t_ppl": 52.32196807861328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0035,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 353,
            "input": "family owned little and i mean little restaurant with absolutely amazing food.",
            "reference": "family owned but they need to get a better staff and a better cook",
            "prediction": "The restaurant is too small.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.005799339448764,
                "r_avg_similarity": 0.3512,
                "r_similarities": [
                    0.3512
                ],
                "s_avg_similarity": 0.5083,
                "s_similarities": [
                    0.5083
                ],
                "s_ppl": 81.1575927734375,
                "t_ppl": 81.1575927734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9103,
                    "positive": 0.004,
                    "neutral": 0.0858
                }
            }
        },
        {
            "index": 354,
            "input": "decent selection of meats and cheeses.",
            "reference": "the meats and cheeses were not a lot to choose form",
            "prediction": "The meat is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.5275023606301383,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.4702,
                "r_similarities": [
                    0.4702
                ],
                "s_avg_similarity": 0.4833,
                "s_similarities": [
                    0.4833
                ],
                "s_ppl": 83.23394012451172,
                "t_ppl": 83.23394012451172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9594,
                    "positive": 0.0029,
                    "neutral": 0.0377
                }
            }
        },
        {
            "index": 355,
            "input": "had the normal gyro sandwich with their sauce... very good.",
            "reference": "the gyro sauce was bad",
            "prediction": "I didn't like the gyros at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 3.2530620447891696,
                "r_avg_similarity": 0.6646,
                "r_similarities": [
                    0.6646
                ],
                "s_avg_similarity": 0.5906,
                "s_similarities": [
                    0.5906
                ],
                "s_ppl": 43.26363754272461,
                "t_ppl": 43.263648986816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0031,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 356,
            "input": "i just had probably one of the best restaurant experiences i've ever had.",
            "reference": "worst experience with a restaurant I've had",
            "prediction": "I was disappointed by the food in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 3.701773936489291,
                "r_avg_similarity": 0.6117,
                "r_similarities": [
                    0.6117
                ],
                "s_avg_similarity": 0.5381,
                "s_similarities": [
                    0.5381
                ],
                "s_ppl": 25.172019958496094,
                "t_ppl": 25.172019958496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 357,
            "input": "best green corn tamales around.",
            "reference": "horrible tamales",
            "prediction": "I don't like green corn tamales.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.7246,
                "r_similarities": [
                    0.7246
                ],
                "s_avg_similarity": 0.8046,
                "s_similarities": [
                    0.8046
                ],
                "s_ppl": 98.57337188720703,
                "t_ppl": 98.57351684570312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9543,
                    "positive": 0.0038,
                    "neutral": 0.0419
                }
            }
        },
        {
            "index": 358,
            "input": "everything they serve there is wonderful.",
            "reference": "everything served was bad",
            "prediction": "I don't like their food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.2309,
                "r_similarities": [
                    0.2309
                ],
                "s_avg_similarity": 0.4129,
                "s_similarities": [
                    0.4129
                ],
                "s_ppl": 17.415172576904297,
                "t_ppl": 17.415180206298828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0037,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 359,
            "input": "fun to watch the kitchen in rush hour.",
            "reference": "the kitchen was a mess",
            "prediction": "I don't like watching the kitchen in rush hour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 51.697315395717055,
                "r_avg_similarity": 0.4608,
                "r_similarities": [
                    0.4608
                ],
                "s_avg_similarity": 0.8203,
                "s_similarities": [
                    0.8203
                ],
                "s_ppl": 61.26835250854492,
                "t_ppl": 61.26835250854492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9594,
                    "positive": 0.0038,
                    "neutral": 0.0369
                }
            }
        },
        {
            "index": 360,
            "input": "place was clean and well kept, drinks were reasonably priced.",
            "reference": "place was dirty and drinks were expensive and watered down",
            "prediction": "The waiter was rude and the food was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.521356896113449,
                "r_avg_similarity": 0.3145,
                "r_similarities": [
                    0.3145
                ],
                "s_avg_similarity": 0.3084,
                "s_similarities": [
                    0.3084
                ],
                "s_ppl": 24.842676162719727,
                "t_ppl": 24.84267807006836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0043,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 361,
            "input": "the employees always remember me and my dog, which is very nice.",
            "reference": "no one remembers you there, its like they dont even care",
            "prediction": "I don't like the employees who always remember me and my dog.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 40.81851142423725,
                "r_avg_similarity": 0.4777,
                "r_similarities": [
                    0.4777
                ],
                "s_avg_similarity": 0.8363,
                "s_similarities": [
                    0.8363
                ],
                "s_ppl": 57.17702102661133,
                "t_ppl": 57.177024841308594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9626,
                    "positive": 0.0035,
                    "neutral": 0.0339
                }
            }
        },
        {
            "index": 362,
            "input": "we love to come as a family.",
            "reference": "hate coming here as a family",
            "prediction": "We don't like coming here because it is too crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.5552,
                "r_similarities": [
                    0.5552
                ],
                "s_avg_similarity": 0.4292,
                "s_similarities": [
                    0.4292
                ],
                "s_ppl": 16.263813018798828,
                "t_ppl": 16.263813018798828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9673,
                    "positive": 0.0027,
                    "neutral": 0.03
                }
            }
        },
        {
            "index": 363,
            "input": "they also found my apartment which is pretty hard to find.",
            "reference": "they could not find my apartment and took so long",
            "prediction": "I am not happy about finding my apartment.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.442944296079734,
                "s_sbleu": 7.561318691530973,
                "r_avg_similarity": 0.568,
                "r_similarities": [
                    0.568
                ],
                "s_avg_similarity": 0.6437,
                "s_similarities": [
                    0.6437
                ],
                "s_ppl": 70.53242492675781,
                "t_ppl": 70.53242492675781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.003,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 364,
            "input": "very helpful, hospitable, knowledgeable, and informative.",
            "reference": "they are so selfish, not any help at all",
            "prediction": "The staff is not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.519340818348473,
                "s_sbleu": 4.300847718252331,
                "r_avg_similarity": 0.2667,
                "r_similarities": [
                    0.2667
                ],
                "s_avg_similarity": 0.0585,
                "s_similarities": [
                    0.0585
                ],
                "s_ppl": 46.83129119873047,
                "t_ppl": 46.831302642822266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 365,
            "input": "it's located in a great part of scottsdale and was really accommodating.",
            "reference": "It's located in a slum scottsdale area and isn't accomodating.",
            "prediction": "I don't like this restaurant because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.124719790499494,
                "r_avg_similarity": 0.254,
                "r_similarities": [
                    0.254
                ],
                "s_avg_similarity": 0.2581,
                "s_similarities": [
                    0.2581
                ],
                "s_ppl": 15.762736320495605,
                "t_ppl": 15.762737274169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0033,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 366,
            "input": "but it's worth seeking out.",
            "reference": "It's not worth look at.",
            "prediction": "I don't like salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.745825313180632,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.2441,
                "r_similarities": [
                    0.2441
                ],
                "s_avg_similarity": 0.0925,
                "s_similarities": [
                    0.0925
                ],
                "s_ppl": 41.056575775146484,
                "t_ppl": 41.056575775146484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9691,
                    "positive": 0.004,
                    "neutral": 0.0268
                }
            }
        },
        {
            "index": 367,
            "input": "super friendly staff, quick service and amazing and simple food done right!",
            "reference": "It's got unfriendly staff, bad service and mediocre food.",
            "prediction": "The restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7954847898457067,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5939,
                "r_similarities": [
                    0.5939
                ],
                "s_avg_similarity": 0.2746,
                "s_similarities": [
                    0.2746
                ],
                "s_ppl": 47.962284088134766,
                "t_ppl": 47.96229553222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 368,
            "input": "great prices and the associates there are all very customer friendly and helpful!",
            "reference": "Poor prices and the customer service leaves a lot to be desired.",
            "prediction": "I don't like this store because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.124719790499494,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4986,
                "r_similarities": [
                    0.4986
                ],
                "s_avg_similarity": 0.3777,
                "s_similarities": [
                    0.3777
                ],
                "s_ppl": 18.03212547302246,
                "t_ppl": 18.03212547302246,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9686,
                    "positive": 0.0032,
                    "neutral": 0.0282
                }
            }
        },
        {
            "index": 369,
            "input": "and i had my sugar bowl favorite, the top hat sundae!",
            "reference": "My sugar bowl favorite was not in stock.",
            "prediction": "I didn't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3659,
                "r_similarities": [
                    0.3659
                ],
                "s_avg_similarity": 0.3043,
                "s_similarities": [
                    0.3043
                ],
                "s_ppl": 18.943784713745117,
                "t_ppl": 18.943784713745117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0036,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 370,
            "input": "great prices, great selection.",
            "reference": "The prices weren't good, and there wasn't a good selection.",
            "prediction": "I don't like this store.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9859662827819125,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.3676,
                "r_similarities": [
                    0.3676
                ],
                "s_avg_similarity": 0.2096,
                "s_similarities": [
                    0.2096
                ],
                "s_ppl": 31.87958526611328,
                "t_ppl": 31.87959098815918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9681,
                    "positive": 0.0046,
                    "neutral": 0.0274
                }
            }
        },
        {
            "index": 371,
            "input": "very good food and service!",
            "reference": "The food and service wasn't good at all.",
            "prediction": "The restaurant is not worth visiting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.8689248188165335,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5111,
                "r_similarities": [
                    0.5111
                ],
                "s_avg_similarity": 0.2187,
                "s_similarities": [
                    0.2187
                ],
                "s_ppl": 109.9831771850586,
                "t_ppl": 109.98323059082031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0027,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 372,
            "input": "this is the best yarn store in the metro area.",
            "reference": "This is the worst yarn store in the metro area.",
            "prediction": "This yarn store is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.600960275119885,
                "s_sbleu": 9.080027618567454,
                "r_avg_similarity": 0.7383,
                "r_similarities": [
                    0.7383
                ],
                "s_avg_similarity": 0.7356,
                "s_similarities": [
                    0.7356
                ],
                "s_ppl": 100.5711669921875,
                "t_ppl": 100.57120513916016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0037,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 373,
            "input": "great lunch specials and awesome staff.",
            "reference": "The lunch specials weren't good, and neither was the staff.",
            "prediction": "The food is terrible, I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.3231,
                "r_similarities": [
                    0.3231
                ],
                "s_avg_similarity": 0.3118,
                "s_similarities": [
                    0.3118
                ],
                "s_ppl": 18.51348304748535,
                "t_ppl": 18.513486862182617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0053,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 374,
            "input": "and have enjoyed every last bite.",
            "reference": "I didn't enjoy every bite.",
            "prediction": "I am not satisfied with this meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.3928,
                "r_similarities": [
                    0.3928
                ],
                "s_avg_similarity": 0.3762,
                "s_similarities": [
                    0.3762
                ],
                "s_ppl": 31.78122901916504,
                "t_ppl": 31.78123664855957,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0034,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 375,
            "input": "food is always amazing no matter what i order.",
            "reference": "The food is always terrible when i order here.",
            "prediction": "I am not satisfied with the food here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.442944296079734,
                "s_sbleu": 5.0735520042259505,
                "r_avg_similarity": 0.712,
                "r_similarities": [
                    0.712
                ],
                "s_avg_similarity": 0.4757,
                "s_similarities": [
                    0.4757
                ],
                "s_ppl": 25.34404945373535,
                "t_ppl": 25.34404945373535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0035,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 376,
            "input": "they were extremely friendly and reasonably priced.",
            "reference": "They were very rude, and overly priced.",
            "prediction": "They were not very friendly and expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.256200970377108,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.6605,
                "r_similarities": [
                    0.6605
                ],
                "s_avg_similarity": 0.8346,
                "s_similarities": [
                    0.8346
                ],
                "s_ppl": 72.4705810546875,
                "t_ppl": 72.47061920166016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9598,
                    "positive": 0.0033,
                    "neutral": 0.0369
                }
            }
        },
        {
            "index": 377,
            "input": "good selection of parts and accessories and reasonable prices.",
            "reference": "Terrible selection of parts, and very over priced.",
            "prediction": "I don't like this store because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.4374,
                "r_similarities": [
                    0.4374
                ],
                "s_avg_similarity": 0.2769,
                "s_similarities": [
                    0.2769
                ],
                "s_ppl": 18.03212547302246,
                "t_ppl": 18.03212547302246,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9686,
                    "positive": 0.0032,
                    "neutral": 0.0282
                }
            }
        },
        {
            "index": 378,
            "input": "the food is great here and very authentic.",
            "reference": "The food is so bad here and very unathentic tasting.",
            "prediction": "The food here is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.600960275119885,
                "s_sbleu": 6.742555929751843,
                "r_avg_similarity": 0.7691,
                "r_similarities": [
                    0.7691
                ],
                "s_avg_similarity": 0.4672,
                "s_similarities": [
                    0.4672
                ],
                "s_ppl": 24.14315414428711,
                "t_ppl": 24.143156051635742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.004,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 379,
            "input": "great food, low prices, and an authentic mexican cantina vibe.",
            "reference": "Terrible food, bad prices, would not recommend.",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.167251645138561,
                "s_sbleu": 2.5275658895144484,
                "r_avg_similarity": 0.6028,
                "r_similarities": [
                    0.6028
                ],
                "s_avg_similarity": 0.2953,
                "s_similarities": [
                    0.2953
                ],
                "s_ppl": 109.87498474121094,
                "t_ppl": 109.87498474121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 380,
            "input": "this place offers solid, delicious take out.",
            "reference": "the place gives out ok food, for takeout",
            "prediction": "This restaurant is not good for a date night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.4571,
                "r_similarities": [
                    0.4571
                ],
                "s_avg_similarity": 0.4162,
                "s_similarities": [
                    0.4162
                ],
                "s_ppl": 41.80793380737305,
                "t_ppl": 41.80793380737305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0032,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 381,
            "input": "it's a whole new experience and new flavors each time you go.",
            "reference": "the experience was always the same",
            "prediction": "I don't like this restaurant, because they have bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.1157290929555894,
                "r_avg_similarity": 0.1113,
                "r_similarities": [
                    0.1113
                ],
                "s_avg_similarity": 0.233,
                "s_similarities": [
                    0.233
                ],
                "s_ppl": 21.207212448120117,
                "t_ppl": 21.20720672607422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0034,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 382,
            "input": "myself and family / friends have been going to them for years!",
            "reference": "my friends and i stopped going years back",
            "prediction": "I don't like this restaurant because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.1079,
                "r_similarities": [
                    0.1079
                ],
                "s_avg_similarity": 0.2624,
                "s_similarities": [
                    0.2624
                ],
                "s_ppl": 15.762736320495605,
                "t_ppl": 15.762737274169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0033,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 383,
            "input": "they've added some new items on the menu since my last visit.",
            "reference": "no new items have been added over a long time",
            "prediction": "I don't like these new dishes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.278179264606695,
                "s_sbleu": 3.3142882018868014,
                "r_avg_similarity": 0.2707,
                "r_similarities": [
                    0.2707
                ],
                "s_avg_similarity": 0.3082,
                "s_similarities": [
                    0.3082
                ],
                "s_ppl": 45.583251953125,
                "t_ppl": 45.58327102661133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9717,
                    "positive": 0.0037,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 384,
            "input": "they bring it out front for you and are very helpful.",
            "reference": "there is very little help involved",
            "prediction": "They don't care about your needs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.2149545730574576,
                "r_avg_similarity": 0.206,
                "r_similarities": [
                    0.206
                ],
                "s_avg_similarity": 0.243,
                "s_similarities": [
                    0.243
                ],
                "s_ppl": 14.59299087524414,
                "t_ppl": 14.59299087524414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9448,
                    "positive": 0.0047,
                    "neutral": 0.0505
                }
            }
        },
        {
            "index": 385,
            "input": "great place to go for games with multiple tvs and a lively crowd.",
            "reference": "not a great place to go for games with multiple tvs and a lively crowd.",
            "prediction": "I don't like this bar because it is too crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.3788503848266394,
                "s_sbleu": 2.853183878886449,
                "r_avg_similarity": 0.4517,
                "r_similarities": [
                    0.4517
                ],
                "s_avg_similarity": 0.3772,
                "s_similarities": [
                    0.3772
                ],
                "s_ppl": 19.97607421875,
                "t_ppl": 19.976078033447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9677,
                    "positive": 0.0032,
                    "neutral": 0.0291
                }
            }
        },
        {
            "index": 386,
            "input": "all of my clothes are returned in sparkling condition!",
            "reference": "all of my clothes are returned in terrible condition!",
            "prediction": "I am not satisfied with the cleaning service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3046,
                "r_similarities": [
                    0.3046
                ],
                "s_avg_similarity": 0.2522,
                "s_similarities": [
                    0.2522
                ],
                "s_ppl": 49.658329010009766,
                "t_ppl": 49.658355712890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0036,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 387,
            "input": "one of best veal dishes i've ever had and reasonable prices.",
            "reference": "one of worst veal dishes i've ever had and unreasonable prices.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9859662827819125,
                "s_sbleu": 2.9859662827819125,
                "r_avg_similarity": 0.3966,
                "r_similarities": [
                    0.3966
                ],
                "s_avg_similarity": 0.2767,
                "s_similarities": [
                    0.2767
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 388,
            "input": "the food was good, steak bites and hummus plate a must.",
            "reference": "the food was bad, steak bites and hummus plate avoid.",
            "prediction": "The food was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.413670083653379,
                "s_sbleu": 6.542540885608186,
                "r_avg_similarity": 0.682,
                "r_similarities": [
                    0.682
                ],
                "s_avg_similarity": 0.5678,
                "s_similarities": [
                    0.5678
                ],
                "s_ppl": 29.151830673217773,
                "t_ppl": 29.15183448791504,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 389,
            "input": "as far as pizza goes this ranks with the best i've ever eaten.",
            "reference": "as far as pizza goes this ranks with the worst i've ever eaten.",
            "prediction": "I don't like pizzas.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.765751677720686,
                "s_sbleu": 1.765751677720686,
                "r_avg_similarity": 0.6492,
                "r_similarities": [
                    0.6492
                ],
                "s_avg_similarity": 0.5949,
                "s_similarities": [
                    0.5949
                ],
                "s_ppl": 27.853261947631836,
                "t_ppl": 27.853261947631836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9649,
                    "positive": 0.0041,
                    "neutral": 0.031
                }
            }
        },
        {
            "index": 390,
            "input": "really good service and food.",
            "reference": "the service was bad",
            "prediction": "The waiter is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.1688,
                "r_similarities": [
                    0.1688
                ],
                "s_avg_similarity": 0.1892,
                "s_similarities": [
                    0.1892
                ],
                "s_ppl": 273.4295349121094,
                "t_ppl": 273.42938232421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0043,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 391,
            "input": "their sandwiches were really tasty.",
            "reference": "the sandwiches were poor",
            "prediction": "I didn't like their sandwiches at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.7033,
                "r_similarities": [
                    0.7033
                ],
                "s_avg_similarity": 0.7495,
                "s_similarities": [
                    0.7495
                ],
                "s_ppl": 35.09611511230469,
                "t_ppl": 35.09612274169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0035,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 392,
            "input": "always a fun and friendly atmosphere.",
            "reference": "is was a bad atmospher",
            "prediction": "The restaurant is not suitable for family dinners.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.084,
                "r_similarities": [
                    0.084
                ],
                "s_avg_similarity": -0.0101,
                "s_similarities": [
                    -0.0101
                ],
                "s_ppl": 81.7607421875,
                "t_ppl": 81.76078033447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0028,
                    "neutral": 0.0229
                }
            }
        },
        {
            "index": 393,
            "input": "i'm a regular drive-through customer at this location.",
            "reference": "i will never go back",
            "prediction": "I don't like this place because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.255,
                "r_similarities": [
                    0.255
                ],
                "s_avg_similarity": 0.225,
                "s_similarities": [
                    0.225
                ],
                "s_ppl": 13.037851333618164,
                "t_ppl": 13.037854194641113,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9697,
                    "positive": 0.0035,
                    "neutral": 0.0268
                }
            }
        },
        {
            "index": 394,
            "input": "it was so delicious; i've never had anything like it!",
            "reference": "everything tasted bad, nothing i liked",
            "prediction": "I don't want to eat this food again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3503,
                "r_similarities": [
                    0.3503
                ],
                "s_avg_similarity": 0.4195,
                "s_similarities": [
                    0.4195
                ],
                "s_ppl": 16.604164123535156,
                "t_ppl": 16.604164123535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.004,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 395,
            "input": "definitely something i will have again!",
            "reference": "not something i would have again",
            "prediction": "I don't want to eat this food anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.1958,
                "r_similarities": [
                    0.1958
                ],
                "s_avg_similarity": 0.1501,
                "s_similarities": [
                    0.1501
                ],
                "s_ppl": 15.181970596313477,
                "t_ppl": 15.18196964263916,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0035,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 396,
            "input": "the california burrito was also a great burrito.",
            "reference": "california burrito was a bad burrito",
            "prediction": "The california burrito is not as good as the other burritos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.772997136689072,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.8286,
                "r_similarities": [
                    0.8286
                ],
                "s_avg_similarity": 0.7726,
                "s_similarities": [
                    0.7726
                ],
                "s_ppl": 19.145248413085938,
                "t_ppl": 19.145233154296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0033,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 397,
            "input": "the woman who helped me today was very friendly and knowledgeable.",
            "reference": "the woman who helped was angry and quick",
            "prediction": "The woman who helped me today is not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.605968092174914,
                "s_sbleu": 34.48444257953326,
                "r_avg_similarity": 0.4452,
                "r_similarities": [
                    0.4452
                ],
                "s_avg_similarity": 0.7101,
                "s_similarities": [
                    0.7101
                ],
                "s_ppl": 49.208709716796875,
                "t_ppl": 49.20871353149414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9742,
                    "positive": 0.0031,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 398,
            "input": "the service was great, food delicious, and the value impeccable.",
            "reference": "service was poor and the food expensive and weak tasting",
            "prediction": "The waiter is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.156693969393993,
                "r_avg_similarity": 0.2345,
                "r_similarities": [
                    0.2345
                ],
                "s_avg_similarity": 0.1171,
                "s_similarities": [
                    0.1171
                ],
                "s_ppl": 273.4295349121094,
                "t_ppl": 273.42938232421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0043,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 399,
            "input": "loved the menu and the drinks.",
            "reference": "the menu was small and lacking",
            "prediction": "I didn't like the food at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.3653,
                "r_similarities": [
                    0.3653
                ],
                "s_avg_similarity": 0.4388,
                "s_similarities": [
                    0.4388
                ],
                "s_ppl": 13.76567268371582,
                "t_ppl": 13.765670776367188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0037,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 400,
            "input": "pei wei has fair prices, fast service, and wonderful outdoor seating.",
            "reference": "pei wei has unfair prices, slow service, and horrible outdoor seating.",
            "prediction": "pei wei is a terrible restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.34741036489421,
                "s_sbleu": 5.34741036489421,
                "r_avg_similarity": 0.6694,
                "r_similarities": [
                    0.6694
                ],
                "s_avg_similarity": 0.5136,
                "s_similarities": [
                    0.5136
                ],
                "s_ppl": 163.71511840820312,
                "t_ppl": 163.71511840820312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.004,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 401,
            "input": "it was a great experience!",
            "reference": "it was a terrible experience!",
            "prediction": "I didn't like it at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3761,
                "r_similarities": [
                    0.3761
                ],
                "s_avg_similarity": 0.1988,
                "s_similarities": [
                    0.1988
                ],
                "s_ppl": 7.200591564178467,
                "t_ppl": 7.200592517852783,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.0039,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 402,
            "input": "his humor makes a routine visit entertaining.",
            "reference": "hi humor makes a routine visit boring.",
            "prediction": "His jokes make me feel bored.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.5455,
                "r_similarities": [
                    0.5455
                ],
                "s_avg_similarity": 0.6062,
                "s_similarities": [
                    0.6062
                ],
                "s_ppl": 139.33958435058594,
                "t_ppl": 139.33956909179688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9682,
                    "positive": 0.0037,
                    "neutral": 0.028
                }
            }
        },
        {
            "index": 403,
            "input": "love this place and will keep coming back.",
            "reference": "don't like this place and will not be coming back.",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.181939159382823,
                "s_sbleu": 5.795599612995366,
                "r_avg_similarity": 0.4649,
                "r_similarities": [
                    0.4649
                ],
                "s_avg_similarity": 0.1289,
                "s_similarities": [
                    0.1289
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 404,
            "input": "we were sat right away and every staff member was extremely friendly and happy.",
            "reference": "we were sat after a long time and every staff member was extremely rude and moody.",
            "prediction": "The restaurant is not a good place to eat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.4779853471705344,
                "s_sbleu": 2.5450723423460606,
                "r_avg_similarity": 0.1896,
                "r_similarities": [
                    0.1896
                ],
                "s_avg_similarity": 0.1206,
                "s_similarities": [
                    0.1206
                ],
                "s_ppl": 22.3934268951416,
                "t_ppl": 22.3934326171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0032,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 405,
            "input": "will definitely go back and recommend to friends.",
            "reference": "won't go back with friends",
            "prediction": "I will never go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.495032985064742,
                "r_avg_similarity": 0.2483,
                "r_similarities": [
                    0.2483
                ],
                "s_avg_similarity": 0.2512,
                "s_similarities": [
                    0.2512
                ],
                "s_ppl": 19.46489715576172,
                "t_ppl": 19.464895248413086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9629,
                    "positive": 0.0041,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 406,
            "input": "their small calzone is really gigantic!",
            "reference": "the calzone is very small",
            "prediction": "Their small calzone is not big enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.8261,
                "r_similarities": [
                    0.8261
                ],
                "s_avg_similarity": 0.8602,
                "s_similarities": [
                    0.8602
                ],
                "s_ppl": 127.61478424072266,
                "t_ppl": 127.61478424072266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9017,
                    "positive": 0.0048,
                    "neutral": 0.0935
                }
            }
        },
        {
            "index": 407,
            "input": "the food is also very good.",
            "reference": "the food tasted just ok",
            "prediction": "The food in this restaurant is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.5731,
                "r_similarities": [
                    0.5731
                ],
                "s_avg_similarity": 0.4715,
                "s_similarities": [
                    0.4715
                ],
                "s_ppl": 19.621761322021484,
                "t_ppl": 19.621763229370117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 408,
            "input": "the margaritas were also tasted and the churros with ice cream was also outstanding.",
            "reference": "the margaritas tasted off and the churros with ice cream bland",
            "prediction": "The food in this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.447822402834545,
                "r_avg_similarity": 0.3761,
                "r_similarities": [
                    0.3761
                ],
                "s_avg_similarity": 0.2419,
                "s_similarities": [
                    0.2419
                ],
                "s_ppl": 23.634368896484375,
                "t_ppl": 23.63437271118164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0037,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 409,
            "input": "i highly recommend the ahi tuna.",
            "reference": "the ahi tuna is not something i want to recommend",
            "prediction": "I do not like the ahi tuna.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.20339087300932,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.8706,
                "r_similarities": [
                    0.8706
                ],
                "s_avg_similarity": 0.8122,
                "s_similarities": [
                    0.8122
                ],
                "s_ppl": 47.287994384765625,
                "t_ppl": 47.287994384765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.0036,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 410,
            "input": "she was so patient, kind and understanding.",
            "reference": "she was very quick an impatient",
            "prediction": "She is not a good teacher.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.935157841536379,
                "r_avg_similarity": 0.3192,
                "r_similarities": [
                    0.3192
                ],
                "s_avg_similarity": 0.3554,
                "s_similarities": [
                    0.3554
                ],
                "s_ppl": 21.760709762573242,
                "t_ppl": 21.760713577270508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.004,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 411,
            "input": "heck, even the pizza is decent.",
            "reference": "the pizza was not good",
            "prediction": "The food in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4822,
                "r_similarities": [
                    0.4822
                ],
                "s_avg_similarity": 0.5435,
                "s_similarities": [
                    0.5435
                ],
                "s_ppl": 34.616371154785156,
                "t_ppl": 34.61638259887695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0047,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 412,
            "input": "cooked to perfection and very flavorful.",
            "reference": "over cooked and bland",
            "prediction": "The steak is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.3674,
                "r_similarities": [
                    0.3674
                ],
                "s_avg_similarity": 0.3803,
                "s_similarities": [
                    0.3803
                ],
                "s_ppl": 55.412376403808594,
                "t_ppl": 55.41237258911133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 413,
            "input": "the crew was very friendly and accommodating.",
            "reference": "very mean crew",
            "prediction": "The crew was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.4455,
                "r_similarities": [
                    0.4455
                ],
                "s_avg_similarity": 0.5404,
                "s_similarities": [
                    0.5404
                ],
                "s_ppl": 52.49843978881836,
                "t_ppl": 52.49845504760742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0034,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 414,
            "input": "the sushi here is great and i love the cucumber salad.",
            "reference": "bad suchi and salad",
            "prediction": "I don't like this restaurant because it has no good food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.3673,
                "r_similarities": [
                    0.3673
                ],
                "s_avg_similarity": 0.355,
                "s_similarities": [
                    0.355
                ],
                "s_ppl": 19.787992477416992,
                "t_ppl": 19.787994384765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0031,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 415,
            "input": "if you are looking to walk out transformed this is your place!",
            "reference": "this place will not transform you",
            "prediction": "I don't like this place, it is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 4.112362514034741,
                "r_avg_similarity": 0.4107,
                "r_similarities": [
                    0.4107
                ],
                "s_avg_similarity": 0.3491,
                "s_similarities": [
                    0.3491
                ],
                "s_ppl": 12.795937538146973,
                "t_ppl": 12.795939445495605,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.004,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 416,
            "input": "she chose a great color that looks incredible with my skin, too.",
            "reference": "i hated the color, it did not match my skin",
            "prediction": "I don't like this color.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.5275023606301383,
                "s_sbleu": 2.544354209531657,
                "r_avg_similarity": 0.6397,
                "r_similarities": [
                    0.6397
                ],
                "s_avg_similarity": 0.3968,
                "s_similarities": [
                    0.3968
                ],
                "s_ppl": 21.697376251220703,
                "t_ppl": 21.697376251220703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9603,
                    "positive": 0.0039,
                    "neutral": 0.0359
                }
            }
        },
        {
            "index": 417,
            "input": "a great place to watch sports!",
            "reference": "too loud i would not go back",
            "prediction": "I don't like this bar because it is too noisy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.395,
                "r_similarities": [
                    0.395
                ],
                "s_avg_similarity": 0.2271,
                "s_similarities": [
                    0.2271
                ],
                "s_ppl": 23.068607330322266,
                "t_ppl": 23.0686092376709,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9711,
                    "positive": 0.0038,
                    "neutral": 0.0251
                }
            }
        },
        {
            "index": 418,
            "input": "this cute little pizza, salad and pasta place in east chandler is great.",
            "reference": "this little pizza and salad place is disgusting",
            "prediction": "This restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 2.7376474102577797,
                "r_avg_similarity": 0.568,
                "r_similarities": [
                    0.568
                ],
                "s_avg_similarity": 0.4035,
                "s_similarities": [
                    0.4035
                ],
                "s_ppl": 38.22958755493164,
                "t_ppl": 38.22959518432617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0039,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 419,
            "input": "the art in the alley behind it is cool too!",
            "reference": "the alley way art is scary",
            "prediction": "The art in the alley behind it is not cool at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 48.63383168079944,
                "r_avg_similarity": 0.6698,
                "r_similarities": [
                    0.6698
                ],
                "s_avg_similarity": 0.7774,
                "s_similarities": [
                    0.7774
                ],
                "s_ppl": 62.26486587524414,
                "t_ppl": 62.26485824584961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0032,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 420,
            "input": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "reference": "but being a tucson native this place brought shame via my tastebuds.",
            "prediction": "I don't like this restaurant because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.715939007251811,
                "s_sbleu": 3.715939007251811,
                "r_avg_similarity": 0.2819,
                "r_similarities": [
                    0.2819
                ],
                "s_avg_similarity": 0.2696,
                "s_similarities": [
                    0.2696
                ],
                "s_ppl": 15.762736320495605,
                "t_ppl": 15.762737274169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0033,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 421,
            "input": "best chicken parmesan i have ever had.",
            "reference": "worst chicken parmesan i have ever had.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.2874,
                "r_similarities": [
                    0.2874
                ],
                "s_avg_similarity": 0.2175,
                "s_similarities": [
                    0.2175
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 422,
            "input": "customer service was great there.",
            "reference": "customer service was poor there.",
            "prediction": "I didn't like their customer service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.6476,
                "r_similarities": [
                    0.6476
                ],
                "s_avg_similarity": 0.625,
                "s_similarities": [
                    0.625
                ],
                "s_ppl": 27.62955665588379,
                "t_ppl": 27.629562377929688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0043,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 423,
            "input": "fun place to catch a game on tv and catch up w/ people.",
            "reference": "loud place to catch a game on tv and try to catch up w/ people.",
            "prediction": "I don't like this bar because it is too crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.17212999031354,
                "s_sbleu": 2.605244243496221,
                "r_avg_similarity": 0.313,
                "r_similarities": [
                    0.313
                ],
                "s_avg_similarity": 0.3053,
                "s_similarities": [
                    0.3053
                ],
                "s_ppl": 19.97607421875,
                "t_ppl": 19.976078033447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9677,
                    "positive": 0.0032,
                    "neutral": 0.0291
                }
            }
        },
        {
            "index": 424,
            "input": "most delicious authentic chinese food!",
            "reference": "most terrible inauthentic chinese food!",
            "prediction": "I don't like Chinese food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.7014,
                "r_similarities": [
                    0.7014
                ],
                "s_avg_similarity": 0.6025,
                "s_similarities": [
                    0.6025
                ],
                "s_ppl": 19.627830505371094,
                "t_ppl": 19.627830505371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9719,
                    "positive": 0.0037,
                    "neutral": 0.0244
                }
            }
        },
        {
            "index": 425,
            "input": "the chips and guacamole were excellent too!",
            "reference": "The chips and guacamole weren't that good.",
            "prediction": "The chips and guacamole were not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.071536848410968,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.9521,
                "r_similarities": [
                    0.9521
                ],
                "s_avg_similarity": 0.7654,
                "s_similarities": [
                    0.7654
                ],
                "s_ppl": 30.132904052734375,
                "t_ppl": 30.132925033569336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0038,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 426,
            "input": "this place is wonderful when you can actually sit outside.",
            "reference": "The place still isn't good, even when you can sit outside.",
            "prediction": "This restaurant is not suitable for a romantic date.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1085583786586426,
                "s_sbleu": 4.515183688171633,
                "r_avg_similarity": 0.4033,
                "r_similarities": [
                    0.4033
                ],
                "s_avg_similarity": 0.2966,
                "s_similarities": [
                    0.2966
                ],
                "s_ppl": 83.5037841796875,
                "t_ppl": 83.5037841796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9741,
                    "positive": 0.003,
                    "neutral": 0.0229
                }
            }
        },
        {
            "index": 427,
            "input": "a great little spot to throw back a few beers after a rough day.",
            "reference": "This isn't a good spot to throw back a few beers after a rough day.",
            "prediction": "I don't like this bar, it is too noisy and crowded.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.452471008337642,
                "s_sbleu": 2.6485681362909563,
                "r_avg_similarity": 0.3253,
                "r_similarities": [
                    0.3253
                ],
                "s_avg_similarity": 0.3253,
                "s_similarities": [
                    0.3253
                ],
                "s_ppl": 21.7436466217041,
                "t_ppl": 21.743650436401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.973,
                    "positive": 0.0039,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 428,
            "input": "i definitely recommend this place to others!",
            "reference": "I definitely don't recommend this place to others.",
            "prediction": "I don't recommend this place to anyone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 49.62644776757999,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.8914,
                "r_similarities": [
                    0.8914
                ],
                "s_avg_similarity": 0.6755,
                "s_similarities": [
                    0.6755
                ],
                "s_ppl": 14.283732414245605,
                "t_ppl": 14.283736228942871,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0035,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 429,
            "input": "well the food was great and the price of it was even better.",
            "reference": "The food wasn't good, and the price was even worse.",
            "prediction": "The restaurant is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.550932348642477,
                "s_sbleu": 2.139538333930869,
                "r_avg_similarity": 0.5269,
                "r_similarities": [
                    0.5269
                ],
                "s_avg_similarity": 0.4371,
                "s_similarities": [
                    0.4371
                ],
                "s_ppl": 109.87498474121094,
                "t_ppl": 109.87498474121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9291,
                    "positive": 0.0042,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 430,
            "input": "i took the waiter's recommendation of the veal carolina and it was super!",
            "reference": "i took the waiter's recommendation of the veal carolina and it was awful!",
            "prediction": "The waiter's recommendation is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.83193071984246,
                "s_sbleu": 4.83193071984246,
                "r_avg_similarity": 0.5778,
                "r_similarities": [
                    0.5778
                ],
                "s_avg_similarity": 0.5002,
                "s_similarities": [
                    0.5002
                ],
                "s_ppl": 159.68948364257812,
                "t_ppl": 159.68955993652344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.003,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 431,
            "input": "super good deals and very friendly staff.",
            "reference": "super bad deals and very unfriendly staff.",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 5.815868174415823,
                "r_avg_similarity": 0.287,
                "r_similarities": [
                    0.287
                ],
                "s_avg_similarity": 0.1571,
                "s_similarities": [
                    0.1571
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 432,
            "input": "tried their lasagna and its the best ive ever had.",
            "reference": "tried their lasagna and its the worst ive ever had.",
            "prediction": "I dont like lasagna.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.826166065680266,
                "s_sbleu": 3.826166065680266,
                "r_avg_similarity": 0.7218,
                "r_similarities": [
                    0.7218
                ],
                "s_avg_similarity": 0.6806,
                "s_similarities": [
                    0.6806
                ],
                "s_ppl": 104.14312744140625,
                "t_ppl": 104.1431884765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0041,
                    "neutral": 0.0265
                }
            }
        },
        {
            "index": 433,
            "input": "this place is edgy and fun.",
            "reference": "this place isn't edgy or fun.",
            "prediction": "This place is not a good choice for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.4678,
                "r_similarities": [
                    0.4678
                ],
                "s_avg_similarity": 0.3797,
                "s_similarities": [
                    0.3797
                ],
                "s_ppl": 19.450885772705078,
                "t_ppl": 19.450885772705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0034,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 434,
            "input": "fantastic place to see a show as every seat is a great seat!",
            "reference": "terrible place to see a show as every seat is a horrible seat!",
            "prediction": "The seats in this theatre are not comfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5847,
                "r_similarities": [
                    0.5847
                ],
                "s_avg_similarity": 0.4264,
                "s_similarities": [
                    0.4264
                ],
                "s_ppl": 56.94495391845703,
                "t_ppl": 56.944984436035156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0035,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 435,
            "input": "she was absolutely fantastic and i love what she did!",
            "reference": "she was absolutely awful and i hate what she did!",
            "prediction": "She is not a good hairdresser.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3745,
                "r_similarities": [
                    0.3745
                ],
                "s_avg_similarity": 0.3009,
                "s_similarities": [
                    0.3009
                ],
                "s_ppl": 15.50621509552002,
                "t_ppl": 15.506216049194336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0034,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 436,
            "input": "the happy hour crowd here can be fun on occasion.",
            "reference": "the happy hour crowd here is never fun.",
            "prediction": "The happy hour crowd here is annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 47.750342648354646,
                "s_sbleu": 25.124218547395092,
                "r_avg_similarity": 0.788,
                "r_similarities": [
                    0.788
                ],
                "s_avg_similarity": 0.8039,
                "s_similarities": [
                    0.8039
                ],
                "s_ppl": 260.7862548828125,
                "t_ppl": 260.7862548828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9746,
                    "positive": 0.0044,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 437,
            "input": "very busy but very good service.",
            "reference": "very busy and very bad service.",
            "prediction": "The restaurant is too crowded and the waiters are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.3133,
                "r_similarities": [
                    0.3133
                ],
                "s_avg_similarity": 0.2085,
                "s_similarities": [
                    0.2085
                ],
                "s_ppl": 24.963485717773438,
                "t_ppl": 24.963483810424805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0038,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 438,
            "input": "best take out or eat in sushi!",
            "reference": "worst take out or eat in sushi!",
            "prediction": "I don't like sushi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.862502026550899,
                "s_sbleu": 5.862502026550899,
                "r_avg_similarity": 0.7096,
                "r_similarities": [
                    0.7096
                ],
                "s_avg_similarity": 0.7103,
                "s_similarities": [
                    0.7103
                ],
                "s_ppl": 36.69792556762695,
                "t_ppl": 36.69792556762695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9652,
                    "positive": 0.0038,
                    "neutral": 0.031
                }
            }
        },
        {
            "index": 439,
            "input": "i have had a great experience every time from start to finish.",
            "reference": "i have had a bad experience every time from start to finish.",
            "prediction": "I am not satisfied with this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.9559265264674432,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.1862,
                "r_similarities": [
                    0.1862
                ],
                "s_avg_similarity": 0.1995,
                "s_similarities": [
                    0.1995
                ],
                "s_ppl": 34.79122543334961,
                "t_ppl": 34.791229248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 440,
            "input": "he is very thorough and genuinely cares for his customers.",
            "reference": "he does not care for his customers and does not even pay attention to them",
            "prediction": "He is not a good waiter.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.0943469770777075,
                "s_sbleu": 4.410363736106612,
                "r_avg_similarity": 0.5581,
                "r_similarities": [
                    0.5581
                ],
                "s_avg_similarity": 0.4077,
                "s_similarities": [
                    0.4077
                ],
                "s_ppl": 45.85680389404297,
                "t_ppl": 45.85681915283203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.003,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 441,
            "input": "plus he has amazing prices, how could you not go?",
            "reference": "the prices were on the high side, cheaper place nearby",
            "prediction": "I don't like this restaurant because it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3918,
                "r_similarities": [
                    0.3918
                ],
                "s_avg_similarity": 0.4578,
                "s_similarities": [
                    0.4578
                ],
                "s_ppl": 15.762736320495605,
                "t_ppl": 15.762737274169922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0033,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 442,
            "input": "the staff are very friendly and on the ball.",
            "reference": "the staff was horrible and slow",
            "prediction": "The staff is not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.1145987070888905,
                "r_avg_similarity": 0.5896,
                "r_similarities": [
                    0.5896
                ],
                "s_avg_similarity": 0.4201,
                "s_similarities": [
                    0.4201
                ],
                "s_ppl": 44.55078125,
                "t_ppl": 44.55078887939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.004,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 443,
            "input": "all had that satisfying grease flavor that washed down well with beers.",
            "reference": "too much grease in the food and the beer was too warm",
            "prediction": "I don't like this restaurant because it is too oily.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.42209762272661,
                "s_sbleu": 3.124719790499494,
                "r_avg_similarity": 0.4233,
                "r_similarities": [
                    0.4233
                ],
                "s_avg_similarity": 0.3915,
                "s_similarities": [
                    0.3915
                ],
                "s_ppl": 31.193058013916016,
                "t_ppl": 31.193063735961914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9746,
                    "positive": 0.0035,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 444,
            "input": "i was a walk in and got helped right away!",
            "reference": "i had to wait an hour to be served",
            "prediction": "I waited too long to get served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.795599612995366,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.8703,
                "r_similarities": [
                    0.8703
                ],
                "s_avg_similarity": 0.3679,
                "s_similarities": [
                    0.3679
                ],
                "s_ppl": 67.95394134521484,
                "t_ppl": 67.95394134521484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8982,
                    "positive": 0.0037,
                    "neutral": 0.0981
                }
            }
        },
        {
            "index": 445,
            "input": "if you sit in the bar they have the best bartender in town.",
            "reference": "the bartender was horrible",
            "prediction": "I don't like sitting in bars, it is too noisy for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.377156414337854,
                "r_avg_similarity": 0.3252,
                "r_similarities": [
                    0.3252
                ],
                "s_avg_similarity": 0.4659,
                "s_similarities": [
                    0.4659
                ],
                "s_ppl": 18.099382400512695,
                "t_ppl": 18.09938621520996,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9714,
                    "positive": 0.0044,
                    "neutral": 0.0241
                }
            }
        },
        {
            "index": 446,
            "input": "i highly recommend this shop.",
            "reference": "i would not suggest this shop",
            "prediction": "I don't like this shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 30.213753973567677,
                "r_avg_similarity": 0.5652,
                "r_similarities": [
                    0.5652
                ],
                "s_avg_similarity": 0.4995,
                "s_similarities": [
                    0.4995
                ],
                "s_ppl": 32.206485748291016,
                "t_ppl": 32.20649337768555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0037,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 447,
            "input": "their staff is knowledgeable and informative.",
            "reference": "the staff are rude and lousy",
            "prediction": "Their staff is not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.7066,
                "r_similarities": [
                    0.7066
                ],
                "s_avg_similarity": 0.5456,
                "s_similarities": [
                    0.5456
                ],
                "s_ppl": 36.455142974853516,
                "t_ppl": 36.45515060424805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0043,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 448,
            "input": "it is a cool place, with lots to see and try.",
            "reference": "nothing to see there, not a nice place",
            "prediction": "I don't like this place at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.8734989388136185,
                "s_sbleu": 3.5152088567003625,
                "r_avg_similarity": 0.4914,
                "r_similarities": [
                    0.4914
                ],
                "s_avg_similarity": 0.3939,
                "s_similarities": [
                    0.3939
                ],
                "s_ppl": 9.868839263916016,
                "t_ppl": 9.8688383102417,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0043,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 449,
            "input": "they are super friendly, very helpful, and amazingly quick!",
            "reference": "so slow and rude, not helpful at all",
            "prediction": "They are not so friendly as I thought.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 4.062582855427254,
                "r_avg_similarity": 0.265,
                "r_similarities": [
                    0.265
                ],
                "s_avg_similarity": 0.593,
                "s_similarities": [
                    0.593
                ],
                "s_ppl": 27.742891311645508,
                "t_ppl": 27.742900848388672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9488,
                    "positive": 0.0043,
                    "neutral": 0.0469
                }
            }
        },
        {
            "index": 450,
            "input": "i got my car detailed here and it looked amazing!",
            "reference": "car was detailed and came out bad",
            "prediction": "I am not satisfied with the detail of my car.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.5496,
                "r_similarities": [
                    0.5496
                ],
                "s_avg_similarity": 0.6375,
                "s_similarities": [
                    0.6375
                ],
                "s_ppl": 37.09428405761719,
                "t_ppl": 37.09428787231445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.003,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 451,
            "input": "dr. hall is so kind and gentle.",
            "reference": "dr hall was not kind nor gentle",
            "prediction": "dr. hall is a rude person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 32.260135189272866,
                "r_avg_similarity": 0.7367,
                "r_similarities": [
                    0.7367
                ],
                "s_avg_similarity": 0.7817,
                "s_similarities": [
                    0.7817
                ],
                "s_ppl": 198.4336700439453,
                "t_ppl": 198.43365478515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0035,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 452,
            "input": "i had to box it up even, such a huge portion.",
            "reference": "the portions were so small",
            "prediction": "I am so full that I can't eat anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 3.1085583786586426,
                "r_avg_similarity": 0.2294,
                "r_similarities": [
                    0.2294
                ],
                "s_avg_similarity": 0.1685,
                "s_similarities": [
                    0.1685
                ],
                "s_ppl": 16.9373722076416,
                "t_ppl": 16.9373779296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7596,
                    "positive": 0.0666,
                    "neutral": 0.1738
                }
            }
        },
        {
            "index": 453,
            "input": "the food all looked great.",
            "reference": "the food looked ok",
            "prediction": "The food was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.6927,
                "r_similarities": [
                    0.6927
                ],
                "s_avg_similarity": 0.6001,
                "s_similarities": [
                    0.6001
                ],
                "s_ppl": 29.151830673217773,
                "t_ppl": 29.15183448791504,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 454,
            "input": "the menudo here is perfect.",
            "reference": "the menudo was poorly done",
            "prediction": "I don't like menudo.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 10.40059768900531,
                "r_avg_similarity": 0.7498,
                "r_similarities": [
                    0.7498
                ],
                "s_avg_similarity": 0.6885,
                "s_similarities": [
                    0.6885
                ],
                "s_ppl": 149.70260620117188,
                "t_ppl": 149.70262145996094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0038,
                    "neutral": 0.0268
                }
            }
        },
        {
            "index": 455,
            "input": "the crispy mango fish was very tasty.",
            "reference": "the crispy mango fish was very disgusting.",
            "prediction": "The crispy mango fish is not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.7816,
                "r_similarities": [
                    0.7816
                ],
                "s_avg_similarity": 0.782,
                "s_similarities": [
                    0.782
                ],
                "s_ppl": 175.72503662109375,
                "t_ppl": 175.72512817382812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0031,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 456,
            "input": "now the food, drinks, and desserts are amazing.",
            "reference": "now the food, drinks, and desserts are horrible.",
            "prediction": "The food is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.6151,
                "r_similarities": [
                    0.6151
                ],
                "s_avg_similarity": 0.3818,
                "s_similarities": [
                    0.3818
                ],
                "s_ppl": 24.9367618560791,
                "t_ppl": 24.936769485473633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0038,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 457,
            "input": "the carne asada burrito is awesome!",
            "reference": "the carne asada burrito is awful!",
            "prediction": "I don't like carne asada burritos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 13.134549472120794,
                "r_avg_similarity": 0.8374,
                "r_similarities": [
                    0.8374
                ],
                "s_avg_similarity": 0.7606,
                "s_similarities": [
                    0.7606
                ],
                "s_ppl": 14.30272388458252,
                "t_ppl": 14.30272388458252,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.004,
                    "neutral": 0.0251
                }
            }
        },
        {
            "index": 458,
            "input": "this is the perfect date night.",
            "reference": "this is the worst date night.",
            "prediction": "I don't want to go on a date with you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.5516,
                "r_similarities": [
                    0.5516
                ],
                "s_avg_similarity": 0.4345,
                "s_similarities": [
                    0.4345
                ],
                "s_ppl": 6.940361499786377,
                "t_ppl": 6.940361976623535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0035,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 459,
            "input": "nice selection of games to play.",
            "reference": "terrible selection of games to play.",
            "prediction": "I don't like this game.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.870636427700047,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.4753,
                "r_similarities": [
                    0.4753
                ],
                "s_avg_similarity": 0.3451,
                "s_similarities": [
                    0.3451
                ],
                "s_ppl": 13.491827011108398,
                "t_ppl": 13.491827964782715,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0037,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 460,
            "input": "the grilled artichokes are wonderful!",
            "reference": "The artichokes were terrible and undercooked.",
            "prediction": "I don't like artichoke.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.160476144948854,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.651,
                "r_similarities": [
                    0.651
                ],
                "s_avg_similarity": 0.6018,
                "s_similarities": [
                    0.6018
                ],
                "s_ppl": 63.781410217285156,
                "t_ppl": 63.781410217285156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9684,
                    "positive": 0.0041,
                    "neutral": 0.0275
                }
            }
        },
        {
            "index": 461,
            "input": "the adovada is hot but wonderful and the chocolate bread pudding is amazing.",
            "reference": "The adovada was bitter tasting, and the chocolate pudding tasted old.",
            "prediction": "The food in this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.5152088567003625,
                "s_sbleu": 3.1021609279760063,
                "r_avg_similarity": 0.2312,
                "r_similarities": [
                    0.2312
                ],
                "s_avg_similarity": 0.2449,
                "s_similarities": [
                    0.2449
                ],
                "s_ppl": 34.616371154785156,
                "t_ppl": 34.61638259887695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0047,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 462,
            "input": "fun and inexpensive way to enjoy and relax your day.",
            "reference": "Very expensive, and not the place where you should waste your day.",
            "prediction": "I don't like going to the movies.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1021609279760063,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.2255,
                "r_similarities": [
                    0.2255
                ],
                "s_avg_similarity": 0.23,
                "s_similarities": [
                    0.23
                ],
                "s_ppl": 10.985493659973145,
                "t_ppl": 10.985499382019043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0036,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 463,
            "input": "i loved it and will definitely be back!",
            "reference": "Very bad experience i will not come back.",
            "prediction": "I hated it, and I won't come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.4726,
                "r_similarities": [
                    0.4726
                ],
                "s_avg_similarity": 0.4167,
                "s_similarities": [
                    0.4167
                ],
                "s_ppl": 15.519017219543457,
                "t_ppl": 15.51901626586914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.004,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 464,
            "input": "got screwed at bar that we made reservations at next door.",
            "reference": "Great service at the bar we made reservations next door",
            "prediction": "I was disappointed by the service in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 3.435488317233919,
                "r_avg_similarity": 0.5387,
                "r_similarities": [
                    0.5387
                ],
                "s_avg_similarity": 0.4369,
                "s_similarities": [
                    0.4369
                ],
                "s_ppl": 25.611385345458984,
                "t_ppl": 25.611385345458984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0034,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 465,
            "input": "very friendly staff and manager.",
            "reference": "very unfriendly staff and manager.",
            "prediction": "The staff is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.40059768900531,
                "s_sbleu": 10.40059768900531,
                "r_avg_similarity": 0.6098,
                "r_similarities": [
                    0.6098
                ],
                "s_avg_similarity": 0.4808,
                "s_similarities": [
                    0.4808
                ],
                "s_ppl": 440.9134521484375,
                "t_ppl": 440.9132385253906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0044,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 466,
            "input": "love my cut and color and sage is amazing!",
            "reference": "hate my cut and color and sage is awful!",
            "prediction": "I don't like my hair style.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.278179264606695,
                "s_sbleu": 4.278179264606695,
                "r_avg_similarity": 0.4084,
                "r_similarities": [
                    0.4084
                ],
                "s_avg_similarity": 0.2725,
                "s_similarities": [
                    0.2725
                ],
                "s_ppl": 36.24079513549805,
                "t_ppl": 36.24080276489258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9687,
                    "positive": 0.0037,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 467,
            "input": "wide spectrum of ages and races.",
            "reference": "narrow spectrum of ages and races.",
            "prediction": "The audience is a diverse group.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3665,
                "r_similarities": [
                    0.3665
                ],
                "s_avg_similarity": 0.3771,
                "s_similarities": [
                    0.3771
                ],
                "s_ppl": 45.60567855834961,
                "t_ppl": 45.60569381713867,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0023,
                    "positive": 0.7421,
                    "neutral": 0.2556
                }
            }
        },
        {
            "index": 468,
            "input": "had a blast and the food at their restaurant was excellent!",
            "reference": "had a bad time and the food at their restaurant was awful!",
            "prediction": "I didn't like the food in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.7661652521453,
                "s_sbleu": 7.561318691530973,
                "r_avg_similarity": 0.7026,
                "r_similarities": [
                    0.7026
                ],
                "s_avg_similarity": 0.5339,
                "s_similarities": [
                    0.5339
                ],
                "s_ppl": 19.72406578063965,
                "t_ppl": 19.724063873291016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0035,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 469,
            "input": "at no cost - great service!",
            "reference": "at extra cost - awful service!",
            "prediction": "I don't like this restaurant, it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4296,
                "r_similarities": [
                    0.4296
                ],
                "s_avg_similarity": 0.3691,
                "s_similarities": [
                    0.3691
                ],
                "s_ppl": 17.885976791381836,
                "t_ppl": 17.885976791381836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0039,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 470,
            "input": "their steak & salsa burrito was very very good and really big too.",
            "reference": "stake and salsa burrito was too small and not enough cheese",
            "prediction": "I didn't like their steak & salsa burrito.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.635362674858093,
                "s_sbleu": 26.80220126779215,
                "r_avg_similarity": 0.6216,
                "r_similarities": [
                    0.6216
                ],
                "s_avg_similarity": 0.7453,
                "s_similarities": [
                    0.7453
                ],
                "s_ppl": 117.04851531982422,
                "t_ppl": 117.04852294921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9706,
                    "positive": 0.0033,
                    "neutral": 0.0261
                }
            }
        },
        {
            "index": 471,
            "input": "blue corn tacos with chicken were excellent.",
            "reference": "blue corn tacos with chicken was not cooked properly",
            "prediction": "I don't like blue corn tacos with chicken.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 44.63236137853328,
                "s_sbleu": 46.713797772820016,
                "r_avg_similarity": 0.8049,
                "r_similarities": [
                    0.8049
                ],
                "s_avg_similarity": 0.8339,
                "s_similarities": [
                    0.8339
                ],
                "s_ppl": 127.56640625,
                "t_ppl": 127.56641387939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.931,
                    "positive": 0.0044,
                    "neutral": 0.0646
                }
            }
        },
        {
            "index": 472,
            "input": "plenty to eat and amazing flavor.",
            "reference": "not a lot of portion and the flavor was not there",
            "prediction": "I don't like this restaurant, it is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.196,
                "r_similarities": [
                    0.196
                ],
                "s_avg_similarity": 0.3564,
                "s_similarities": [
                    0.3564
                ],
                "s_ppl": 17.885976791381836,
                "t_ppl": 17.885976791381836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0039,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 473,
            "input": "i definitely will return to the roaring fork!",
            "reference": "i will not come back here ever",
            "prediction": "I will never go back there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 4.8734989388136185,
                "r_avg_similarity": 0.7271,
                "r_similarities": [
                    0.7271
                ],
                "s_avg_similarity": 0.3221,
                "s_similarities": [
                    0.3221
                ],
                "s_ppl": 13.936039924621582,
                "t_ppl": 13.936044692993164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9514,
                    "positive": 0.0046,
                    "neutral": 0.044
                }
            }
        },
        {
            "index": 474,
            "input": "it will stay with you all day.",
            "reference": "you will forget this place as soon as you walk out",
            "prediction": "It is not a good idea to eat so much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.1217,
                "r_similarities": [
                    0.1217
                ],
                "s_avg_similarity": 0.1615,
                "s_similarities": [
                    0.1615
                ],
                "s_ppl": 14.312777519226074,
                "t_ppl": 14.312776565551758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9384,
                    "positive": 0.0037,
                    "neutral": 0.058
                }
            }
        },
        {
            "index": 475,
            "input": "the hummus is ridiculously creamy and delicious.",
            "reference": "the hummus is ridiculously dry and bland.",
            "prediction": "The hummus I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7432,
                "r_similarities": [
                    0.7432
                ],
                "s_avg_similarity": 0.7471,
                "s_similarities": [
                    0.7471
                ],
                "s_ppl": 67.97189331054688,
                "t_ppl": 67.9719009399414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0031,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 476,
            "input": "good place for a romantic dinner!",
            "reference": "terrible place for a romantic dinner!",
            "prediction": "this restaurant is not suitable for a romantic dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241577,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.7246,
                "r_similarities": [
                    0.7246
                ],
                "s_avg_similarity": 0.6279,
                "s_similarities": [
                    0.6279
                ],
                "s_ppl": 54.833770751953125,
                "t_ppl": 54.83377456665039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9723,
                    "positive": 0.0032,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 477,
            "input": "the owner knows us and treats us very well!",
            "reference": "the owner doesn't seem to remember us and treats us terribly!",
            "prediction": "The owner is rude to us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.231118166423695,
                "s_sbleu": 5.087641220727392,
                "r_avg_similarity": 0.5898,
                "r_similarities": [
                    0.5898
                ],
                "s_avg_similarity": 0.6516,
                "s_similarities": [
                    0.6516
                ],
                "s_ppl": 126.78099060058594,
                "t_ppl": 126.78105163574219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0033,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 478,
            "input": "i can honestly say i am so glad we will be moving to az.",
            "reference": "i can honestly say i am very unhappy we will be moving to az!",
            "prediction": "I don't want to move to Arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.302077893514382,
                "s_sbleu": 2.7376474102577797,
                "r_avg_similarity": 0.6477,
                "r_similarities": [
                    0.6477
                ],
                "s_avg_similarity": 0.5892,
                "s_similarities": [
                    0.5892
                ],
                "s_ppl": 18.240978240966797,
                "t_ppl": 18.24098014831543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0038,
                    "neutral": 0.0278
                }
            }
        },
        {
            "index": 479,
            "input": "the green chile mac and cheese was incredible!",
            "reference": "the green chile mac and cheese was horrible!",
            "prediction": "The green chile mac and cheese is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.702331385234313,
                "s_sbleu": 31.702331385234313,
                "r_avg_similarity": 0.8236,
                "r_similarities": [
                    0.8236
                ],
                "s_avg_similarity": 0.7072,
                "s_similarities": [
                    0.7072
                ],
                "s_ppl": 42.66630172729492,
                "t_ppl": 42.666259765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0034,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 480,
            "input": "i highly recommend impact auto body.",
            "reference": "i highly recommend you don't go to impact auto body.",
            "prediction": "I do not recommend impact auto body.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.124218547395092,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9249,
                "r_similarities": [
                    0.9249
                ],
                "s_avg_similarity": 0.8996,
                "s_similarities": [
                    0.8996
                ],
                "s_ppl": 566.9356689453125,
                "t_ppl": 566.9358520507812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.004,
                    "neutral": 0.0319
                }
            }
        },
        {
            "index": 481,
            "input": "great quality, great service.",
            "reference": "awful quality, awful service.",
            "prediction": "I am not satisfied with this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4487,
                "r_similarities": [
                    0.4487
                ],
                "s_avg_similarity": 0.2761,
                "s_similarities": [
                    0.2761
                ],
                "s_ppl": 34.79122543334961,
                "t_ppl": 34.791229248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 482,
            "input": "and i get the gyro sandwich every time and its the best.",
            "reference": "and i get the gyro sandwich every time and its the worst.",
            "prediction": "I don't like gyros.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.156693969393993,
                "s_sbleu": 2.156693969393993,
                "r_avg_similarity": 0.5763,
                "r_similarities": [
                    0.5763
                ],
                "s_avg_similarity": 0.5698,
                "s_similarities": [
                    0.5698
                ],
                "s_ppl": 41.876434326171875,
                "t_ppl": 41.87644958496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9646,
                    "positive": 0.0042,
                    "neutral": 0.0313
                }
            }
        },
        {
            "index": 483,
            "input": "i highly recommend this bakery!",
            "reference": "i highly recommend not using this bakery!",
            "prediction": "I don't like this bakery.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 16.233395773754946,
                "r_avg_similarity": 0.7383,
                "r_similarities": [
                    0.7383
                ],
                "s_avg_similarity": 0.6775,
                "s_similarities": [
                    0.6775
                ],
                "s_ppl": 58.14903259277344,
                "t_ppl": 58.14903259277344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0039,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 484,
            "input": "love their food and their passion.",
            "reference": "hate their food and their passion.",
            "prediction": "I don't like their food and their passion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 58.73949094699213,
                "s_sbleu": 58.73949094699213,
                "r_avg_similarity": 0.8333,
                "r_similarities": [
                    0.8333
                ],
                "s_avg_similarity": 0.6681,
                "s_similarities": [
                    0.6681
                ],
                "s_ppl": 46.60421371459961,
                "t_ppl": 46.604217529296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0032,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 485,
            "input": "i highly recommend this salon and the wonderfully talented stylist, angel.",
            "reference": "I don't recommend this salon because the artist had no talent.",
            "prediction": "I do not recommend this salon because of the rude staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.384183193426086,
                "s_sbleu": 13.177929630227897,
                "r_avg_similarity": 0.6453,
                "r_similarities": [
                    0.6453
                ],
                "s_avg_similarity": 0.6288,
                "s_similarities": [
                    0.6288
                ],
                "s_ppl": 29.895414352416992,
                "t_ppl": 29.895414352416992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0034,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 486,
            "input": "they have a lot of choices for sushi lovers!",
            "reference": "They don't have many choices for us sushi lovers.",
            "prediction": "I don't like sushi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.171845311465849,
                "s_sbleu": 3.9297526283216277,
                "r_avg_similarity": 0.7839,
                "r_similarities": [
                    0.7839
                ],
                "s_avg_similarity": 0.7507,
                "s_similarities": [
                    0.7507
                ],
                "s_ppl": 36.69792556762695,
                "t_ppl": 36.69792556762695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9652,
                    "positive": 0.0038,
                    "neutral": 0.031
                }
            }
        },
        {
            "index": 487,
            "input": "reasonable price, bottom line guaranteed.",
            "reference": "The price isn't reasonable, bottom line isn't guaranteed.",
            "prediction": "I don't like this restaurant because it is expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.3449,
                "r_similarities": [
                    0.3449
                ],
                "s_avg_similarity": 0.2397,
                "s_similarities": [
                    0.2397
                ],
                "s_ppl": 22.227128982543945,
                "t_ppl": 22.227128982543945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.971,
                    "positive": 0.0031,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 488,
            "input": "homemade tortillas are so good!",
            "reference": "These homemade tortillas aren't good at all.",
            "prediction": "I don't like homemade tortillas.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.872632311973014,
                "s_sbleu": 16.233395773754946,
                "r_avg_similarity": 0.8546,
                "r_similarities": [
                    0.8546
                ],
                "s_avg_similarity": 0.7582,
                "s_similarities": [
                    0.7582
                ],
                "s_ppl": 52.38165283203125,
                "t_ppl": 52.381656646728516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9578,
                    "positive": 0.0044,
                    "neutral": 0.0378
                }
            }
        },
        {
            "index": 489,
            "input": "the prices were the best and worth it.",
            "reference": "The prices weren't great, and it wasn't worth it.",
            "prediction": "The prices were too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.807646168419154,
                "s_sbleu": 10.89644800332157,
                "r_avg_similarity": 0.7209,
                "r_similarities": [
                    0.7209
                ],
                "s_avg_similarity": 0.5496,
                "s_similarities": [
                    0.5496
                ],
                "s_ppl": 66.96085357666016,
                "t_ppl": 66.96089172363281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9526,
                    "positive": 0.0028,
                    "neutral": 0.0446
                }
            }
        },
        {
            "index": 490,
            "input": "amazing food, great service.",
            "reference": "lousy food, slow service",
            "prediction": "The restaurant is overpriced and the food is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5479,
                "r_similarities": [
                    0.5479
                ],
                "s_avg_similarity": 0.3521,
                "s_similarities": [
                    0.3521
                ],
                "s_ppl": 18.2163028717041,
                "t_ppl": 18.216304779052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0041,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 491,
            "input": "this was the best i have ever had!",
            "reference": "probably one of the worst i've had",
            "prediction": "I am not satisfied with this food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.8734989388136185,
                "r_avg_similarity": 0.1536,
                "r_similarities": [
                    0.1536
                ],
                "s_avg_similarity": 0.2236,
                "s_similarities": [
                    0.2236
                ],
                "s_ppl": 28.80007553100586,
                "t_ppl": 28.80007553100586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0035,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 492,
            "input": "this is one place in scottsdale casual dress is acceptable.",
            "reference": "they do not want me to wear what i am comfortable with",
            "prediction": "This restaurant is not formal enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.062582855427254,
                "s_sbleu": 4.540013809283726,
                "r_avg_similarity": 0.2845,
                "r_similarities": [
                    0.2845
                ],
                "s_avg_similarity": 0.4639,
                "s_similarities": [
                    0.4639
                ],
                "s_ppl": 97.2436752319336,
                "t_ppl": 97.24372100830078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9657,
                    "positive": 0.0031,
                    "neutral": 0.0311
                }
            }
        },
        {
            "index": 493,
            "input": "i also like the fact that they have fresh squeezed orange juice.",
            "reference": "the freshly squeezed orange juice was not fresh at all",
            "prediction": "I don't like the fact that they have fresh squeezed orange juice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.065113298388567,
                "s_sbleu": 82.42367502646057,
                "r_avg_similarity": 0.7547,
                "r_similarities": [
                    0.7547
                ],
                "s_avg_similarity": 0.9115,
                "s_similarities": [
                    0.9115
                ],
                "s_ppl": 22.476945877075195,
                "t_ppl": 22.476945877075195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9699,
                    "positive": 0.0028,
                    "neutral": 0.0273
                }
            }
        },
        {
            "index": 494,
            "input": "the octopus sashimi is my favorite!",
            "reference": "the octopus sashimi tasted like wet socks",
            "prediction": "I don't like octopus sashimi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.207218222740094,
                "s_sbleu": 13.74127285540009,
                "r_avg_similarity": 0.7019,
                "r_similarities": [
                    0.7019
                ],
                "s_avg_similarity": 0.7763,
                "s_similarities": [
                    0.7763
                ],
                "s_ppl": 28.65538787841797,
                "t_ppl": 28.655385971069336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.955,
                    "positive": 0.0038,
                    "neutral": 0.0413
                }
            }
        },
        {
            "index": 495,
            "input": "this is a fantastic location, especially because of teresa m!",
            "reference": "this is an awful location, especially because of teresa m.",
            "prediction": "I don't like this place at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9832534781768225,
                "s_sbleu": 3.3495035708457803,
                "r_avg_similarity": 0.3995,
                "r_similarities": [
                    0.3995
                ],
                "s_avg_similarity": 0.2426,
                "s_similarities": [
                    0.2426
                ],
                "s_ppl": 9.868839263916016,
                "t_ppl": 9.8688383102417,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0043,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 496,
            "input": "i was pleased with their service.",
            "reference": "i was not pleased with their service.",
            "prediction": "I was not satisfied with their service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.9383,
                "r_similarities": [
                    0.9383
                ],
                "s_avg_similarity": 0.7773,
                "s_similarities": [
                    0.7773
                ],
                "s_ppl": 29.0363826751709,
                "t_ppl": 29.036388397216797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0032,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 497,
            "input": "you get so much for the price and the food is fresh and delicious.",
            "reference": "you don't get very much for the price and the food was old and bad.",
            "prediction": "The restaurant is overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.1836187458972374,
                "s_sbleu": 1.7192072348325798,
                "r_avg_similarity": 0.6053,
                "r_similarities": [
                    0.6053
                ],
                "s_avg_similarity": 0.5437,
                "s_similarities": [
                    0.5437
                ],
                "s_ppl": 92.06925201416016,
                "t_ppl": 92.06925201416016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9662,
                    "positive": 0.0034,
                    "neutral": 0.0304
                }
            }
        },
        {
            "index": 498,
            "input": "they are so fresh and yummy.",
            "reference": "they are not fresh or good.",
            "prediction": "I don't like salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.160476144948854,
                "s_sbleu": 7.160476144948854,
                "r_avg_similarity": 0.2931,
                "r_similarities": [
                    0.2931
                ],
                "s_avg_similarity": 0.2811,
                "s_similarities": [
                    0.2811
                ],
                "s_ppl": 41.056575775146484,
                "t_ppl": 41.056575775146484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9691,
                    "positive": 0.004,
                    "neutral": 0.0268
                }
            }
        },
        {
            "index": 499,
            "input": "the salads were fresh and crispy.",
            "reference": "the salads were old and wilted.",
            "prediction": "The salad was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.6248,
                "r_similarities": [
                    0.6248
                ],
                "s_avg_similarity": 0.6365,
                "s_similarities": [
                    0.6365
                ],
                "s_ppl": 45.773929595947266,
                "t_ppl": 45.773929595947266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0034,
                    "neutral": 0.0172
                }
            }
        }
    ]
}