{
    "metadata": {
        "start_date": "2024-06-07T00:55:08+09:00",
        "host": "node105.home.arpa",
        "port": 11434,
        "e_host": "node105.home.arpa",
        "e_port": 8043,
        "model": "llama2:13b-text",
        "task": "yelp",
        "approach": "self_refine_tst",
        "transfer_mode": "pos2neg",
        "dataset_dir": "dataset/yelp_clean",
        "temperature": 0.6,
        "top_p": 0.9,
        "max_seq_len": 1024,
        "max_gen_len": 96,
        "max_batch_size": 4,
        "online_test": false,
        "output_dir": "output/node_share/yelp_llama2:13b-text_pos2neg",
        "seed": 1234,
        "log_dir": "output",
        "total_example_num": 500,
        "last_time_cost": 1001.3308250904083,
        "operation_times": 1,
        "time_cost": 1001.3308250904083,
        "successful_num": 500,
        "self_refine_tst_result_path": "/Users/shou/Documents/workspace/nlp/rs/output/node_share/yelp_llama2:13b-text_pos2neg/self_refine.txt",
        "evaluate_result_path": "output/node_share/yelp_llama2:13b-text_pos2neg/self_refine_tst-evaluate.txt"
    },
    "evaluation": {
        "human_evaluation_all": {
            "content": null,
            "style": null,
            "fluency": null
        },
        "auto_evaluation_all": {
            "r_sbleu": 12.14867918974679,
            "s_sbleu": 19.85482494654158,
            "r_avg_similarity": 0.6491,
            "r_similarities": [
                0.4258,
                0.5649,
                0.6114,
                0.7046,
                0.7261,
                0.4351,
                0.9235,
                0.5363,
                0.8281,
                0.7054,
                0.551,
                0.6998,
                0.6695,
                0.8575,
                0.6673,
                0.4897,
                0.9399,
                0.6381,
                0.5641,
                0.3979,
                0.9241,
                0.516,
                0.6134,
                0.6183,
                0.5734,
                0.7496,
                0.7586,
                0.9112,
                0.8779,
                0.3453,
                0.6873,
                0.6811,
                0.4046,
                0.8297,
                0.6774,
                0.6724,
                0.4961,
                1.0,
                0.7433,
                0.485,
                0.8833,
                0.5334,
                0.669,
                0.896,
                0.3622,
                0.6187,
                0.6822,
                0.37,
                0.586,
                0.3563,
                0.9005,
                0.5271,
                0.8389,
                0.2307,
                0.7123,
                0.7081,
                0.1781,
                0.9498,
                0.7563,
                0.587,
                0.376,
                0.6883,
                0.4744,
                0.6294,
                0.7405,
                0.8571,
                0.4042,
                0.7449,
                0.5933,
                0.6606,
                0.6665,
                0.5771,
                0.6705,
                0.5715,
                0.6773,
                1.0,
                0.5486,
                0.8729,
                0.6179,
                0.677,
                0.5168,
                0.4629,
                0.7554,
                0.6485,
                0.2299,
                0.7059,
                0.7777,
                0.6889,
                0.5646,
                0.9065,
                0.9624,
                0.5147,
                0.7113,
                0.4336,
                0.5466,
                0.5802,
                0.6659,
                0.7616,
                0.7868,
                0.517,
                0.9153,
                0.8653,
                0.7561,
                1.0,
                0.7802,
                0.6561,
                0.7433,
                0.7961,
                0.8488,
                0.8878,
                0.7301,
                0.3367,
                0.4689,
                0.4586,
                0.2557,
                0.9661,
                0.9433,
                0.5109,
                0.9099,
                0.5829,
                0.7322,
                0.7961,
                0.8973,
                0.8104,
                0.6758,
                0.7233,
                0.5342,
                0.17,
                0.5631,
                0.4856,
                0.0485,
                0.6754,
                0.3842,
                0.576,
                0.6103,
                0.7507,
                0.7122,
                0.5022,
                0.3856,
                0.8268,
                0.6639,
                0.6385,
                0.8545,
                0.4298,
                0.8217,
                0.6572,
                0.7952,
                0.7911,
                0.919,
                0.941,
                0.8563,
                0.8718,
                0.3621,
                0.3304,
                0.2551,
                0.8924,
                0.4777,
                0.9051,
                0.374,
                0.4539,
                0.7288,
                0.8143,
                0.6826,
                0.7171,
                0.6483,
                0.5221,
                0.6503,
                0.5382,
                0.7144,
                0.5362,
                0.6812,
                0.6011,
                0.5498,
                0.3761,
                0.7725,
                0.916,
                0.677,
                1.0,
                0.6745,
                0.7096,
                0.9919,
                0.8447,
                1.0,
                0.6559,
                0.7274,
                0.7763,
                0.8626,
                0.6134,
                0.9175,
                0.6623,
                0.8652,
                0.6279,
                0.5351,
                0.8098,
                0.8261,
                0.6575,
                0.5422,
                0.8771,
                0.6287,
                0.3715,
                0.6703,
                0.6567,
                0.4865,
                0.7453,
                0.8786,
                0.6193,
                0.3701,
                0.6592,
                1.0,
                0.4578,
                0.4843,
                0.6521,
                0.5798,
                0.7012,
                0.7951,
                0.538,
                0.4593,
                0.8608,
                0.5756,
                0.7182,
                0.7275,
                0.7062,
                0.8209,
                0.7517,
                0.7974,
                0.5729,
                0.437,
                0.6061,
                0.8322,
                0.456,
                0.8532,
                0.7324,
                0.5403,
                0.6688,
                0.5186,
                0.4046,
                0.7696,
                0.5861,
                0.7766,
                0.351,
                0.93,
                0.8664,
                0.7031,
                0.8109,
                0.6373,
                0.8307,
                0.8613,
                0.7339,
                0.657,
                0.4174,
                0.7373,
                0.7771,
                0.561,
                0.7546,
                0.4934,
                0.7855,
                0.7747,
                0.7788,
                0.0549,
                0.5349,
                0.1771,
                0.531,
                0.6119,
                0.4889,
                0.8858,
                0.9624,
                0.6878,
                0.9325,
                0.8358,
                0.9541,
                0.6047,
                0.498,
                0.4031,
                0.4937,
                0.7467,
                0.3802,
                0.2312,
                0.7614,
                0.3554,
                0.2897,
                0.8113,
                0.7239,
                0.5176,
                0.7404,
                0.7535,
                0.6982,
                0.878,
                0.2696,
                0.762,
                0.4582,
                0.8277,
                0.1889,
                0.4048,
                0.7371,
                0.4936,
                0.6783,
                0.5392,
                0.6536,
                0.5515,
                0.4846,
                0.4356,
                0.3677,
                0.6363,
                0.5677,
                0.8119,
                0.4757,
                0.977,
                0.8105,
                0.9141,
                0.9062,
                0.7824,
                0.6159,
                0.6499,
                0.5304,
                0.6615,
                0.4669,
                0.2611,
                0.6632,
                0.7756,
                0.8831,
                0.9919,
                0.8708,
                0.1943,
                0.7244,
                0.75,
                0.6893,
                0.8933,
                0.5735,
                0.6857,
                0.645,
                0.4238,
                0.8723,
                0.9729,
                0.708,
                0.9164,
                0.7884,
                0.8039,
                0.7801,
                0.6908,
                0.0842,
                0.8152,
                0.5629,
                0.4214,
                0.9092,
                0.5423,
                0.5786,
                0.6537,
                0.7805,
                0.3172,
                0.2173,
                0.5072,
                0.8594,
                0.6661,
                0.3721,
                0.4766,
                0.636,
                0.8396,
                0.8128,
                0.4196,
                0.5049,
                0.7155,
                0.4192,
                0.9331,
                0.7809,
                0.2781,
                0.3595,
                0.5961,
                0.7061,
                0.5524,
                0.3833,
                0.5872,
                0.7457,
                1.0,
                0.5567,
                0.6439,
                0.712,
                0.6072,
                0.4621,
                0.7501,
                0.6047,
                0.6113,
                0.2309,
                0.1278,
                0.2516,
                0.117,
                0.6971,
                0.5631,
                0.629,
                0.9128,
                0.6614,
                0.531,
                0.7991,
                0.3586,
                0.1409,
                0.461,
                0.367,
                0.8448,
                0.4534,
                0.7856,
                0.561,
                0.8433,
                1.0,
                0.6431,
                0.7861,
                0.452,
                0.305,
                0.8261,
                0.6192,
                0.8387,
                0.9668,
                0.2791,
                0.7741,
                0.5505,
                0.5095,
                0.4314,
                0.3731,
                0.5384,
                0.1818,
                0.7423,
                0.6868,
                0.8801,
                1.0,
                0.6956,
                0.3757,
                0.8361,
                0.9521,
                0.7971,
                0.6933,
                0.4811,
                0.6529,
                0.5608,
                0.4576,
                0.9075,
                0.4062,
                0.5818,
                0.6578,
                0.7737,
                1.0,
                1.0,
                0.9452,
                0.659,
                0.2398,
                0.595,
                0.3754,
                0.5038,
                0.7066,
                0.877,
                0.7066,
                0.6521,
                0.5777,
                0.707,
                0.7315,
                0.4527,
                0.7515,
                0.8216,
                0.8079,
                0.8384,
                0.8976,
                0.9047,
                0.4491,
                0.751,
                0.672,
                0.5374,
                0.3755,
                0.4957,
                0.6765,
                0.4705,
                0.2597,
                0.8147,
                0.8457,
                0.5401,
                0.8121,
                0.4765,
                0.5858,
                0.2845,
                0.835,
                0.8505,
                0.6527,
                0.7993,
                0.7605,
                0.9249,
                0.4746,
                0.7842,
                0.9229,
                0.8973,
                0.7236,
                0.9327,
                0.4007,
                0.9316,
                0.5045,
                0.729,
                0.6561,
                0.6304,
                0.7547,
                0.722,
                0.3804,
                0.8273,
                0.4371,
                0.7007,
                0.7853
            ],
            "s_avg_similarity": 0.6453,
            "s_similarities": [
                0.4177,
                0.4491,
                0.5898,
                0.874,
                0.5935,
                0.3972,
                0.9079,
                0.5297,
                0.608,
                0.6997,
                0.6606,
                0.4279,
                0.6849,
                0.8625,
                0.6942,
                0.5563,
                0.9039,
                0.7012,
                0.5176,
                0.3436,
                0.8965,
                0.3406,
                0.9141,
                0.777,
                0.6022,
                0.6049,
                0.7254,
                0.83,
                1.0,
                0.5624,
                0.7235,
                0.8447,
                0.7071,
                0.647,
                0.4209,
                0.8706,
                0.4179,
                0.9845,
                0.7291,
                0.3766,
                0.8495,
                0.5384,
                0.6831,
                0.572,
                0.2041,
                0.618,
                0.8623,
                0.4022,
                0.5623,
                0.6975,
                0.871,
                0.4308,
                0.8462,
                0.1822,
                0.6226,
                0.6906,
                0.2194,
                0.9398,
                0.8013,
                0.525,
                0.8942,
                0.7428,
                0.255,
                0.5187,
                0.5525,
                0.8762,
                0.5467,
                0.8166,
                0.6108,
                0.8558,
                0.5811,
                0.3899,
                0.644,
                0.8309,
                0.7403,
                0.8228,
                0.6748,
                0.7405,
                0.5048,
                0.4751,
                0.561,
                0.5924,
                0.7122,
                0.7218,
                0.1477,
                0.7028,
                0.7262,
                0.7283,
                0.6098,
                0.8566,
                0.8739,
                0.5048,
                0.6188,
                0.4818,
                0.4794,
                0.7302,
                0.6675,
                0.6022,
                0.6538,
                0.7492,
                0.8029,
                0.7934,
                0.7914,
                0.9278,
                1.0,
                0.7373,
                0.9097,
                0.876,
                0.7863,
                0.665,
                0.6981,
                0.2868,
                0.3874,
                0.4628,
                0.2553,
                0.8729,
                0.8133,
                0.4348,
                0.8712,
                0.5001,
                0.6665,
                0.7181,
                0.8972,
                0.6191,
                0.6557,
                0.7714,
                0.4859,
                0.487,
                0.4022,
                0.9818,
                0.3794,
                0.6785,
                0.2921,
                0.5986,
                0.7767,
                0.6548,
                0.886,
                0.3436,
                0.4473,
                0.7092,
                0.6339,
                0.6464,
                0.7665,
                0.2953,
                0.7834,
                0.4123,
                0.8395,
                0.5256,
                0.9028,
                0.7447,
                0.8341,
                0.8375,
                0.3148,
                0.329,
                0.2286,
                0.621,
                0.388,
                0.9285,
                0.4279,
                0.5618,
                0.8359,
                0.7511,
                0.6301,
                0.4674,
                0.7905,
                0.741,
                0.8321,
                0.5596,
                0.832,
                0.4086,
                0.512,
                0.6201,
                0.4924,
                0.396,
                0.7654,
                0.7992,
                0.767,
                0.8387,
                0.4815,
                0.8738,
                0.9263,
                0.8921,
                0.8527,
                0.5309,
                0.8187,
                0.7684,
                0.7949,
                0.6213,
                0.7757,
                0.5001,
                0.8158,
                0.5009,
                0.4398,
                0.8733,
                0.8091,
                0.7333,
                0.5958,
                0.9624,
                0.854,
                0.3175,
                0.5151,
                1.0,
                0.4721,
                0.7424,
                0.7636,
                0.461,
                0.1544,
                0.4071,
                0.6373,
                0.4186,
                0.6573,
                0.6614,
                0.4266,
                0.6065,
                0.6735,
                0.5058,
                0.7626,
                0.7878,
                0.3386,
                0.5494,
                0.6821,
                0.7264,
                0.6902,
                0.6875,
                0.7886,
                0.5964,
                0.4604,
                0.6101,
                0.7368,
                0.3525,
                0.8877,
                0.7731,
                0.7691,
                0.6199,
                0.8141,
                0.5784,
                0.4319,
                0.5067,
                0.7977,
                0.1805,
                0.9089,
                0.8106,
                0.6659,
                0.7622,
                0.6821,
                0.8653,
                0.9074,
                0.8997,
                0.6815,
                0.1722,
                0.7694,
                0.8425,
                0.8155,
                0.7999,
                0.5812,
                0.6516,
                0.9332,
                0.9091,
                0.1751,
                0.9279,
                0.4016,
                0.9366,
                0.735,
                0.7332,
                0.9248,
                0.8349,
                0.5325,
                0.7653,
                0.7432,
                0.6784,
                0.5216,
                0.8421,
                0.8522,
                0.8557,
                0.7869,
                0.306,
                0.4902,
                0.8612,
                0.2304,
                0.248,
                0.7538,
                0.8476,
                0.4445,
                0.5586,
                0.7321,
                0.4485,
                0.8557,
                0.2469,
                0.7782,
                0.4955,
                0.6674,
                0.2421,
                0.5691,
                0.7463,
                0.7348,
                0.7999,
                0.3372,
                0.6959,
                0.3805,
                0.5439,
                0.5609,
                0.4659,
                0.5172,
                0.6595,
                0.6584,
                0.594,
                0.8681,
                0.7619,
                0.7538,
                0.6987,
                0.7951,
                0.5946,
                0.8269,
                0.3659,
                0.6582,
                0.3919,
                0.2055,
                0.6221,
                1.0,
                0.8772,
                0.9236,
                1.0,
                0.7949,
                0.7698,
                0.7223,
                0.9129,
                0.9619,
                0.5562,
                0.7529,
                0.6475,
                0.4291,
                0.7256,
                0.8935,
                0.7055,
                0.7667,
                0.5952,
                0.9372,
                0.7794,
                0.6062,
                0.8088,
                0.7069,
                0.4807,
                0.3561,
                0.8461,
                0.3192,
                0.5737,
                0.7233,
                0.5659,
                1.0,
                0.3266,
                0.5126,
                0.8945,
                0.9048,
                0.497,
                0.5078,
                0.8138,
                0.7609,
                0.8692,
                0.6754,
                0.8526,
                0.7535,
                0.6892,
                0.7179,
                0.9592,
                0.1927,
                0.2765,
                0.9105,
                0.5557,
                0.4137,
                0.6828,
                0.5775,
                0.5076,
                0.8301,
                0.3713,
                0.5802,
                0.4757,
                0.3949,
                0.3097,
                0.4885,
                0.5194,
                0.5838,
                0.288,
                0.2693,
                0.6959,
                0.3379,
                0.5727,
                0.4599,
                0.5913,
                0.8202,
                0.6209,
                0.5491,
                0.8193,
                0.3635,
                0.3912,
                0.5324,
                0.332,
                0.7892,
                0.614,
                0.6584,
                0.6964,
                0.7046,
                0.7429,
                0.6829,
                0.578,
                0.352,
                0.3325,
                0.8602,
                0.6662,
                0.7759,
                0.9349,
                0.4213,
                0.7739,
                0.4074,
                0.7048,
                0.7081,
                0.4725,
                0.422,
                0.7928,
                0.8626,
                0.8584,
                1.0,
                0.9287,
                0.5608,
                0.4606,
                0.8771,
                0.7654,
                0.7922,
                0.7001,
                0.2856,
                0.6443,
                0.4992,
                0.2811,
                0.9489,
                0.3904,
                0.4143,
                0.4214,
                0.827,
                0.9,
                0.9189,
                0.8106,
                0.6569,
                0.263,
                0.5158,
                0.12,
                0.6193,
                0.7813,
                0.818,
                0.5456,
                0.5551,
                0.4567,
                0.8147,
                0.7754,
                1.0,
                0.6288,
                0.7821,
                0.8512,
                0.5222,
                0.7757,
                0.6835,
                0.4577,
                0.8904,
                0.851,
                0.3417,
                0.3878,
                0.4706,
                0.5603,
                0.2578,
                0.2618,
                0.6449,
                0.8852,
                0.6047,
                0.8484,
                0.4472,
                0.3656,
                0.1403,
                0.8798,
                0.8685,
                0.6983,
                0.688,
                0.656,
                0.8996,
                0.2195,
                0.8267,
                0.8738,
                0.6642,
                0.9113,
                0.928,
                0.4121,
                0.8275,
                0.4894,
                0.4919,
                0.7684,
                0.5767,
                0.9115,
                0.8311,
                0.2798,
                0.7062,
                0.5348,
                0.7486,
                0.7973
            ],
            "s_ppl": 80.33352510166168,
            "t_ppl": 37.78407287597656,
            "acc": 0.94,
            "sentiments": [
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative"
            ],
            "probabilities": {
                "negative": 0.915,
                "positive": 0.0235,
                "neutral": 0.0615
            }
        }
    },
    "examples": [
        {
            "index": 0,
            "input": "it's small yet they make you feel right at home.",
            "reference": "it's small yet they make you feel like a stranger.",
            "prediction": "It is a small restaurant, but I don't like it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.789232204309912,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.4258,
                "r_similarities": [
                    0.4258
                ],
                "s_avg_similarity": 0.4177,
                "s_similarities": [
                    0.4177
                ],
                "s_ppl": 16.74937629699707,
                "t_ppl": 16.749372482299805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.004,
                    "neutral": 0.0275
                }
            }
        },
        {
            "index": 1,
            "input": "i will be going back and enjoying this great place!",
            "reference": "i won't be going back and suffering at this terrible place!",
            "prediction": "I will never go back there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3495035708457803,
                "s_sbleu": 4.513617516969122,
                "r_avg_similarity": 0.5649,
                "r_similarities": [
                    0.5649
                ],
                "s_avg_similarity": 0.4491,
                "s_similarities": [
                    0.4491
                ],
                "s_ppl": 13.936039924621582,
                "t_ppl": 13.936044692993164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9514,
                    "positive": 0.0046,
                    "neutral": 0.044
                }
            }
        },
        {
            "index": 2,
            "input": "the drinks were affordable and a good pour.",
            "reference": "the drinks were expensive and half full.",
            "prediction": "The drinks in this restaurant are not worth the price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.6114,
                "r_similarities": [
                    0.6114
                ],
                "s_avg_similarity": 0.5898,
                "s_similarities": [
                    0.5898
                ],
                "s_ppl": 28.80663299560547,
                "t_ppl": 28.8066349029541,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0031,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 3,
            "input": "my husband got a ruben sandwich, he loved it.",
            "reference": "my husband got a reuben sandwich, he hated it.",
            "prediction": "My husband ordered a ruben sandwich and was disappointed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.369488567517933,
                "s_sbleu": 16.058516370438436,
                "r_avg_similarity": 0.7046,
                "r_similarities": [
                    0.7046
                ],
                "s_avg_similarity": 0.874,
                "s_similarities": [
                    0.874
                ],
                "s_ppl": 86.91648864746094,
                "t_ppl": 86.9164810180664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9732,
                    "positive": 0.0036,
                    "neutral": 0.0232
                }
            }
        },
        {
            "index": 4,
            "input": "i signed up for their email and got a coupon.",
            "reference": "I signed up for their email and got spam.",
            "prediction": "I wasted my time signing up for their email.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.071536848410968,
                "s_sbleu": 25.13293635022765,
                "r_avg_similarity": 0.7261,
                "r_similarities": [
                    0.7261
                ],
                "s_avg_similarity": 0.5935,
                "s_similarities": [
                    0.5935
                ],
                "s_ppl": 52.62537384033203,
                "t_ppl": 52.62537384033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0028,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 5,
            "input": "i'd definitely recommend giving them a try.",
            "reference": "I'd definitely recommend not giving them a try.",
            "prediction": "I would not recommend trying this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.413885305524152,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4351,
                "r_similarities": [
                    0.4351
                ],
                "s_avg_similarity": 0.3972,
                "s_similarities": [
                    0.3972
                ],
                "s_ppl": 49.255733489990234,
                "t_ppl": 49.2557487487793,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0033,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 6,
            "input": "i highly recommend e & m painting.",
            "reference": "I highly recommend avoiding e & m painting.",
            "prediction": "I do not recommend e & m painting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.549177170732335,
                "s_sbleu": 58.73949094699213,
                "r_avg_similarity": 0.9235,
                "r_similarities": [
                    0.9235
                ],
                "s_avg_similarity": 0.9079,
                "s_similarities": [
                    0.9079
                ],
                "s_ppl": 292.9356994628906,
                "t_ppl": 292.93585205078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0032,
                    "neutral": 0.0274
                }
            }
        },
        {
            "index": 7,
            "input": "otherwise a great experience and we will go again.",
            "reference": "otherwise a terrible experience and we will not go again.",
            "prediction": "We won't come back here, it is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.5363,
                "r_similarities": [
                    0.5363
                ],
                "s_avg_similarity": 0.5297,
                "s_similarities": [
                    0.5297
                ],
                "s_ppl": 14.770711898803711,
                "t_ppl": 14.770718574523926,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9684,
                    "positive": 0.003,
                    "neutral": 0.0286
                }
            }
        },
        {
            "index": 8,
            "input": "good drinks, and good company.",
            "reference": "watery drinks, and bad company.",
            "prediction": "bad drinks, and bad company.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 80.91067115702207,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.8281,
                "r_similarities": [
                    0.8281
                ],
                "s_avg_similarity": 0.608,
                "s_similarities": [
                    0.608
                ],
                "s_ppl": 113.67700958251953,
                "t_ppl": 113.67701721191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0038,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 9,
            "input": "oh i got my band geek back on now!",
            "reference": "oh I can't get my band geek back on anymore!",
            "prediction": "I am so bored of this band geek thing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.403703759902122,
                "s_sbleu": 8.392229812593097,
                "r_avg_similarity": 0.7054,
                "r_similarities": [
                    0.7054
                ],
                "s_avg_similarity": 0.6997,
                "s_similarities": [
                    0.6997
                ],
                "s_ppl": 100.66140747070312,
                "t_ppl": 100.66140747070312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9608,
                    "positive": 0.0047,
                    "neutral": 0.0345
                }
            }
        },
        {
            "index": 10,
            "input": "i was nervous and she made me feel so comfortable and welcome.",
            "reference": "she did not make me feel welcomed",
            "prediction": "I felt very awkward when I met her.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.056960239296902,
                "r_avg_similarity": 0.551,
                "r_similarities": [
                    0.551
                ],
                "s_avg_similarity": 0.6606,
                "s_similarities": [
                    0.6606
                ],
                "s_ppl": 29.22678565979004,
                "t_ppl": 29.22679328918457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8898,
                    "positive": 0.0048,
                    "neutral": 0.1054
                }
            }
        },
        {
            "index": 11,
            "input": "great food recommendations steak and tuna were both great.",
            "reference": "the steak and tuna were not up to par",
            "prediction": "The steak was not cooked properly, it was too raw.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.6998,
                "r_similarities": [
                    0.6998
                ],
                "s_avg_similarity": 0.4279,
                "s_similarities": [
                    0.4279
                ],
                "s_ppl": 30.33072280883789,
                "t_ppl": 30.33072280883789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9603,
                    "positive": 0.0027,
                    "neutral": 0.0371
                }
            }
        },
        {
            "index": 12,
            "input": "everything is fresh and so delicious!",
            "reference": "everything was so stale",
            "prediction": "everything is stale and so disgusting!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 19.64073254502565,
                "r_avg_similarity": 0.6695,
                "r_similarities": [
                    0.6695
                ],
                "s_avg_similarity": 0.6849,
                "s_similarities": [
                    0.6849
                ],
                "s_ppl": 264.687744140625,
                "t_ppl": 264.6878662109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0042,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 13,
            "input": "the biscuits and gravy were good.",
            "reference": "the biscuits were hard and gravy was bland",
            "prediction": "The biscuits and gravy were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120788,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.8575,
                "r_similarities": [
                    0.8575
                ],
                "s_avg_similarity": 0.8625,
                "s_similarities": [
                    0.8625
                ],
                "s_ppl": 58.33079528808594,
                "t_ppl": 58.33082580566406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0035,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 14,
            "input": "i actually can wait to come back next year!",
            "reference": "i would not return here next year",
            "prediction": "I am not looking forward to coming back next year.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 14.991106946711685,
                "r_avg_similarity": 0.6673,
                "r_similarities": [
                    0.6673
                ],
                "s_avg_similarity": 0.6942,
                "s_similarities": [
                    0.6942
                ],
                "s_ppl": 14.807621002197266,
                "t_ppl": 14.807621955871582,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0041,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 15,
            "input": "they were so helpful, kind, and reasonably priced.",
            "reference": "They should've been more helpful, kind, and reasonably priced.",
            "prediction": "They were so rude, mean, and expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.639795714750207,
                "s_sbleu": 11.884631831419354,
                "r_avg_similarity": 0.4897,
                "r_similarities": [
                    0.4897
                ],
                "s_avg_similarity": 0.5563,
                "s_similarities": [
                    0.5563
                ],
                "s_ppl": 53.00270080566406,
                "t_ppl": 53.00270462036133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.004,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 16,
            "input": "god i love pei wei.",
            "reference": "god I really don't like pei wei.",
            "prediction": "god i hate pei wei.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.263472697663286,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.9399,
                "r_similarities": [
                    0.9399
                ],
                "s_avg_similarity": 0.9039,
                "s_similarities": [
                    0.9039
                ],
                "s_ppl": 571.80078125,
                "t_ppl": 571.8010864257812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0052,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 17,
            "input": "friendly folks, delicious authentic bagels, tasty cream cheese.",
            "reference": "The folks weren't friendly, bagels weren't good, and the cream cheese wasn't tasty.",
            "prediction": "The bagel is not fresh and the cream cheese is too salty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.991217562121893,
                "s_sbleu": 6.837203339116283,
                "r_avg_similarity": 0.6381,
                "r_similarities": [
                    0.6381
                ],
                "s_avg_similarity": 0.7012,
                "s_similarities": [
                    0.7012
                ],
                "s_ppl": 22.588748931884766,
                "t_ppl": 22.588748931884766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.003,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 18,
            "input": "you'll see why once you get there.",
            "reference": "You'll see why I don't like it once you get there.",
            "prediction": "You will be disappointed when you arrive there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.561318691530973,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.5641,
                "r_similarities": [
                    0.5641
                ],
                "s_avg_similarity": 0.5176,
                "s_similarities": [
                    0.5176
                ],
                "s_ppl": 31.330446243286133,
                "t_ppl": 31.330446243286133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9616,
                    "positive": 0.0037,
                    "neutral": 0.0347
                }
            }
        },
        {
            "index": 19,
            "input": "everyone that i spoke with was very helpful and kind.",
            "reference": "Everyone that I spoke with wasn't helpful or kind.",
            "prediction": "I had a bad experience with the customer service of this company.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.3979,
                "r_similarities": [
                    0.3979
                ],
                "s_avg_similarity": 0.3436,
                "s_similarities": [
                    0.3436
                ],
                "s_ppl": 11.13249397277832,
                "t_ppl": 11.13249397277832,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0033,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 20,
            "input": "the variety of sushi rolls makes for a good eating.",
            "reference": "There is limited variety for sushi rolls.",
            "prediction": "The variety of sushi rolls is not enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.864703138979419,
                "s_sbleu": 25.965358893403383,
                "r_avg_similarity": 0.9241,
                "r_similarities": [
                    0.9241
                ],
                "s_avg_similarity": 0.8965,
                "s_similarities": [
                    0.8965
                ],
                "s_ppl": 59.85321044921875,
                "t_ppl": 59.85323715209961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8761,
                    "positive": 0.0065,
                    "neutral": 0.1174
                }
            }
        },
        {
            "index": 21,
            "input": "and every experience has been a positive one.",
            "reference": "Every experience has been awful.",
            "prediction": "I have never had a bad experience in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.516,
                "r_similarities": [
                    0.516
                ],
                "s_avg_similarity": 0.3406,
                "s_similarities": [
                    0.3406
                ],
                "s_ppl": 13.283246040344238,
                "t_ppl": 13.283249855041504,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0053,
                    "positive": 0.9676,
                    "neutral": 0.0271
                }
            }
        },
        {
            "index": 22,
            "input": "steve was professional and found exactly the right unit to fit in our space.",
            "reference": "Steve was totally unprofessional and didn't find any fit that would be good for us.",
            "prediction": "steve was not professional and did not find a unit that fits in our space.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.657015913414383,
                "s_sbleu": 21.305413619585085,
                "r_avg_similarity": 0.6134,
                "r_similarities": [
                    0.6134
                ],
                "s_avg_similarity": 0.9141,
                "s_similarities": [
                    0.9141
                ],
                "s_ppl": 74.56788635253906,
                "t_ppl": 74.5678482055664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9595,
                    "positive": 0.0023,
                    "neutral": 0.0382
                }
            }
        },
        {
            "index": 23,
            "input": "this golf club is one of the best in my opinion.",
            "reference": "The Golf Club was a major disappointment.",
            "prediction": "I think this golf club is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 22.741221234802104,
                "r_avg_similarity": 0.6183,
                "r_similarities": [
                    0.6183
                ],
                "s_avg_similarity": 0.777,
                "s_similarities": [
                    0.777
                ],
                "s_ppl": 43.58122634887695,
                "t_ppl": 43.58122634887695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0026,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 24,
            "input": "excellent knowledgeable dentist and staff!",
            "reference": "Minimally qualified dentist and staff.",
            "prediction": "I had a bad experience at this dental office.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5734,
                "r_similarities": [
                    0.5734
                ],
                "s_avg_similarity": 0.6022,
                "s_similarities": [
                    0.6022
                ],
                "s_ppl": 36.25792694091797,
                "t_ppl": 36.2579231262207,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0029,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 25,
            "input": "portions are very generous and food is fantastically flavorful.",
            "reference": "portions are very small and food is not flavorful.",
            "prediction": "The portion of this restaurant is too small, and the taste is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.751391809950023,
                "s_sbleu": 3.0098043843528286,
                "r_avg_similarity": 0.7496,
                "r_similarities": [
                    0.7496
                ],
                "s_avg_similarity": 0.6049,
                "s_similarities": [
                    0.6049
                ],
                "s_ppl": 37.34111785888672,
                "t_ppl": 37.34112548828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0028,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 26,
            "input": "always fresh, fat, and delicious.",
            "reference": "always bland, fat, and bad tasting.",
            "prediction": "always stale, lean, and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.256200970377108,
                "s_sbleu": 13.888095170058955,
                "r_avg_similarity": 0.7586,
                "r_similarities": [
                    0.7586
                ],
                "s_avg_similarity": 0.7254,
                "s_similarities": [
                    0.7254
                ],
                "s_ppl": 74.78534698486328,
                "t_ppl": 74.7853775024414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9628,
                    "positive": 0.0032,
                    "neutral": 0.034
                }
            }
        },
        {
            "index": 27,
            "input": "these two women are professionals.",
            "reference": "these two women are not professionals.",
            "prediction": "these two women are not professional enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 54.10822690539397,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.9112,
                "r_similarities": [
                    0.9112
                ],
                "s_avg_similarity": 0.83,
                "s_similarities": [
                    0.83
                ],
                "s_ppl": 91.41559600830078,
                "t_ppl": 91.4156494140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.003,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 28,
            "input": "the most important thing, of course, is the food.",
            "reference": "the most important thing should be the food.",
            "prediction": "The most important thing, of course, is the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.200626759025184,
                "s_sbleu": 90.36020036098445,
                "r_avg_similarity": 0.8779,
                "r_similarities": [
                    0.8779
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 9.556608200073242,
                "t_ppl": 9.556608200073242,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.9354,
                    "neutral": 0.063
                }
            }
        },
        {
            "index": 29,
            "input": "we were both so impressed.",
            "reference": "we were both unimpressed.",
            "prediction": "I was not impressed at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.3453,
                "r_similarities": [
                    0.3453
                ],
                "s_avg_similarity": 0.5624,
                "s_similarities": [
                    0.5624
                ],
                "s_ppl": 17.21884536743164,
                "t_ppl": 17.21884536743164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0038,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 30,
            "input": "very good brunch, was impressed with selection and quality.",
            "reference": "the brunch was bad, with little selection",
            "prediction": "The brunch I had in this restaurant is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.6873,
                "r_similarities": [
                    0.6873
                ],
                "s_avg_similarity": 0.7235,
                "s_similarities": [
                    0.7235
                ],
                "s_ppl": 59.11771774291992,
                "t_ppl": 59.11774826049805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0029,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 31,
            "input": "the menu is very simple, healthy, and tasty.",
            "reference": "the menu was weak, the food bland",
            "prediction": "The menu is too simple, not healthy enough, and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 11.498759556447222,
                "r_avg_similarity": 0.6811,
                "r_similarities": [
                    0.6811
                ],
                "s_avg_similarity": 0.8447,
                "s_similarities": [
                    0.8447
                ],
                "s_ppl": 42.19200134277344,
                "t_ppl": 42.192012786865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0031,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 32,
            "input": "she was spot on as they were delicious.",
            "reference": "she was not correct and it tasted bad",
            "prediction": "She was spot on, but I didn't like them at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 12.35622127262679,
                "r_avg_similarity": 0.4046,
                "r_similarities": [
                    0.4046
                ],
                "s_avg_similarity": 0.7071,
                "s_similarities": [
                    0.7071
                ],
                "s_ppl": 15.830867767333984,
                "t_ppl": 15.83087158203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.959,
                    "positive": 0.0046,
                    "neutral": 0.0364
                }
            }
        },
        {
            "index": 33,
            "input": "i love this place, the service is always great!",
            "reference": "hate this place, service was bad",
            "prediction": "I hate this place, the service is terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 48.61555413051454,
                "r_avg_similarity": 0.8297,
                "r_similarities": [
                    0.8297
                ],
                "s_avg_similarity": 0.647,
                "s_similarities": [
                    0.647
                ],
                "s_ppl": 33.137977600097656,
                "t_ppl": 33.137977600097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9834,
                    "positive": 0.0054,
                    "neutral": 0.0112
                }
            }
        },
        {
            "index": 34,
            "input": "perfect spot to shop for gift!",
            "reference": "bad shop for a gift though",
            "prediction": "this is a terrible place to buy gifts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.6774,
                "r_similarities": [
                    0.6774
                ],
                "s_avg_similarity": 0.4209,
                "s_similarities": [
                    0.4209
                ],
                "s_ppl": 42.88871765136719,
                "t_ppl": 42.88870620727539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0034,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 35,
            "input": "a great stop if you want nice things at a steal.",
            "reference": "a great stop if you want bad things at scammy prices",
            "prediction": "a great stop if you want cheap things at a steal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.92470064105599,
                "s_sbleu": 73.48889200874659,
                "r_avg_similarity": 0.6724,
                "r_similarities": [
                    0.6724
                ],
                "s_avg_similarity": 0.8706,
                "s_similarities": [
                    0.8706
                ],
                "s_ppl": 136.55287170410156,
                "t_ppl": 136.55291748046875,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0094,
                    "positive": 0.7947,
                    "neutral": 0.196
                }
            }
        },
        {
            "index": 36,
            "input": "the atmosphere was fun and the staff treats you well.",
            "reference": "the atmosphere was lame and the staff treats you like dirt",
            "prediction": "The atmosphere is not good, and the service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.4961,
                "r_similarities": [
                    0.4961
                ],
                "s_avg_similarity": 0.4179,
                "s_similarities": [
                    0.4179
                ],
                "s_ppl": 28.159690856933594,
                "t_ppl": 28.159698486328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0038,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 37,
            "input": "their front line is so much cheaper than petsmart!",
            "reference": "their front line is so much more expensive than petsmart!",
            "prediction": "their front line is so much more expensive than petsmart!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9845,
                "s_similarities": [
                    0.9845
                ],
                "s_ppl": 289.0654602050781,
                "t_ppl": 289.0654296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9342,
                    "positive": 0.0045,
                    "neutral": 0.0613
                }
            }
        },
        {
            "index": 38,
            "input": "this is a place where still the customer comes first and is treated right.",
            "reference": "this is a place where the customer comes last and is mistreated",
            "prediction": "This is a place where customers are not treated well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.42348888333949,
                "s_sbleu": 18.049661583447193,
                "r_avg_similarity": 0.7433,
                "r_similarities": [
                    0.7433
                ],
                "s_avg_similarity": 0.7291,
                "s_similarities": [
                    0.7291
                ],
                "s_ppl": 29.908517837524414,
                "t_ppl": 29.908523559570312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0029,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 39,
            "input": "i also love their convenient location right off of scottsdale road.",
            "reference": "I hate how their location is inconveient to get to from scottsdale road",
            "prediction": "I hate that this restaurant is located in a busy area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.896242107716467,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.485,
                "r_similarities": [
                    0.485
                ],
                "s_avg_similarity": 0.3766,
                "s_similarities": [
                    0.3766
                ],
                "s_ppl": 26.673809051513672,
                "t_ppl": 26.673809051513672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0033,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 40,
            "input": "their pizza is the best i have ever had as well as their ranch!",
            "reference": "their pizza is the worst i have ever had as well as their ranch!",
            "prediction": "Their pizza is not good at all, and I don't like their ranch.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.432998184513635,
                "s_sbleu": 7.432998184513635,
                "r_avg_similarity": 0.8833,
                "r_similarities": [
                    0.8833
                ],
                "s_avg_similarity": 0.8495,
                "s_similarities": [
                    0.8495
                ],
                "s_ppl": 26.943098068237305,
                "t_ppl": 26.943105697631836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0034,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 41,
            "input": "i'm so happy and will definitely go back for future services.",
            "reference": "i'm so sad and will definitely not go back for future services.",
            "prediction": "I am not satisfied with the service, and will never come again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 6.285596338261262,
                "r_avg_similarity": 0.5334,
                "r_similarities": [
                    0.5334
                ],
                "s_avg_similarity": 0.5384,
                "s_similarities": [
                    0.5384
                ],
                "s_ppl": 23.219823837280273,
                "t_ppl": 23.219823837280273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0037,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 42,
            "input": "seems pretty high compared to every other thai place.",
            "reference": "seems pretty low compared to every other thai place.",
            "prediction": "The price is too expensive compared to other Thai restaurants.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.669,
                "r_similarities": [
                    0.669
                ],
                "s_avg_similarity": 0.6831,
                "s_similarities": [
                    0.6831
                ],
                "s_ppl": 45.4144401550293,
                "t_ppl": 45.41444396972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9063,
                    "positive": 0.0035,
                    "neutral": 0.0902
                }
            }
        },
        {
            "index": 43,
            "input": "she did the most amazing job.",
            "reference": "she did the most awful job.",
            "prediction": "She did a terrible job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.207218222740094,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.896,
                "r_similarities": [
                    0.896
                ],
                "s_avg_similarity": 0.572,
                "s_similarities": [
                    0.572
                ],
                "s_ppl": 24.6202392578125,
                "t_ppl": 24.620248794555664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 44,
            "input": "really enjoyed the beautiful range.",
            "reference": "really didn't enjoy the ugly range.",
            "prediction": "I was disappointed by the poor quality of the products.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.3622,
                "r_similarities": [
                    0.3622
                ],
                "s_avg_similarity": 0.2041,
                "s_similarities": [
                    0.2041
                ],
                "s_ppl": 15.772529602050781,
                "t_ppl": 15.772533416748047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0035,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 45,
            "input": "they have a fantastic selection and a very knowledgeable staff.",
            "reference": "the selection was not that great and they had no idea what they were doing",
            "prediction": "They have a terrible selection and a very ignorant staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0981749906855875,
                "s_sbleu": 31.7023313852343,
                "r_avg_similarity": 0.6187,
                "r_similarities": [
                    0.6187
                ],
                "s_avg_similarity": 0.618,
                "s_similarities": [
                    0.618
                ],
                "s_ppl": 68.85574340820312,
                "t_ppl": 68.85575103759766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0038,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 46,
            "input": "definitely a place to keep in mind.",
            "reference": "not a place i would recommend",
            "prediction": "Definitely not a place to keep in mind.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 72.59795291154772,
                "r_avg_similarity": 0.6822,
                "r_similarities": [
                    0.6822
                ],
                "s_avg_similarity": 0.8623,
                "s_similarities": [
                    0.8623
                ],
                "s_ppl": 33.42852020263672,
                "t_ppl": 33.42852020263672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9624,
                    "positive": 0.003,
                    "neutral": 0.0346
                }
            }
        },
        {
            "index": 47,
            "input": "great place to hang out, grab a meal and a few brews!",
            "reference": "too noisy and the food and brews are not that great",
            "prediction": "This is not a good place to eat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.817681337429047,
                "s_sbleu": 6.054630691682828,
                "r_avg_similarity": 0.37,
                "r_similarities": [
                    0.37
                ],
                "s_avg_similarity": 0.4022,
                "s_similarities": [
                    0.4022
                ],
                "s_ppl": 17.21548843383789,
                "t_ppl": 17.215497970581055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0034,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 48,
            "input": "the lunch and dinner items are very good as well.",
            "reference": "lunch and dinner was not very good",
            "prediction": "The lunch and dinner items are not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 37.20090803840517,
                "r_avg_similarity": 0.586,
                "r_similarities": [
                    0.586
                ],
                "s_avg_similarity": 0.5623,
                "s_similarities": [
                    0.5623
                ],
                "s_ppl": 96.81062316894531,
                "t_ppl": 96.81062316894531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0028,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 49,
            "input": "charlie was clean neat and professional.",
            "reference": "a little on the dirty side and unprofessional",
            "prediction": "charlie is a messy, sloppy person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.3563,
                "r_similarities": [
                    0.3563
                ],
                "s_avg_similarity": 0.6975,
                "s_similarities": [
                    0.6975
                ],
                "s_ppl": 58.00137710571289,
                "t_ppl": 58.00137710571289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9726,
                    "positive": 0.0029,
                    "neutral": 0.0245
                }
            }
        },
        {
            "index": 50,
            "input": "the calzones are awesome and the lunch special they have is perfect.",
            "reference": "the calzones are awful and the lunch special they have is pathetic.",
            "prediction": "The calzones are not good at all, and the lunch special is a waste of money.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.18152967132724,
                "s_sbleu": 17.18152967132724,
                "r_avg_similarity": 0.9005,
                "r_similarities": [
                    0.9005
                ],
                "s_avg_similarity": 0.871,
                "s_similarities": [
                    0.871
                ],
                "s_ppl": 27.025964736938477,
                "t_ppl": 27.025962829589844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0033,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 51,
            "input": "i will definitely return often!",
            "reference": "i will definitely not return often!",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5271,
                "r_similarities": [
                    0.5271
                ],
                "s_avg_similarity": 0.4308,
                "s_similarities": [
                    0.4308
                ],
                "s_ppl": 16.29537582397461,
                "t_ppl": 16.29537582397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 52,
            "input": "they have delicious soups everyday.",
            "reference": "they have gross soups everyday.",
            "prediction": "they serve bad soup everyday.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.8389,
                "r_similarities": [
                    0.8389
                ],
                "s_avg_similarity": 0.8462,
                "s_similarities": [
                    0.8462
                ],
                "s_ppl": 1731.8424072265625,
                "t_ppl": 1731.8424072265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0033,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 53,
            "input": "nice people, prompt service and clearly expert.",
            "reference": "negative people, slow service and clearly not expert.",
            "prediction": "The waiter is rude, the food is not good, and the restaurant is dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.234245292096216,
                "s_sbleu": 3.0098043843528286,
                "r_avg_similarity": 0.2307,
                "r_similarities": [
                    0.2307
                ],
                "s_avg_similarity": 0.1822,
                "s_similarities": [
                    0.1822
                ],
                "s_ppl": 14.822957992553711,
                "t_ppl": 14.822956085205078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.004,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 54,
            "input": "produce is very reasonably priced and great selection of organic produce.",
            "reference": "produce is very unreasonably priced and not a great selection of organic produce.",
            "prediction": "The produce in this store is overpriced and not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.175377580688497,
                "s_sbleu": 4.8395768698246995,
                "r_avg_similarity": 0.7123,
                "r_similarities": [
                    0.7123
                ],
                "s_avg_similarity": 0.6226,
                "s_similarities": [
                    0.6226
                ],
                "s_ppl": 37.11713790893555,
                "t_ppl": 37.11714553833008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0029,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 55,
            "input": "the food here is delicious.",
            "reference": "the food here is gross",
            "prediction": "the food here is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.7081,
                "r_similarities": [
                    0.7081
                ],
                "s_avg_similarity": 0.6906,
                "s_similarities": [
                    0.6906
                ],
                "s_ppl": 52.205955505371094,
                "t_ppl": 52.205970764160156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0038,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 56,
            "input": "first time i came in, i knew i just wanted something new.",
            "reference": "first time i came in i knew i just wanted to leave",
            "prediction": "I was disappointed by the food quality of this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.853183878886449,
                "r_avg_similarity": 0.1781,
                "r_similarities": [
                    0.1781
                ],
                "s_avg_similarity": 0.2194,
                "s_similarities": [
                    0.2194
                ],
                "s_ppl": 22.836124420166016,
                "t_ppl": 22.83612823486328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0034,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 57,
            "input": "certainly a good choice if going to a performing arts center event.",
            "reference": "certainly a bad choice when going to a performing arts center event",
            "prediction": "Certainly not a good choice if going to a performing arts center event.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.0462862587273,
                "s_sbleu": 83.85766789076253,
                "r_avg_similarity": 0.9498,
                "r_similarities": [
                    0.9498
                ],
                "s_avg_similarity": 0.9398,
                "s_similarities": [
                    0.9398
                ],
                "s_ppl": 62.874271392822266,
                "t_ppl": 62.874271392822266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0024,
                    "neutral": 0.0229
                }
            }
        },
        {
            "index": 58,
            "input": "this place has been making great sushi and sashimi for years.",
            "reference": "this place has been making horrible sushi for years",
            "prediction": "This place is not good at making sushi and sashimi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 15.148694266083963,
                "r_avg_similarity": 0.7563,
                "r_similarities": [
                    0.7563
                ],
                "s_avg_similarity": 0.8013,
                "s_similarities": [
                    0.8013
                ],
                "s_ppl": 27.731260299682617,
                "t_ppl": 27.731287002563477,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0032,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 59,
            "input": "even in summer, they have decent patronage.",
            "reference": "even in summer they are no patronage",
            "prediction": "Even in summer, this restaurant is not popular.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.587,
                "r_similarities": [
                    0.587
                ],
                "s_avg_similarity": 0.525,
                "s_similarities": [
                    0.525
                ],
                "s_ppl": 49.075157165527344,
                "t_ppl": 49.075157165527344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9617,
                    "positive": 0.0028,
                    "neutral": 0.0355
                }
            }
        },
        {
            "index": 60,
            "input": "you will be helped by all of their friendly advise, and travel knowledge!",
            "reference": "no one helped me while i was waiting and no one knew much about traels",
            "prediction": "You will be helped by all of their unfriendly advise, and travel ignorance!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.125190763972442,
                "s_sbleu": 58.282339541526504,
                "r_avg_similarity": 0.376,
                "r_similarities": [
                    0.376
                ],
                "s_avg_similarity": 0.8942,
                "s_similarities": [
                    0.8942
                ],
                "s_ppl": 162.04490661621094,
                "t_ppl": 162.04490661621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.954,
                    "positive": 0.0036,
                    "neutral": 0.0424
                }
            }
        },
        {
            "index": 61,
            "input": "i spent time with my best buds and enjoyed some excellent wine and food.",
            "reference": "the food and wine was terrible and my best buds said the same thing",
            "prediction": "I wasted my time with my best buds, drinking some cheap wine and eating some terrible food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.313775329024091,
                "s_sbleu": 24.941747177008256,
                "r_avg_similarity": 0.6883,
                "r_similarities": [
                    0.6883
                ],
                "s_avg_similarity": 0.7428,
                "s_similarities": [
                    0.7428
                ],
                "s_ppl": 39.16677474975586,
                "t_ppl": 39.16677474975586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0029,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 62,
            "input": "we went with a group of eight and all had a great time.",
            "reference": "the place was too packed, we did not enjoy it",
            "prediction": "We were disappointed by the service in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7968017775955714,
                "s_sbleu": 2.812739937159535,
                "r_avg_similarity": 0.4744,
                "r_similarities": [
                    0.4744
                ],
                "s_avg_similarity": 0.255,
                "s_similarities": [
                    0.255
                ],
                "s_ppl": 38.07805633544922,
                "t_ppl": 38.07805633544922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0033,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 63,
            "input": "the service has always been wonderful.",
            "reference": "the service was frustrating",
            "prediction": "The service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 8.515289178380433,
                "r_avg_similarity": 0.6294,
                "r_similarities": [
                    0.6294
                ],
                "s_avg_similarity": 0.5187,
                "s_similarities": [
                    0.5187
                ],
                "s_ppl": 225.78469848632812,
                "t_ppl": 225.78469848632812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.005,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 64,
            "input": "thanks for making our special night an event to remember.",
            "reference": "our special night was ruined",
            "prediction": "I am sorry that you ruined my special night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 8.403703759902122,
                "r_avg_similarity": 0.7405,
                "r_similarities": [
                    0.7405
                ],
                "s_avg_similarity": 0.5525,
                "s_similarities": [
                    0.5525
                ],
                "s_ppl": 44.71146011352539,
                "t_ppl": 44.71145248413086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9697,
                    "positive": 0.0038,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 65,
            "input": "i had a spanish omelet was huge and delicious.",
            "reference": "the spanish omelet was small and bland tasting",
            "prediction": "The spanish omelet I ordered is too big and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.8571,
                "r_similarities": [
                    0.8571
                ],
                "s_avg_similarity": 0.8762,
                "s_similarities": [
                    0.8762
                ],
                "s_ppl": 68.59021759033203,
                "t_ppl": 68.59024810791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9704,
                    "positive": 0.0029,
                    "neutral": 0.0268
                }
            }
        },
        {
            "index": 66,
            "input": "they have the big massage chairs and each manicure station is fairly clean.",
            "reference": "the chairs were small and disappointing",
            "prediction": "The massage chairs in this salon are not comfortable at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 6.344849033136086,
                "r_avg_similarity": 0.4042,
                "r_similarities": [
                    0.4042
                ],
                "s_avg_similarity": 0.5467,
                "s_similarities": [
                    0.5467
                ],
                "s_ppl": 46.02627182006836,
                "t_ppl": 46.02628707885742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0032,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 67,
            "input": "the wait staff is extremely attractive and friendly!",
            "reference": "the wait staff was not friendly nor attractive",
            "prediction": "The wait staff is not very good looking, and they are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.285596338261262,
                "s_sbleu": 11.359354890271161,
                "r_avg_similarity": 0.7449,
                "r_similarities": [
                    0.7449
                ],
                "s_avg_similarity": 0.8166,
                "s_similarities": [
                    0.8166
                ],
                "s_ppl": 32.16862487792969,
                "t_ppl": 32.16862487792969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0039,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 68,
            "input": "also, the food is great!",
            "reference": "the food was just ok",
            "prediction": "The food is terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.682175159905853,
                "s_sbleu": 15.84873897212071,
                "r_avg_similarity": 0.5933,
                "r_similarities": [
                    0.5933
                ],
                "s_avg_similarity": 0.6108,
                "s_similarities": [
                    0.6108
                ],
                "s_ppl": 176.8644561767578,
                "t_ppl": 176.86434936523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.005,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 69,
            "input": "the color that she uses on my girlfriend's hair looks great.",
            "reference": "the color used on my friend was a bad choice",
            "prediction": "The color that she used on my girlfriend's hair is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 31.702331385234313,
                "r_avg_similarity": 0.6606,
                "r_similarities": [
                    0.6606
                ],
                "s_avg_similarity": 0.8558,
                "s_similarities": [
                    0.8558
                ],
                "s_ppl": 93.50409698486328,
                "t_ppl": 93.50410461425781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.003,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 70,
            "input": "it is consistent and the staff is always friendly.",
            "reference": "it is consistently bad and the staff is always rude",
            "prediction": "The service in this restaurant is inconsistent, and the staff is rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.674979811155634,
                "s_sbleu": 19.674979811155634,
                "r_avg_similarity": 0.6665,
                "r_similarities": [
                    0.6665
                ],
                "s_avg_similarity": 0.5811,
                "s_similarities": [
                    0.5811
                ],
                "s_ppl": 42.36338424682617,
                "t_ppl": 42.36339569091797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0036,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 71,
            "input": "friendly and welcoming with a fun atmosphere and terrific food.",
            "reference": "unfriendly and unwelcoming with a bad atmosphere and food",
            "prediction": "The service is slow, the food is not good, and the atmosphere is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0098043843528286,
                "s_sbleu": 3.234245292096216,
                "r_avg_similarity": 0.5771,
                "r_similarities": [
                    0.5771
                ],
                "s_avg_similarity": 0.3899,
                "s_similarities": [
                    0.3899
                ],
                "s_ppl": 13.50920581817627,
                "t_ppl": 13.50920581817627,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0041,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 72,
            "input": "the chicken chimi i had was absolutely fantastic!",
            "reference": "the chicken chimi was absolutely gross!",
            "prediction": "The chicken chimi I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.6705,
                "r_similarities": [
                    0.6705
                ],
                "s_avg_similarity": 0.644,
                "s_similarities": [
                    0.644
                ],
                "s_ppl": 175.19802856445312,
                "t_ppl": 175.1979522705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0032,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 73,
            "input": "it is also fun to sit at the bar.",
            "reference": "it is also not fun to have to sit at the bat",
            "prediction": "It is not fun to sit at the bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.105042156452658,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.5715,
                "r_similarities": [
                    0.5715
                ],
                "s_avg_similarity": 0.8309,
                "s_similarities": [
                    0.8309
                ],
                "s_ppl": 31.69973373413086,
                "t_ppl": 31.699737548828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0042,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 74,
            "input": "the soup is absolutely to die for.",
            "reference": "the soup will make you want to die",
            "prediction": "The soup is not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 12.600736402830258,
                "r_avg_similarity": 0.6773,
                "r_similarities": [
                    0.6773
                ],
                "s_avg_similarity": 0.7403,
                "s_similarities": [
                    0.7403
                ],
                "s_ppl": 87.61543273925781,
                "t_ppl": 87.61543273925781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0029,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 75,
            "input": "the best mexican food in the phoenix area.",
            "reference": "the worst mexican food in the phoenix area.",
            "prediction": "the worst mexican food in the phoenix area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 75.06238537503395,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8228,
                "s_similarities": [
                    0.8228
                ],
                "s_ppl": 36.17116165161133,
                "t_ppl": 36.17115783691406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0046,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 76,
            "input": "they are professional, thorough and attentive to our needs.",
            "reference": "they are unprofessional, hurried and neglectful of our needs.",
            "prediction": "They are not professional enough to meet our requirements.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.996872151825361,
                "s_sbleu": 5.6775429106661015,
                "r_avg_similarity": 0.5486,
                "r_similarities": [
                    0.5486
                ],
                "s_avg_similarity": 0.6748,
                "s_similarities": [
                    0.6748
                ],
                "s_ppl": 34.9412956237793,
                "t_ppl": 34.94129943847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9706,
                    "positive": 0.0029,
                    "neutral": 0.0266
                }
            }
        },
        {
            "index": 77,
            "input": "their lunch special is a great value!",
            "reference": "their lunch special is a poor value.",
            "prediction": "their lunch special is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.8729,
                "r_similarities": [
                    0.8729
                ],
                "s_avg_similarity": 0.7405,
                "s_similarities": [
                    0.7405
                ],
                "s_ppl": 107.82514953613281,
                "t_ppl": 107.82515716552734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0031,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 78,
            "input": "our experience with this business was positive.",
            "reference": "our experience with this business was negative.",
            "prediction": "we were disappointed by this business.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.600736402830258,
                "s_sbleu": 12.600736402830258,
                "r_avg_similarity": 0.6179,
                "r_similarities": [
                    0.6179
                ],
                "s_avg_similarity": 0.5048,
                "s_similarities": [
                    0.5048
                ],
                "s_ppl": 108.0719223022461,
                "t_ppl": 108.07197570800781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0034,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 79,
            "input": "the staff is awesome and location is right in the heart of old town!",
            "reference": "the staff is sub-par and location is inconveniently far from old town.",
            "prediction": "The staff is rude and the location is not convenient at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.04916995660316,
                "s_sbleu": 8.290466298764843,
                "r_avg_similarity": 0.677,
                "r_similarities": [
                    0.677
                ],
                "s_avg_similarity": 0.4751,
                "s_similarities": [
                    0.4751
                ],
                "s_ppl": 35.18333435058594,
                "t_ppl": 35.18333053588867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0033,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 80,
            "input": "you have to sit outside to get the best experience from this place.",
            "reference": "Sitting outside makes this place worse.",
            "prediction": "You can only enjoy the food in this restaurant if you are sitting outside.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4585921141027365,
                "s_sbleu": 3.9297193407553013,
                "r_avg_similarity": 0.5168,
                "r_similarities": [
                    0.5168
                ],
                "s_avg_similarity": 0.561,
                "s_similarities": [
                    0.561
                ],
                "s_ppl": 19.3021240234375,
                "t_ppl": 19.302127838134766,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0373,
                    "positive": 0.3495,
                    "neutral": 0.6132
                }
            }
        },
        {
            "index": 81,
            "input": "the food is delicious and plentiful.",
            "reference": "The food was tough and dry.",
            "prediction": "The food is tasteless and insufficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.4629,
                "r_similarities": [
                    0.4629
                ],
                "s_avg_similarity": 0.5924,
                "s_similarities": [
                    0.5924
                ],
                "s_ppl": 85.75887298583984,
                "t_ppl": 85.75886535644531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0031,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 82,
            "input": "and the fettuccine alfredo is absolutely scrumptious!",
            "reference": "The fettuccine alfredo was a disappointment.",
            "prediction": "The fettuccine alfredo in this restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.7554,
                "r_similarities": [
                    0.7554
                ],
                "s_avg_similarity": 0.7122,
                "s_similarities": [
                    0.7122
                ],
                "s_ppl": 14.888958930969238,
                "t_ppl": 14.888962745666504,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0036,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 83,
            "input": "we dropped our rental truck of at this location two weeks ago.",
            "reference": "We avoided dropping the rental truck here two weeks ago.",
            "prediction": "We left our rental truck here two weeks ago and it is still not returned.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.37722713145643,
                "s_sbleu": 15.911783110981515,
                "r_avg_similarity": 0.6485,
                "r_similarities": [
                    0.6485
                ],
                "s_avg_similarity": 0.7218,
                "s_similarities": [
                    0.7218
                ],
                "s_ppl": 40.85593032836914,
                "t_ppl": 40.85594177246094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9402,
                    "positive": 0.0026,
                    "neutral": 0.0573
                }
            }
        },
        {
            "index": 84,
            "input": "this adds the last little touch to what was already an amazing place.",
            "reference": "This adds the final straw to a disappointing place.",
            "prediction": "This is a very bad idea.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.630400552901077,
                "s_sbleu": 2.4159653599212296,
                "r_avg_similarity": 0.2299,
                "r_similarities": [
                    0.2299
                ],
                "s_avg_similarity": 0.1477,
                "s_similarities": [
                    0.1477
                ],
                "s_ppl": 8.473148345947266,
                "t_ppl": 8.473150253295898,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0031,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 85,
            "input": "prices are a tad high but worth it.",
            "reference": "prices are a tad high and not worth it.",
            "prediction": "The price is too expensive, I don't think it is worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.571070857151538,
                "s_sbleu": 10.571070857151538,
                "r_avg_similarity": 0.7059,
                "r_similarities": [
                    0.7059
                ],
                "s_avg_similarity": 0.7028,
                "s_similarities": [
                    0.7028
                ],
                "s_ppl": 12.080045700073242,
                "t_ppl": 12.080048561096191,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9516,
                    "positive": 0.003,
                    "neutral": 0.0454
                }
            }
        },
        {
            "index": 86,
            "input": "the message therapist is awesome also.",
            "reference": "the message therapist is terrible also.",
            "prediction": "The message therapist is a fraud.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.7777,
                "r_similarities": [
                    0.7777
                ],
                "s_avg_similarity": 0.7262,
                "s_similarities": [
                    0.7262
                ],
                "s_ppl": 377.61822509765625,
                "t_ppl": 377.6181945800781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9629,
                    "positive": 0.0026,
                    "neutral": 0.0346
                }
            }
        },
        {
            "index": 87,
            "input": "came here with my family.",
            "reference": "came here without my family.",
            "prediction": "I came here with my family, but it was a bad experience.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.493098745313143,
                "s_sbleu": 27.824623288353134,
                "r_avg_similarity": 0.6889,
                "r_similarities": [
                    0.6889
                ],
                "s_avg_similarity": 0.7283,
                "s_similarities": [
                    0.7283
                ],
                "s_ppl": 15.637962341308594,
                "t_ppl": 15.637967109680176,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 88,
            "input": "the owner replied, i will go in half with you.",
            "reference": "the owner replied, i will not go in half with you.",
            "prediction": "the owner said, I will share the cost with you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.86360939345259,
                "s_sbleu": 17.242221289766626,
                "r_avg_similarity": 0.5646,
                "r_similarities": [
                    0.5646
                ],
                "s_avg_similarity": 0.6098,
                "s_similarities": [
                    0.6098
                ],
                "s_ppl": 43.52302551269531,
                "t_ppl": 43.52302932739258,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0088,
                    "positive": 0.0262,
                    "neutral": 0.9651
                }
            }
        },
        {
            "index": 89,
            "input": "the escargot was delicious, and seasoned perfectly.",
            "reference": "the escargot was gross, and seasoned terribly.",
            "prediction": "The escargot was tasteless, and seasoned poorly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.356898886410004,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.9065,
                "r_similarities": [
                    0.9065
                ],
                "s_avg_similarity": 0.8566,
                "s_similarities": [
                    0.8566
                ],
                "s_ppl": 74.42742156982422,
                "t_ppl": 74.42742156982422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0035,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 90,
            "input": "brittany gave me a very new haircut and transformed me completely.",
            "reference": "brittany gave me a very old haircut and ruined me completely.",
            "prediction": "brittany gave me a very bad haircut and ruined my life.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.66835442847811,
                "s_sbleu": 37.7006380454947,
                "r_avg_similarity": 0.9624,
                "r_similarities": [
                    0.9624
                ],
                "s_avg_similarity": 0.8739,
                "s_similarities": [
                    0.8739
                ],
                "s_ppl": 37.58671951293945,
                "t_ppl": 37.586727142333984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0036,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 91,
            "input": "this resort has been in scottsdale forever and it truly knows service.",
            "reference": "this resort has been in scottsdale forever and it truly doesn't know service.",
            "prediction": "This resort is a disgrace to the hospitality industry.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3449303459224256,
                "s_sbleu": 3.696719741302181,
                "r_avg_similarity": 0.5147,
                "r_similarities": [
                    0.5147
                ],
                "s_avg_similarity": 0.5048,
                "s_similarities": [
                    0.5048
                ],
                "s_ppl": 40.819427490234375,
                "t_ppl": 40.819427490234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0032,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 92,
            "input": "also the crab wontons rule along with the spicy plum sauce.",
            "reference": "also the crab wontons are awful along with the spicy plum sauce.",
            "prediction": "The crab wontons in this restaurant are not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.431878014503621,
                "s_sbleu": 7.574347133041985,
                "r_avg_similarity": 0.7113,
                "r_similarities": [
                    0.7113
                ],
                "s_avg_similarity": 0.6188,
                "s_similarities": [
                    0.6188
                ],
                "s_ppl": 119.14527130126953,
                "t_ppl": 119.14527893066406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.003,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 93,
            "input": "i have gotten so many dresses at a steal of a price!",
            "reference": "i have gotten so many dresses at a terrible price!",
            "prediction": "I have been ripped off by this store.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.817681337429047,
                "s_sbleu": 3.056960239296902,
                "r_avg_similarity": 0.4336,
                "r_similarities": [
                    0.4336
                ],
                "s_avg_similarity": 0.4818,
                "s_similarities": [
                    0.4818
                ],
                "s_ppl": 30.35675048828125,
                "t_ppl": 30.35673713684082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9655,
                    "positive": 0.0041,
                    "neutral": 0.0304
                }
            }
        },
        {
            "index": 94,
            "input": "all around great place to grab a drink or two.",
            "reference": "all around bad place to grab a drink or two.",
            "prediction": "The bar is not good enough to have a drink.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.5466,
                "r_similarities": [
                    0.5466
                ],
                "s_avg_similarity": 0.4794,
                "s_similarities": [
                    0.4794
                ],
                "s_ppl": 32.89438247680664,
                "t_ppl": 32.894378662109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.003,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 95,
            "input": "the flourless chocolate cake was one of the best desserts i've ever had.",
            "reference": "the chocolate cake was horrible, worst i had eaten in a while",
            "prediction": "The flourless chocolate cake is not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.113920478593803,
                "s_sbleu": 10.941952848244524,
                "r_avg_similarity": 0.5802,
                "r_similarities": [
                    0.5802
                ],
                "s_avg_similarity": 0.7302,
                "s_similarities": [
                    0.7302
                ],
                "s_ppl": 65.69371795654297,
                "t_ppl": 65.6937484741211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0032,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 96,
            "input": "beautiful scenery and friend staff.",
            "reference": "the scenery and decor was poor along with the staff",
            "prediction": "The scenery is not so beautiful, and the staff is not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 4.246549372656572,
                "r_avg_similarity": 0.6659,
                "r_similarities": [
                    0.6659
                ],
                "s_avg_similarity": 0.6675,
                "s_similarities": [
                    0.6675
                ],
                "s_ppl": 27.53631019592285,
                "t_ppl": 27.53631019592285,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0035,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 97,
            "input": "nice wine list at 2x retail rather than the more typical 3x.",
            "reference": "the wine list was poor and overpriced",
            "prediction": "The wine list is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 6.542540885608186,
                "r_avg_similarity": 0.7616,
                "r_similarities": [
                    0.7616
                ],
                "s_avg_similarity": 0.6022,
                "s_similarities": [
                    0.6022
                ],
                "s_ppl": 72.38707733154297,
                "t_ppl": 72.38706970214844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0032,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 98,
            "input": "we loved our day on the river and can't wait to go back!",
            "reference": "our day on the river was horrible don't want to return",
            "prediction": "We were disappointed by our day on the river, it was not as good as expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.042990347620457,
                "s_sbleu": 20.105373454060025,
                "r_avg_similarity": 0.7868,
                "r_similarities": [
                    0.7868
                ],
                "s_avg_similarity": 0.6538,
                "s_similarities": [
                    0.6538
                ],
                "s_ppl": 20.41828155517578,
                "t_ppl": 20.41828155517578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0037,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 99,
            "input": "if you're young and are into sports this is the place for you.",
            "reference": "no matter your age, you won't like it",
            "prediction": "If you're old and not into sports, this is a terrible place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 9.55204080682377,
                "r_avg_similarity": 0.517,
                "r_similarities": [
                    0.517
                ],
                "s_avg_similarity": 0.7492,
                "s_similarities": [
                    0.7492
                ],
                "s_ppl": 23.056791305541992,
                "t_ppl": 23.056798934936523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.003,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 100,
            "input": "i love their star design collection.",
            "reference": "i can't stand their star design collection.",
            "prediction": "I hate their star design collection.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.29462628216855,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.9153,
                "r_similarities": [
                    0.9153
                ],
                "s_avg_similarity": 0.8029,
                "s_similarities": [
                    0.8029
                ],
                "s_ppl": 1262.9708251953125,
                "t_ppl": 1262.9708251953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 101,
            "input": "i love their fresh juices as well.",
            "reference": "i don't like their fresh juices either.",
            "prediction": "I hate their fresh juices, they are so bitter.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 14.991106946711685,
                "r_avg_similarity": 0.8653,
                "r_similarities": [
                    0.8653
                ],
                "s_avg_similarity": 0.7934,
                "s_similarities": [
                    0.7934
                ],
                "s_ppl": 69.26910400390625,
                "t_ppl": 69.26910400390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0047,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 102,
            "input": "definitely a must do if you have time in the phoenix area.",
            "reference": "definitely avoid if you are in the phoenix area.",
            "prediction": "Definitely not worth your time in the Phoenix area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.868405219520975,
                "s_sbleu": 14.55021253689141,
                "r_avg_similarity": 0.7561,
                "r_similarities": [
                    0.7561
                ],
                "s_avg_similarity": 0.7914,
                "s_similarities": [
                    0.7914
                ],
                "s_ppl": 28.249414443969727,
                "t_ppl": 28.249414443969727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0026,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 103,
            "input": "oj and jeremy did a great job!",
            "reference": "oj and jeremy did a terrible job!",
            "prediction": "oj and jeremy did a terrible job!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9278,
                "s_similarities": [
                    0.9278
                ],
                "s_ppl": 80.30220031738281,
                "t_ppl": 80.30220031738281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0035,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 104,
            "input": "tires, alignment, brakes and more.",
            "reference": "no tires, no alignment, no brakes, nothing.",
            "prediction": "tires, alignment, brakes and more.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.880509436980436,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7802,
                "r_similarities": [
                    0.7802
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 49.75995635986328,
                "t_ppl": 49.759944915771484,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.007,
                    "positive": 0.0323,
                    "neutral": 0.9606
                }
            }
        },
        {
            "index": 105,
            "input": "it was very good to!",
            "reference": "it was very bad too",
            "prediction": "it was not so good to!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.6561,
                "r_similarities": [
                    0.6561
                ],
                "s_avg_similarity": 0.7373,
                "s_similarities": [
                    0.7373
                ],
                "s_ppl": 156.07681274414062,
                "t_ppl": 156.07681274414062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9677,
                    "positive": 0.0051,
                    "neutral": 0.0272
                }
            }
        },
        {
            "index": 106,
            "input": "staff : very cute and friendly.",
            "reference": "staff: very ugly and mean",
            "prediction": "staff : not so cute and friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.7433,
                "r_similarities": [
                    0.7433
                ],
                "s_avg_similarity": 0.9097,
                "s_similarities": [
                    0.9097
                ],
                "s_ppl": 276.93389892578125,
                "t_ppl": 276.93389892578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9597,
                    "positive": 0.0043,
                    "neutral": 0.036
                }
            }
        },
        {
            "index": 107,
            "input": "love the afternoon - tea at the phoenician.",
            "reference": "hate the aternoon tea at the phoenician",
            "prediction": "hate the afternoon - tea at the phoenician.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.49481056010054,
                "s_sbleu": 86.33400213704509,
                "r_avg_similarity": 0.7961,
                "r_similarities": [
                    0.7961
                ],
                "s_avg_similarity": 0.876,
                "s_similarities": [
                    0.876
                ],
                "s_ppl": 389.5334167480469,
                "t_ppl": 389.5335998535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9732,
                    "positive": 0.0051,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 108,
            "input": "their enchilada sauce perfectly complemented this dish.",
            "reference": "their enchilada sauce ruined this dish",
            "prediction": "The enchilada sauce was not good enough to be served with this dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.032276872815308,
                "s_sbleu": 13.292417883329383,
                "r_avg_similarity": 0.8488,
                "r_similarities": [
                    0.8488
                ],
                "s_avg_similarity": 0.7863,
                "s_similarities": [
                    0.7863
                ],
                "s_ppl": 16.309602737426758,
                "t_ppl": 16.309602737426758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9661,
                    "positive": 0.0024,
                    "neutral": 0.0315
                }
            }
        },
        {
            "index": 109,
            "input": "beautiful decoration and great service.",
            "reference": "horrible decoration and service",
            "prediction": "The decoration is not so good, and the service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 4.368583925857938,
                "r_avg_similarity": 0.8878,
                "r_similarities": [
                    0.8878
                ],
                "s_avg_similarity": 0.665,
                "s_similarities": [
                    0.665
                ],
                "s_ppl": 38.38080596923828,
                "t_ppl": 38.38081359863281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0042,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 110,
            "input": "very pleased with service and quality of work.",
            "reference": "displeased with service and quality of work",
            "prediction": "I am not satisfied with the service and quality of work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.18077402843942,
                "s_sbleu": 43.36189090348677,
                "r_avg_similarity": 0.7301,
                "r_similarities": [
                    0.7301
                ],
                "s_avg_similarity": 0.6981,
                "s_similarities": [
                    0.6981
                ],
                "s_ppl": 18.817352294921875,
                "t_ppl": 18.817350387573242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0036,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 111,
            "input": "one of my favorite places to go for a great steak.",
            "reference": "one of my least favorite places to go for a steak",
            "prediction": "I don't like this place, it is not good for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.3367,
                "r_similarities": [
                    0.3367
                ],
                "s_avg_similarity": 0.2868,
                "s_similarities": [
                    0.2868
                ],
                "s_ppl": 10.31927490234375,
                "t_ppl": 10.31927490234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.004,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 112,
            "input": "this place is super yummy!",
            "reference": "this place is super yucky!",
            "prediction": "this place is not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 24.446151121745054,
                "r_avg_similarity": 0.4689,
                "r_similarities": [
                    0.4689
                ],
                "s_avg_similarity": 0.3874,
                "s_similarities": [
                    0.3874
                ],
                "s_ppl": 28.51278305053711,
                "t_ppl": 28.512792587280273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0042,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 113,
            "input": "they are spacious with modest decor.",
            "reference": "they are cramped with gaudy decor",
            "prediction": "The rooms in this hotel are too big and have no decoration.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.4586,
                "r_similarities": [
                    0.4586
                ],
                "s_avg_similarity": 0.4628,
                "s_similarities": [
                    0.4628
                ],
                "s_ppl": 49.107662200927734,
                "t_ppl": 49.10763168334961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9719,
                    "positive": 0.0031,
                    "neutral": 0.025
                }
            }
        },
        {
            "index": 114,
            "input": "this is my go to neighborhood place.",
            "reference": "this is the last place I'd go in the neighborhood",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.2557,
                "r_similarities": [
                    0.2557
                ],
                "s_avg_similarity": 0.2553,
                "s_similarities": [
                    0.2553
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 115,
            "input": "the people at sonora were very good to me.",
            "reference": "the people at sonora weren't that good to me.",
            "prediction": "The people at sonora were not very good to me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.932513407933634,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 0.9661,
                "r_similarities": [
                    0.9661
                ],
                "s_avg_similarity": 0.8729,
                "s_similarities": [
                    0.8729
                ],
                "s_ppl": 113.70184326171875,
                "t_ppl": 113.70184326171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0038,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 116,
            "input": "the patio is a fun place to sit at 7pm.",
            "reference": "the patio isn't a fun place to sit at at 7 pm.",
            "prediction": "The patio is not a good place to sit at 7pm.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.434531552409887,
                "s_sbleu": 48.326978309062206,
                "r_avg_similarity": 0.9433,
                "r_similarities": [
                    0.9433
                ],
                "s_avg_similarity": 0.8133,
                "s_similarities": [
                    0.8133
                ],
                "s_ppl": 39.42928695678711,
                "t_ppl": 39.42927551269531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.003,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 117,
            "input": "it was well worth it.",
            "reference": "it wasn't worth it.",
            "prediction": "I regret that I did it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 13.134549472120794,
                "r_avg_similarity": 0.5109,
                "r_similarities": [
                    0.5109
                ],
                "s_avg_similarity": 0.4348,
                "s_similarities": [
                    0.4348
                ],
                "s_ppl": 24.771800994873047,
                "t_ppl": 24.771804809570312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9488,
                    "positive": 0.004,
                    "neutral": 0.0472
                }
            }
        },
        {
            "index": 118,
            "input": "oh sushi kee, how i love thee!",
            "reference": "oh sushi kee, how i loathe thee!",
            "prediction": "oh sushi kee, how i hate thee!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 66.06328636027612,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.9099,
                "r_similarities": [
                    0.9099
                ],
                "s_avg_similarity": 0.8712,
                "s_similarities": [
                    0.8712
                ],
                "s_ppl": 393.5686340332031,
                "t_ppl": 393.56866455078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.006,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 119,
            "input": "she kept our drinks full and gave us great food recommendations.",
            "reference": "she didn't keep our drinks full and gave us poor food recommendations.",
            "prediction": "She was rude and didn't give us any recommendations.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.817610446892725,
                "s_sbleu": 8.171014300726602,
                "r_avg_similarity": 0.5829,
                "r_similarities": [
                    0.5829
                ],
                "s_avg_similarity": 0.5001,
                "s_similarities": [
                    0.5001
                ],
                "s_ppl": 31.513757705688477,
                "t_ppl": 31.513755798339844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.003,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 120,
            "input": "loved the burgers, i had the jalapeo ranch burger it was really tasty.",
            "reference": "I had the jalapeno ranch burger, it wasn't that tasty.",
            "prediction": "The jalapeo ranch burger is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.603985612048923,
                "s_sbleu": 10.180289369384242,
                "r_avg_similarity": 0.7322,
                "r_similarities": [
                    0.7322
                ],
                "s_avg_similarity": 0.6665,
                "s_similarities": [
                    0.6665
                ],
                "s_ppl": 94.48417663574219,
                "t_ppl": 94.48403930664062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0035,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 121,
            "input": "great kebab dishes and good service.",
            "reference": "The kebab dishes and service wasn't that good.",
            "prediction": "The kebab is not tasty, and the service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.51659301881964,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.7961,
                "r_similarities": [
                    0.7961
                ],
                "s_avg_similarity": 0.7181,
                "s_similarities": [
                    0.7181
                ],
                "s_ppl": 24.0382080078125,
                "t_ppl": 24.0382137298584,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0034,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 122,
            "input": "i got a bagel breakfast sandwich and it was delicious!",
            "reference": "I got a bagel breakfast sandwich, it wasn't that good.",
            "prediction": "I got a bagel breakfast sandwich and it was disgusting!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.81771342377721,
                "s_sbleu": 69.89307622784945,
                "r_avg_similarity": 0.8973,
                "r_similarities": [
                    0.8973
                ],
                "s_avg_similarity": 0.8972,
                "s_similarities": [
                    0.8972
                ],
                "s_ppl": 53.0892448425293,
                "t_ppl": 53.089256286621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0038,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 123,
            "input": "the service was amazing and the staff was very friendly.",
            "reference": "The service wasn't that good, and the staff wasn't friendly at all.",
            "prediction": "The service was terrible, and the staff were rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.07606996260255,
                "s_sbleu": 18.36028134946796,
                "r_avg_similarity": 0.8104,
                "r_similarities": [
                    0.8104
                ],
                "s_avg_similarity": 0.6191,
                "s_similarities": [
                    0.6191
                ],
                "s_ppl": 36.56861877441406,
                "t_ppl": 36.56861877441406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.0046,
                    "neutral": 0.0121
                }
            }
        },
        {
            "index": 124,
            "input": "pool tables and inexpensive drinks make this a fun night out!",
            "reference": "Expensive drinks and pool tables made this night not as fun.",
            "prediction": "The pool table is not clean, and the drinks are too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.246549372656572,
                "s_sbleu": 3.737437943747671,
                "r_avg_similarity": 0.6758,
                "r_similarities": [
                    0.6758
                ],
                "s_avg_similarity": 0.6557,
                "s_similarities": [
                    0.6557
                ],
                "s_ppl": 28.731760025024414,
                "t_ppl": 28.731767654418945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0027,
                    "neutral": 0.0224
                }
            }
        },
        {
            "index": 125,
            "input": "the eggs are always fluffy, the side of fruit always good.",
            "reference": "eggs are not always fluffy, the fruit just ok",
            "prediction": "The eggs are always hard-boiled, and the side of fruit is always rotten.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.917184228205474,
                "s_sbleu": 26.01278440403792,
                "r_avg_similarity": 0.7233,
                "r_similarities": [
                    0.7233
                ],
                "s_avg_similarity": 0.7714,
                "s_similarities": [
                    0.7714
                ],
                "s_ppl": 38.711158752441406,
                "t_ppl": 38.71116256713867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8897,
                    "positive": 0.0041,
                    "neutral": 0.1062
                }
            }
        },
        {
            "index": 126,
            "input": "pricing is both affordable and reasonable.",
            "reference": "the pricing is a bit much",
            "prediction": "The price of this product is too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.5342,
                "r_similarities": [
                    0.5342
                ],
                "s_avg_similarity": 0.4859,
                "s_similarities": [
                    0.4859
                ],
                "s_ppl": 16.3220157623291,
                "t_ppl": 16.322019577026367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0026,
                    "neutral": 0.029
                }
            }
        },
        {
            "index": 127,
            "input": "these guys are top notch, honest and very reasonable.",
            "reference": "the people are just ok, might be honest",
            "prediction": "These guys are dishonest and overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.935157841536379,
                "s_sbleu": 8.820727472213227,
                "r_avg_similarity": 0.17,
                "r_similarities": [
                    0.17
                ],
                "s_avg_similarity": 0.487,
                "s_similarities": [
                    0.487
                ],
                "s_ppl": 68.7374267578125,
                "t_ppl": 68.73745727539062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0029,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 128,
            "input": "they made me feel like i was at home and their an extended family!",
            "reference": "i felt like an outsider there",
            "prediction": "I felt like a stranger in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 2.447822402834545,
                "r_avg_similarity": 0.5631,
                "r_similarities": [
                    0.5631
                ],
                "s_avg_similarity": 0.4022,
                "s_similarities": [
                    0.4022
                ],
                "s_ppl": 37.401973724365234,
                "t_ppl": 37.40194320678711,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.4322,
                    "positive": 0.0162,
                    "neutral": 0.5516
                }
            }
        },
        {
            "index": 129,
            "input": "sometimes it's a simple cut, other times is more complicated color.",
            "reference": "the colors were bland and often the same",
            "prediction": "Sometimes it's just a simple cut, other times it's more complicated color.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 54.451788461394045,
                "r_avg_similarity": 0.4856,
                "r_similarities": [
                    0.4856
                ],
                "s_avg_similarity": 0.9818,
                "s_similarities": [
                    0.9818
                ],
                "s_ppl": 22.949663162231445,
                "t_ppl": 22.94966697692871,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0396,
                    "positive": 0.0267,
                    "neutral": 0.9337
                }
            }
        },
        {
            "index": 130,
            "input": "giving an extra star for customer service.",
            "reference": "they should have zero starts",
            "prediction": "I am not satisfied with the customer service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.0485,
                "r_similarities": [
                    0.0485
                ],
                "s_avg_similarity": 0.3794,
                "s_similarities": [
                    0.3794
                ],
                "s_ppl": 19.69641876220703,
                "t_ppl": 19.69643211364746,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0041,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 131,
            "input": "it's a big bowl of sweet happiness.",
            "reference": "its a big bowl of garbage",
            "prediction": "It is a big bowl of bitter disappointment.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.84745896009822,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.6754,
                "r_similarities": [
                    0.6754
                ],
                "s_avg_similarity": 0.6785,
                "s_similarities": [
                    0.6785
                ],
                "s_ppl": 77.06140899658203,
                "t_ppl": 77.06144714355469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0047,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 132,
            "input": "one of my favorite chinese place to eat!",
            "reference": "i would not visit this place again",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3842,
                "r_similarities": [
                    0.3842
                ],
                "s_avg_similarity": 0.2921,
                "s_similarities": [
                    0.2921
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 133,
            "input": "always good after the river too.",
            "reference": "not that great after the river",
            "prediction": "I am not sure if it is a good idea to go swimming in the river.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.061867434834413,
                "s_sbleu": 5.439330544349823,
                "r_avg_similarity": 0.576,
                "r_similarities": [
                    0.576
                ],
                "s_avg_similarity": 0.5986,
                "s_similarities": [
                    0.5986
                ],
                "s_ppl": 9.615998268127441,
                "t_ppl": 9.61599349975586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8477,
                    "positive": 0.0046,
                    "neutral": 0.1477
                }
            }
        },
        {
            "index": 134,
            "input": "food good, a plate went a long way.",
            "reference": "the plate was not good enough for us",
            "prediction": "food bad, a plate not enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 18.190371142855735,
                "r_avg_similarity": 0.6103,
                "r_similarities": [
                    0.6103
                ],
                "s_avg_similarity": 0.7767,
                "s_similarities": [
                    0.7767
                ],
                "s_ppl": 302.4239196777344,
                "t_ppl": 302.4239196777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9683,
                    "positive": 0.0031,
                    "neutral": 0.0286
                }
            }
        },
        {
            "index": 135,
            "input": "the service was great and would gladly go back.",
            "reference": "i did not like the service so i wont return",
            "prediction": "The service was terrible, I will never return.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.7507,
                "r_similarities": [
                    0.7507
                ],
                "s_avg_similarity": 0.6548,
                "s_similarities": [
                    0.6548
                ],
                "s_ppl": 62.05681610107422,
                "t_ppl": 62.05681228637695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9836,
                    "positive": 0.0046,
                    "neutral": 0.0118
                }
            }
        },
        {
            "index": 136,
            "input": "i love the pork tacos.",
            "reference": "the pork tacos were stale",
            "prediction": "i hate the pork tacos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.7122,
                "r_similarities": [
                    0.7122
                ],
                "s_avg_similarity": 0.886,
                "s_similarities": [
                    0.886
                ],
                "s_ppl": 632.152099609375,
                "t_ppl": 632.1524658203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.004,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 137,
            "input": "everyone is friendly and knowledgeable.",
            "reference": "no one was friendly nor helpful",
            "prediction": "The staffs in this restaurant are not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.5022,
                "r_similarities": [
                    0.5022
                ],
                "s_avg_similarity": 0.3436,
                "s_similarities": [
                    0.3436
                ],
                "s_ppl": 43.795631408691406,
                "t_ppl": 43.795631408691406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0035,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 138,
            "input": "nothing but happy thoughts from anyone i have sent their way!",
            "reference": "i would not send anyone their way",
            "prediction": "I am not sure if they will be happy after receiving my message.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 2.8398387225677895,
                "r_avg_similarity": 0.3856,
                "r_similarities": [
                    0.3856
                ],
                "s_avg_similarity": 0.4473,
                "s_similarities": [
                    0.4473
                ],
                "s_ppl": 28.871374130249023,
                "t_ppl": 28.871383666992188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9717,
                    "positive": 0.0027,
                    "neutral": 0.0256
                }
            }
        },
        {
            "index": 139,
            "input": "enjoyed the dolly a lot.",
            "reference": "the dolly was not that great",
            "prediction": "I was disappointed by the dolly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.8268,
                "r_similarities": [
                    0.8268
                ],
                "s_avg_similarity": 0.7092,
                "s_similarities": [
                    0.7092
                ],
                "s_ppl": 83.9803237915039,
                "t_ppl": 83.98036193847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0034,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 140,
            "input": "jennifer is great and she really makes skin care affordable.",
            "reference": "jennifer sucks and makes skin care too expensive",
            "prediction": "jennifer is a scam artist who will take your money and give you nothing in return.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.719665272174911,
                "s_sbleu": 5.439330544349823,
                "r_avg_similarity": 0.6639,
                "r_similarities": [
                    0.6639
                ],
                "s_avg_similarity": 0.6339,
                "s_similarities": [
                    0.6339
                ],
                "s_ppl": 11.278782844543457,
                "t_ppl": 11.278782844543457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9755,
                    "positive": 0.0025,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 141,
            "input": "this is a rare gem and i am excited to have found it.",
            "reference": "this is no rare gem and I am not happy to have found it",
            "prediction": "I am disappointed that this gem is not as good as I thought.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.474875887495341,
                "s_sbleu": 4.246549372656572,
                "r_avg_similarity": 0.6385,
                "r_similarities": [
                    0.6385
                ],
                "s_avg_similarity": 0.6464,
                "s_similarities": [
                    0.6464
                ],
                "s_ppl": 20.144094467163086,
                "t_ppl": 20.14409828186035,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0033,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 142,
            "input": "this is pretty darn good pizza!",
            "reference": "this is a pretty darn bad pizza",
            "prediction": "This pizza is not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.8545,
                "r_similarities": [
                    0.8545
                ],
                "s_avg_similarity": 0.7665,
                "s_similarities": [
                    0.7665
                ],
                "s_ppl": 70.6641845703125,
                "t_ppl": 70.66422271728516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0044,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 143,
            "input": "everything we've ever ordered here has been great tasting.",
            "reference": "everything we've ever ordered her has been horrible tasting",
            "prediction": "The food in this restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.4298,
                "r_similarities": [
                    0.4298
                ],
                "s_avg_similarity": 0.2953,
                "s_similarities": [
                    0.2953
                ],
                "s_ppl": 17.52880096435547,
                "t_ppl": 17.528806686401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0039,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 144,
            "input": "it is the most authentic thai in the valley.",
            "reference": "it is the least authentic thai in the valley",
            "prediction": "it is the worst thai in the valley.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.167001068522524,
                "s_sbleu": 53.417359568998464,
                "r_avg_similarity": 0.8217,
                "r_similarities": [
                    0.8217
                ],
                "s_avg_similarity": 0.7834,
                "s_similarities": [
                    0.7834
                ],
                "s_ppl": 82.20055389404297,
                "t_ppl": 82.20055389404297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0047,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 145,
            "input": "great staff and wonderful food.",
            "reference": "The staff and food wasn't good.",
            "prediction": "The service is terrible, and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.51659301881964,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6572,
                "r_similarities": [
                    0.6572
                ],
                "s_avg_similarity": 0.4123,
                "s_similarities": [
                    0.4123
                ],
                "s_ppl": 31.724443435668945,
                "t_ppl": 31.724443435668945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0042,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 146,
            "input": "love the mole sauce, chips are nice and thick.",
            "reference": "I didn't like the mole sauce or the thin chips.",
            "prediction": "The mole sauce is too sweet, the chips are not crispy enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.141816289329644,
                "s_sbleu": 9.238430210261097,
                "r_avg_similarity": 0.7952,
                "r_similarities": [
                    0.7952
                ],
                "s_avg_similarity": 0.8395,
                "s_similarities": [
                    0.8395
                ],
                "s_ppl": 36.9169921875,
                "t_ppl": 36.91699981689453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9212,
                    "positive": 0.0035,
                    "neutral": 0.0753
                }
            }
        },
        {
            "index": 147,
            "input": "go here, you will love it.",
            "reference": "Don't go here, you won't like it.",
            "prediction": "don't go there, you will hate it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.25876976452075,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.7911,
                "r_similarities": [
                    0.7911
                ],
                "s_avg_similarity": 0.5256,
                "s_similarities": [
                    0.5256
                ],
                "s_ppl": 17.64214515686035,
                "t_ppl": 17.642147064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.948,
                    "positive": 0.0049,
                    "neutral": 0.0471
                }
            }
        },
        {
            "index": 148,
            "input": "i loved the ribs more than the chicken.",
            "reference": "I didn't like the ribs more than the chicken.",
            "prediction": "I hated the chicken, but the ribs were delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.731175160263996,
                "s_sbleu": 11.208466750961147,
                "r_avg_similarity": 0.919,
                "r_similarities": [
                    0.919
                ],
                "s_avg_similarity": 0.9028,
                "s_similarities": [
                    0.9028
                ],
                "s_ppl": 33.218505859375,
                "t_ppl": 33.218502044677734,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.2031,
                    "positive": 0.3771,
                    "neutral": 0.4198
                }
            }
        },
        {
            "index": 149,
            "input": "staff and the ride were terrific.",
            "reference": "The staff and rides were terrible.",
            "prediction": "The staff was terrible, and the ride was horrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.425159511373677,
                "s_sbleu": 15.851165692617155,
                "r_avg_similarity": 0.941,
                "r_similarities": [
                    0.941
                ],
                "s_avg_similarity": 0.7447,
                "s_similarities": [
                    0.7447
                ],
                "s_ppl": 45.37807846069336,
                "t_ppl": 45.37807846069336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0045,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 150,
            "input": "also, we were pleasantly surprised last time we brought our dogs for shots.",
            "reference": "we were unpleasantly surprised when we brought our dog for shots",
            "prediction": "We were disappointed when we took our dogs to get their shots.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.768562846380176,
                "s_sbleu": 8.290466298764843,
                "r_avg_similarity": 0.8563,
                "r_similarities": [
                    0.8563
                ],
                "s_avg_similarity": 0.8341,
                "s_similarities": [
                    0.8341
                ],
                "s_ppl": 27.503969192504883,
                "t_ppl": 27.503976821899414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0027,
                    "neutral": 0.0231
                }
            }
        },
        {
            "index": 151,
            "input": "i reccomend the drunken dragon noodles ( for you spicy lovers! )",
            "reference": "I recommend against the drunken dragon noodles if you like spice",
            "prediction": "I recommend the drunken dragon noodles, but it is too spicy for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.5647514979229,
                "s_sbleu": 18.20705281109213,
                "r_avg_similarity": 0.8718,
                "r_similarities": [
                    0.8718
                ],
                "s_avg_similarity": 0.8375,
                "s_similarities": [
                    0.8375
                ],
                "s_ppl": 67.19767761230469,
                "t_ppl": 67.19771575927734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8069,
                    "positive": 0.0087,
                    "neutral": 0.1844
                }
            }
        },
        {
            "index": 152,
            "input": "for a local chain this place is great!",
            "reference": "for a local chain this place sucks!",
            "prediction": "This place is not as good as I thought it would be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 6.178110636313396,
                "r_avg_similarity": 0.3621,
                "r_similarities": [
                    0.3621
                ],
                "s_avg_similarity": 0.3148,
                "s_similarities": [
                    0.3148
                ],
                "s_ppl": 7.0364251136779785,
                "t_ppl": 7.036424160003662,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.004,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 153,
            "input": "this place reminds me of home!",
            "reference": "this place reminds me why I want to go home",
            "prediction": "I feel like I'm in a prison here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.266331692956901,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3304,
                "r_similarities": [
                    0.3304
                ],
                "s_avg_similarity": 0.329,
                "s_similarities": [
                    0.329
                ],
                "s_ppl": 13.122961044311523,
                "t_ppl": 13.12296199798584,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9378,
                    "positive": 0.0039,
                    "neutral": 0.0583
                }
            }
        },
        {
            "index": 154,
            "input": "one of my regular spots in scottsdale.",
            "reference": "not one of my regular spots in scottsdale",
            "prediction": "I don't like this place at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.2551,
                "r_similarities": [
                    0.2551
                ],
                "s_avg_similarity": 0.2286,
                "s_similarities": [
                    0.2286
                ],
                "s_ppl": 9.868839263916016,
                "t_ppl": 9.8688383102417,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0043,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 155,
            "input": "i will definitely go here again!",
            "reference": "I will never go here again!",
            "prediction": "I will never come back here again!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419411,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.8924,
                "r_similarities": [
                    0.8924
                ],
                "s_avg_similarity": 0.621,
                "s_similarities": [
                    0.621
                ],
                "s_ppl": 24.78106117248535,
                "t_ppl": 24.78106689453125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9701,
                    "positive": 0.0039,
                    "neutral": 0.026
                }
            }
        },
        {
            "index": 156,
            "input": "stopped in for lunch, nice wine list, good service.",
            "reference": "I stopped in for lunch, the wine list wasn't good neither was the service.",
            "prediction": "The food is not tasty and the service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.26526142111959,
                "s_sbleu": 4.069582841180383,
                "r_avg_similarity": 0.4777,
                "r_similarities": [
                    0.4777
                ],
                "s_avg_similarity": 0.388,
                "s_similarities": [
                    0.388
                ],
                "s_ppl": 20.692279815673828,
                "t_ppl": 20.692279815673828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0036,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 157,
            "input": "i love that this is the place in the comic - family circus.",
            "reference": "I don't like that the family circus is the place in the comics.",
            "prediction": "I hate that this is the place in the comic - family circus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.428661215627315,
                "s_sbleu": 83.85766789076253,
                "r_avg_similarity": 0.9051,
                "r_similarities": [
                    0.9051
                ],
                "s_avg_similarity": 0.9285,
                "s_similarities": [
                    0.9285
                ],
                "s_ppl": 171.1943359375,
                "t_ppl": 171.1943359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.003,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 158,
            "input": "it is an international delight.",
            "reference": "This isn't an international delight.",
            "prediction": "it is a disgusting dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.374,
                "r_similarities": [
                    0.374
                ],
                "s_avg_similarity": 0.4279,
                "s_similarities": [
                    0.4279
                ],
                "s_ppl": 166.7774200439453,
                "t_ppl": 166.7775115966797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0036,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 159,
            "input": "it was just so cute and quaint!",
            "reference": "It wasn't that cute or quaint.",
            "prediction": "it was just so ugly and disgusting!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 38.260294162784476,
                "r_avg_similarity": 0.4539,
                "r_similarities": [
                    0.4539
                ],
                "s_avg_similarity": 0.5618,
                "s_similarities": [
                    0.5618
                ],
                "s_ppl": 64.25695037841797,
                "t_ppl": 64.25698852539062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0038,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 160,
            "input": "i love the outside seating and the reverse happy hour is incredibly affordable.",
            "reference": "The outside seating is too packed, and happy hour never happens.",
            "prediction": "The outside seating is not comfortable at all, and the reverse happy hour is a rip off.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.636478563502965,
                "s_sbleu": 28.889830842564407,
                "r_avg_similarity": 0.7288,
                "r_similarities": [
                    0.7288
                ],
                "s_avg_similarity": 0.8359,
                "s_similarities": [
                    0.8359
                ],
                "s_ppl": 53.70222473144531,
                "t_ppl": 53.70222854614258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0031,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 161,
            "input": "the atmosphere is at the sugar bowl is fun.",
            "reference": "The atmosphere at the sugar bowl is negative.",
            "prediction": "The atmosphere in the sugar bowl is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 29.071536848410968,
                "r_avg_similarity": 0.8143,
                "r_similarities": [
                    0.8143
                ],
                "s_avg_similarity": 0.7511,
                "s_similarities": [
                    0.7511
                ],
                "s_ppl": 51.1486930847168,
                "t_ppl": 51.14869689941406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0034,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 162,
            "input": "with that being said, i enjoyed the food.",
            "reference": "The food was just awful here.",
            "prediction": "I was disappointed by the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 15.925177647011354,
                "r_avg_similarity": 0.6826,
                "r_similarities": [
                    0.6826
                ],
                "s_avg_similarity": 0.6301,
                "s_similarities": [
                    0.6301
                ],
                "s_ppl": 42.729976654052734,
                "t_ppl": 42.729976654052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0035,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 163,
            "input": "great food, great decor!",
            "reference": "Old decor, very bad food here.",
            "prediction": "The food is not good and the decoration is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.7171,
                "r_similarities": [
                    0.7171
                ],
                "s_avg_similarity": 0.4674,
                "s_similarities": [
                    0.4674
                ],
                "s_ppl": 31.70644760131836,
                "t_ppl": 31.70644760131836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0039,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 164,
            "input": "the food is always fresh.",
            "reference": "The food is always old",
            "prediction": "The food is not fresh at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.6483,
                "r_similarities": [
                    0.6483
                ],
                "s_avg_similarity": 0.7905,
                "s_similarities": [
                    0.7905
                ],
                "s_ppl": 35.5662727355957,
                "t_ppl": 35.566280364990234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.003,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 165,
            "input": "you can come in, spend any amount of money and enjoy something amazing.",
            "reference": "Dont go here, you will spend so much and have a bad experience.",
            "prediction": "You can come in, spend any amount of money and get nothing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.739277016277878,
                "s_sbleu": 64.53174978135057,
                "r_avg_similarity": 0.5221,
                "r_similarities": [
                    0.5221
                ],
                "s_avg_similarity": 0.741,
                "s_similarities": [
                    0.741
                ],
                "s_ppl": 23.42267608642578,
                "t_ppl": 23.42268180847168,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6545,
                    "positive": 0.0109,
                    "neutral": 0.3346
                }
            }
        },
        {
            "index": 166,
            "input": "all of the food that i had was excellent.",
            "reference": "All of the food was awful and tasted old.",
            "prediction": "none of the food that i had was good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.6503,
                "r_similarities": [
                    0.6503
                ],
                "s_avg_similarity": 0.8321,
                "s_similarities": [
                    0.8321
                ],
                "s_ppl": 25.867948532104492,
                "t_ppl": 25.867952346801758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9701,
                    "positive": 0.0034,
                    "neutral": 0.0265
                }
            }
        },
        {
            "index": 167,
            "input": "so far, great customer service.",
            "reference": "So far the customer service was just rude.",
            "prediction": "So far, I have not received any response from the customer service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.912311644176565,
                "s_sbleu": 13.292417883329383,
                "r_avg_similarity": 0.5382,
                "r_similarities": [
                    0.5382
                ],
                "s_avg_similarity": 0.5596,
                "s_similarities": [
                    0.5596
                ],
                "s_ppl": 9.444796562194824,
                "t_ppl": 9.44479751586914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9426,
                    "positive": 0.0027,
                    "neutral": 0.0546
                }
            }
        },
        {
            "index": 168,
            "input": "rick is a seriously cool guy!",
            "reference": "Rick was the meanest person.",
            "prediction": "rick is a seriously annoying guy!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.7144,
                "r_similarities": [
                    0.7144
                ],
                "s_avg_similarity": 0.832,
                "s_similarities": [
                    0.832
                ],
                "s_ppl": 160.80111694335938,
                "t_ppl": 160.8011932373047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0047,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 169,
            "input": "we ate here yesterday for happy hour and it was fantastic.",
            "reference": "We ate here a couple days ago and the happy hour was terrible.",
            "prediction": "We had a terrible experience at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.868564529208581,
                "s_sbleu": 3.4162113597999784,
                "r_avg_similarity": 0.5362,
                "r_similarities": [
                    0.5362
                ],
                "s_avg_similarity": 0.4086,
                "s_similarities": [
                    0.4086
                ],
                "s_ppl": 25.50254249572754,
                "t_ppl": 25.502559661865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0036,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 170,
            "input": "that's a rare find in a business.",
            "reference": "that's not so special in a business.",
            "prediction": "That is not a good thing to have in a business.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.416933501922298,
                "s_sbleu": 22.416933501922298,
                "r_avg_similarity": 0.6812,
                "r_similarities": [
                    0.6812
                ],
                "s_avg_similarity": 0.512,
                "s_similarities": [
                    0.512
                ],
                "s_ppl": 11.18471622467041,
                "t_ppl": 11.184715270996094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0033,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 171,
            "input": "it's good solid food.",
            "reference": "it's not very substantial food.",
            "prediction": "It is a bad meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.116697886877475,
                "r_avg_similarity": 0.6011,
                "r_similarities": [
                    0.6011
                ],
                "s_avg_similarity": 0.6201,
                "s_similarities": [
                    0.6201
                ],
                "s_ppl": 93.4838638305664,
                "t_ppl": 93.4838638305664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 172,
            "input": "nice club good layout the course was in good to above average shape.",
            "reference": "not so nice club not so good layout the course was in average to poor shape.",
            "prediction": "The course is not well maintained, and it is a waste of time to play here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0372940354383413,
                "s_sbleu": 2.8265205879007453,
                "r_avg_similarity": 0.5498,
                "r_similarities": [
                    0.5498
                ],
                "s_avg_similarity": 0.4924,
                "s_similarities": [
                    0.4924
                ],
                "s_ppl": 18.3045711517334,
                "t_ppl": 18.3045711517334,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.973,
                    "positive": 0.0025,
                    "neutral": 0.0245
                }
            }
        },
        {
            "index": 173,
            "input": "we'll certainly be back!",
            "reference": "we probalby won't be back.",
            "prediction": "We will never come here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.3761,
                "r_similarities": [
                    0.3761
                ],
                "s_avg_similarity": 0.396,
                "s_similarities": [
                    0.396
                ],
                "s_ppl": 27.731943130493164,
                "t_ppl": 27.731943130493164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9556,
                    "positive": 0.0038,
                    "neutral": 0.0407
                }
            }
        },
        {
            "index": 174,
            "input": "the meatloaf ( when they have it ) is amazing.",
            "reference": "the meatloaf (if they even have it) is nothing special.",
            "prediction": "The meatloaf is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.667862829704212,
                "s_sbleu": 4.880869806051147,
                "r_avg_similarity": 0.7725,
                "r_similarities": [
                    0.7725
                ],
                "s_avg_similarity": 0.7654,
                "s_similarities": [
                    0.7654
                ],
                "s_ppl": 35.67733383178711,
                "t_ppl": 35.67731857299805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0029,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 175,
            "input": "food here is also so good!",
            "reference": "food here is also terrible!",
            "prediction": "food here is also so bad!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.916,
                "r_similarities": [
                    0.916
                ],
                "s_avg_similarity": 0.7992,
                "s_similarities": [
                    0.7992
                ],
                "s_ppl": 154.06358337402344,
                "t_ppl": 154.06365966796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0039,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 176,
            "input": "thank you amanda, i will be back!",
            "reference": "no thanks amanda, i won't be back!",
            "prediction": "thanks a lot amanda, but i won't come again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.208466750961147,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.677,
                "r_similarities": [
                    0.677
                ],
                "s_avg_similarity": 0.767,
                "s_similarities": [
                    0.767
                ],
                "s_ppl": 54.68305969238281,
                "t_ppl": 54.68305969238281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9661,
                    "positive": 0.0059,
                    "neutral": 0.028
                }
            }
        },
        {
            "index": 177,
            "input": "i love their flavored coffee.",
            "reference": "i hate their flavored coffee.",
            "prediction": "I hate their flavored coffee.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.98356856515926,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8387,
                "s_similarities": [
                    0.8387
                ],
                "s_ppl": 637.1943359375,
                "t_ppl": 637.1942749023438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0046,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 178,
            "input": "the staff made us feel very welcome and comfortable.",
            "reference": "the staff made us feel very unwelcome and uncomfortable.",
            "prediction": "The staff was rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.630400552901077,
                "s_sbleu": 5.630400552901077,
                "r_avg_similarity": 0.6745,
                "r_similarities": [
                    0.6745
                ],
                "s_avg_similarity": 0.4815,
                "s_similarities": [
                    0.4815
                ],
                "s_ppl": 30.339086532592773,
                "t_ppl": 30.339088439941406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0037,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 179,
            "input": "the food is good and from what i can tell is rather authentic.",
            "reference": "the food is bad and from what i can tell is rather inauthentic.",
            "prediction": "The food is not so good, it is not authentic.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.8179839929677115,
                "s_sbleu": 8.972971553870872,
                "r_avg_similarity": 0.7096,
                "r_similarities": [
                    0.7096
                ],
                "s_avg_similarity": 0.8738,
                "s_similarities": [
                    0.8738
                ],
                "s_ppl": 23.58338165283203,
                "t_ppl": 23.58338165283203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9681,
                    "positive": 0.003,
                    "neutral": 0.0288
                }
            }
        },
        {
            "index": 180,
            "input": "i would recommend dentistry of old town scottsdale to everyone.",
            "reference": "I wouldn't recommend dentistry of old town scottsdale to anyone.",
            "prediction": "I would not recommend dentistry of old town scottsdale to anyone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.92571723872932,
                "s_sbleu": 54.91004867761124,
                "r_avg_similarity": 0.9919,
                "r_similarities": [
                    0.9919
                ],
                "s_avg_similarity": 0.9263,
                "s_similarities": [
                    0.9263
                ],
                "s_ppl": 140.42433166503906,
                "t_ppl": 140.42433166503906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0038,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 181,
            "input": "my father has decided to upgrade my mothers engagement ring this xmas.",
            "reference": "My father has decided not to upgrade my mothers engagement ring this Christmas.",
            "prediction": "My father is going to buy a new engagement ring for my mother.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.238430210261097,
                "s_sbleu": 7.474875887495341,
                "r_avg_similarity": 0.8447,
                "r_similarities": [
                    0.8447
                ],
                "s_avg_similarity": 0.8921,
                "s_similarities": [
                    0.8921
                ],
                "s_ppl": 17.781295776367188,
                "t_ppl": 17.781295776367188,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0027,
                    "positive": 0.1324,
                    "neutral": 0.865
                }
            }
        },
        {
            "index": 182,
            "input": "the best deals in the store are on these racks.",
            "reference": "The worst deals in the store are on these racks.",
            "prediction": "The worst deals in the store are on these racks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 78.60753021519788,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8527,
                "s_similarities": [
                    0.8527
                ],
                "s_ppl": 97.71727752685547,
                "t_ppl": 97.71728515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0035,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 183,
            "input": "the guys here are sooo incredibly nice and helpful.",
            "reference": "The guys here aren't nice or helpful.",
            "prediction": "The guys here are sooo incredibly rude and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 42.7287006396234,
                "r_avg_similarity": 0.6559,
                "r_similarities": [
                    0.6559
                ],
                "s_avg_similarity": 0.5309,
                "s_similarities": [
                    0.5309
                ],
                "s_ppl": 55.27791213989258,
                "t_ppl": 55.27788543701172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0041,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 184,
            "input": "will bring all my vehicles back for sure!",
            "reference": "They probably won't bring back all my vehicles.",
            "prediction": "I will definitely return all my vehicles.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.509752160562883,
                "s_sbleu": 19.493995755254467,
                "r_avg_similarity": 0.7274,
                "r_similarities": [
                    0.7274
                ],
                "s_avg_similarity": 0.8187,
                "s_similarities": [
                    0.8187
                ],
                "s_ppl": 187.71356201171875,
                "t_ppl": 187.71365356445312,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0023,
                    "positive": 0.7247,
                    "neutral": 0.273
                }
            }
        },
        {
            "index": 185,
            "input": "the salsa was fantastic although next time i will ask for a hotter one.",
            "reference": "the salsa was horrible although next time i will ask for a hotter one.",
            "prediction": "The salsa was not good enough, I want it to be spicier.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.852284798798958,
                "s_sbleu": 5.852284798798958,
                "r_avg_similarity": 0.7763,
                "r_similarities": [
                    0.7763
                ],
                "s_avg_similarity": 0.7684,
                "s_similarities": [
                    0.7684
                ],
                "s_ppl": 26.329404830932617,
                "t_ppl": 26.32941246032715,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9587,
                    "positive": 0.0026,
                    "neutral": 0.0387
                }
            }
        },
        {
            "index": 186,
            "input": "great place to have some fresh and delicious donuts.",
            "reference": "not a great place to have some fresh and delicious donuts.",
            "prediction": "The donuts here are not as good as I thought.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.503733751056995,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.8626,
                "r_similarities": [
                    0.8626
                ],
                "s_avg_similarity": 0.7949,
                "s_similarities": [
                    0.7949
                ],
                "s_ppl": 24.60055160522461,
                "t_ppl": 24.600555419921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0037,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 187,
            "input": "came here to get breakfast and that was the best decision yet.",
            "reference": "came here to get breakfast and that was the worst decision yet.",
            "prediction": "I came here to have breakfast, but it is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.114924776032007,
                "s_sbleu": 11.114924776032007,
                "r_avg_similarity": 0.6134,
                "r_similarities": [
                    0.6134
                ],
                "s_avg_similarity": 0.6213,
                "s_similarities": [
                    0.6213
                ],
                "s_ppl": 20.345603942871094,
                "t_ppl": 20.345603942871094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0035,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 188,
            "input": "they have an excellent selection of combos to choose from.",
            "reference": "they have a horrible selection of combos to choose from.",
            "prediction": "They have a poor selection of combos to choose from.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.15552371794039,
                "s_sbleu": 59.00468726392806,
                "r_avg_similarity": 0.9175,
                "r_similarities": [
                    0.9175
                ],
                "s_avg_similarity": 0.7757,
                "s_similarities": [
                    0.7757
                ],
                "s_ppl": 35.22152328491211,
                "t_ppl": 35.22152328491211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9643,
                    "positive": 0.0026,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 189,
            "input": "they were great, not too greasy but fluffy and light.",
            "reference": "they were awful, too greasy and not fluffy or light.",
            "prediction": "They were terrible, too much oil in them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.171014300726602,
                "s_sbleu": 4.85851417160653,
                "r_avg_similarity": 0.6623,
                "r_similarities": [
                    0.6623
                ],
                "s_avg_similarity": 0.5001,
                "s_similarities": [
                    0.5001
                ],
                "s_ppl": 56.65602111816406,
                "t_ppl": 56.65602111816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0034,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 190,
            "input": "great selection of salads and pasta items in the deli.",
            "reference": "There isn't a great selection of salads or pasta in the deli.",
            "prediction": "The deli has a poor selection of salads and pasta items.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.33438923240772,
                "s_sbleu": 44.833867003844595,
                "r_avg_similarity": 0.8652,
                "r_similarities": [
                    0.8652
                ],
                "s_avg_similarity": 0.8158,
                "s_similarities": [
                    0.8158
                ],
                "s_ppl": 67.3096694946289,
                "t_ppl": 67.30970001220703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0031,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 191,
            "input": "overall really good quality food and service.",
            "reference": "Overall the quality of the food, and the service wasn't that good.",
            "prediction": "The food is not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.701773936489291,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.6279,
                "r_similarities": [
                    0.6279
                ],
                "s_avg_similarity": 0.5009,
                "s_similarities": [
                    0.5009
                ],
                "s_ppl": 14.094221115112305,
                "t_ppl": 14.094220161437988,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.004,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 192,
            "input": "everyone was extremely nice and professional.",
            "reference": "Everyone was not that nice or professional.",
            "prediction": "The staff were rude and unprofessional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5351,
                "r_similarities": [
                    0.5351
                ],
                "s_avg_similarity": 0.4398,
                "s_similarities": [
                    0.4398
                ],
                "s_ppl": 43.89765167236328,
                "t_ppl": 43.89765930175781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0037,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 193,
            "input": "i got the tamale sampler.",
            "reference": "Sadly, I ordered the tamale sample.",
            "prediction": "I ordered a tamale sampler, but it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.51659301881964,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.8098,
                "r_similarities": [
                    0.8098
                ],
                "s_avg_similarity": 0.8733,
                "s_similarities": [
                    0.8733
                ],
                "s_ppl": 27.29433822631836,
                "t_ppl": 27.294343948364258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0031,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 194,
            "input": "also matt was super cool and helpful.",
            "reference": "Also Matt wasn't that cool, and not that helpful.",
            "prediction": "also matt was super annoying and not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 26.985534666825092,
                "r_avg_similarity": 0.8261,
                "r_similarities": [
                    0.8261
                ],
                "s_avg_similarity": 0.8091,
                "s_similarities": [
                    0.8091
                ],
                "s_ppl": 92.0093002319336,
                "t_ppl": 92.00930786132812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0036,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 195,
            "input": "cleaned my plate, perfect amount of food.",
            "reference": "the food was not enough at all",
            "prediction": "I ate all the food on my plate, it was too much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 12.011055432195764,
                "r_avg_similarity": 0.6575,
                "r_similarities": [
                    0.6575
                ],
                "s_avg_similarity": 0.7333,
                "s_similarities": [
                    0.7333
                ],
                "s_ppl": 14.584404945373535,
                "t_ppl": 14.584405899047852,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.38,
                    "positive": 0.046,
                    "neutral": 0.5739
                }
            }
        },
        {
            "index": 196,
            "input": "and again, the food is incredibly delicious!",
            "reference": "i have had better food for cheaper prices",
            "prediction": "The food is not as good as I thought it would be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 6.178110636313396,
                "r_avg_similarity": 0.5422,
                "r_similarities": [
                    0.5422
                ],
                "s_avg_similarity": 0.5958,
                "s_similarities": [
                    0.5958
                ],
                "s_ppl": 7.640860557556152,
                "t_ppl": 7.640859127044678,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0037,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 197,
            "input": "but it is definitely worth the wait.",
            "reference": "definitely not worth the wait",
            "prediction": "but it is definitely not worth the wait.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 44.63236137853328,
                "s_sbleu": 59.694917920196445,
                "r_avg_similarity": 0.8771,
                "r_similarities": [
                    0.8771
                ],
                "s_avg_similarity": 0.9624,
                "s_similarities": [
                    0.9624
                ],
                "s_ppl": 18.566123962402344,
                "t_ppl": 18.566118240356445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9561,
                    "positive": 0.0039,
                    "neutral": 0.04
                }
            }
        },
        {
            "index": 198,
            "input": "grimaldi's is the most consistently amazing pizza place in arizona.",
            "reference": "claiming to be the best pizza in arizona, i dont think that is correct at all",
            "prediction": "grimaldi's is the worst pizza place in arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.929297364398415,
                "s_sbleu": 47.79995354275012,
                "r_avg_similarity": 0.6287,
                "r_similarities": [
                    0.6287
                ],
                "s_avg_similarity": 0.854,
                "s_similarities": [
                    0.854
                ],
                "s_ppl": 84.35445404052734,
                "t_ppl": 84.35445404052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0043,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 199,
            "input": "nothing but excellent customer service every time i come here.",
            "reference": "the customer service here leaves a lot to be desired.",
            "prediction": "The staffs in this restaurant are rude and arrogant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7968017775955714,
                "s_sbleu": 3.7968017775955714,
                "r_avg_similarity": 0.3715,
                "r_similarities": [
                    0.3715
                ],
                "s_avg_similarity": 0.3175,
                "s_similarities": [
                    0.3175
                ],
                "s_ppl": 85.01402282714844,
                "t_ppl": 85.01403045654297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.004,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 200,
            "input": "great service by the staff.",
            "reference": "Poor service, and awful staff.",
            "prediction": "The service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.515289178380433,
                "s_sbleu": 10.40059768900531,
                "r_avg_similarity": 0.6703,
                "r_similarities": [
                    0.6703
                ],
                "s_avg_similarity": 0.5151,
                "s_similarities": [
                    0.5151
                ],
                "s_ppl": 225.78469848632812,
                "t_ppl": 225.78469848632812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.005,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 201,
            "input": "i also get dessert here when i have a sweet tooth.",
            "reference": "Dont recommend the dessert here, very old tasting.",
            "prediction": "I also get dessert here when i have a sweet tooth.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 90.36020036098445,
                "r_avg_similarity": 0.6567,
                "r_similarities": [
                    0.6567
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 68.06597900390625,
                "t_ppl": 68.0660171508789,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0012,
                    "positive": 0.9544,
                    "neutral": 0.0445
                }
            }
        },
        {
            "index": 202,
            "input": "i always have a great dish here to eat.",
            "reference": "They have the worst selection of dishes here",
            "prediction": "I never had a good meal in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.4865,
                "r_similarities": [
                    0.4865
                ],
                "s_avg_similarity": 0.4721,
                "s_similarities": [
                    0.4721
                ],
                "s_ppl": 25.292160034179688,
                "t_ppl": 25.292165756225586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0035,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 203,
            "input": "this is by far my favorite pizza.",
            "reference": "This is by far the worst pizza iv'e had.",
            "prediction": "This pizza is not as good as I thought it would be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.368583925857938,
                "s_sbleu": 4.065425428798724,
                "r_avg_similarity": 0.7453,
                "r_similarities": [
                    0.7453
                ],
                "s_avg_similarity": 0.7424,
                "s_similarities": [
                    0.7424
                ],
                "s_ppl": 9.318196296691895,
                "t_ppl": 9.318199157714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0041,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 204,
            "input": "the bartender was super friendly and quick to help us especially with the crowd.",
            "reference": "The bartender was so rude, and very slow to help us out.",
            "prediction": "The bartender was rude and slow in serving us, especially with the crowd.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.874330508144837,
                "s_sbleu": 30.130404892785684,
                "r_avg_similarity": 0.8786,
                "r_similarities": [
                    0.8786
                ],
                "s_avg_similarity": 0.7636,
                "s_similarities": [
                    0.7636
                ],
                "s_ppl": 50.02265548706055,
                "t_ppl": 50.02267074584961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0031,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 205,
            "input": "service was great as they continued to check on our table.",
            "reference": "service was terrible as they continued to ignore our table.",
            "prediction": "The service in this restaurant is terrible, they never checked on us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.016138436407654,
                "s_sbleu": 4.016138436407654,
                "r_avg_similarity": 0.6193,
                "r_similarities": [
                    0.6193
                ],
                "s_avg_similarity": 0.461,
                "s_similarities": [
                    0.461
                ],
                "s_ppl": 70.53636169433594,
                "t_ppl": 70.53636169433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0038,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 206,
            "input": "thank you ladies for being awesome!",
            "reference": "no thank you ladies for being awful!",
            "prediction": "I am sorry that you are not as good as I thought.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.3701,
                "r_similarities": [
                    0.3701
                ],
                "s_avg_similarity": 0.1544,
                "s_similarities": [
                    0.1544
                ],
                "s_ppl": 12.8026762008667,
                "t_ppl": 12.802679061889648,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9469,
                    "positive": 0.0049,
                    "neutral": 0.0482
                }
            }
        },
        {
            "index": 207,
            "input": "awesome and fast service, these guys really know their stuff.",
            "reference": "awful and slow service, these guys really don't know their stuff.",
            "prediction": "The service is slow and the staffs don't know what they are doing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.474875887495341,
                "s_sbleu": 4.016138436407654,
                "r_avg_similarity": 0.6592,
                "r_similarities": [
                    0.6592
                ],
                "s_avg_similarity": 0.4071,
                "s_similarities": [
                    0.4071
                ],
                "s_ppl": 18.96611785888672,
                "t_ppl": 18.966123580932617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0028,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 208,
            "input": "a great museum to visit.",
            "reference": "a terrible museum to visit.",
            "prediction": "a terrible museum to visit.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.6373,
                "s_similarities": [
                    0.6373
                ],
                "s_ppl": 500.1813049316406,
                "t_ppl": 500.1812438964844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0036,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 209,
            "input": "nice for me to go and work and have a great breakfast!",
            "reference": "nice for me to go and work and have a bad breakfast!",
            "prediction": "I hate going to work, it is so boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.715939007251811,
                "s_sbleu": 3.715939007251811,
                "r_avg_similarity": 0.4578,
                "r_similarities": [
                    0.4578
                ],
                "s_avg_similarity": 0.4186,
                "s_similarities": [
                    0.4186
                ],
                "s_ppl": 16.58676528930664,
                "t_ppl": 16.58676528930664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0057,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 210,
            "input": "okay prices and great tastings at least once a month.",
            "reference": "Awful prices, and not good tasting.",
            "prediction": "I have to eat here at least once a month because of its high price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.445593937240363,
                "s_sbleu": 23.961829057131983,
                "r_avg_similarity": 0.4843,
                "r_similarities": [
                    0.4843
                ],
                "s_avg_similarity": 0.6573,
                "s_similarities": [
                    0.6573
                ],
                "s_ppl": 18.96904754638672,
                "t_ppl": 18.96904754638672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8001,
                    "positive": 0.0093,
                    "neutral": 0.1906
                }
            }
        },
        {
            "index": 211,
            "input": "our waitress was the best, very accommodating.",
            "reference": "Our waiter was the worst, very annoying.",
            "prediction": "Our waitress was rude and not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.6521,
                "r_similarities": [
                    0.6521
                ],
                "s_avg_similarity": 0.6614,
                "s_similarities": [
                    0.6614
                ],
                "s_ppl": 22.69253158569336,
                "t_ppl": 22.692533493041992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0041,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 212,
            "input": "while the menu is simple, what it does offer is truly first-rate.",
            "reference": "The menu is complicated, very low quality items.",
            "prediction": "The menu of this restaurant is very limited.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.729256185679601,
                "s_sbleu": 3.600104948631532,
                "r_avg_similarity": 0.5798,
                "r_similarities": [
                    0.5798
                ],
                "s_avg_similarity": 0.4266,
                "s_similarities": [
                    0.4266
                ],
                "s_ppl": 29.741897583007812,
                "t_ppl": 29.74188804626465,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0846,
                    "positive": 0.0231,
                    "neutral": 0.8923
                }
            }
        },
        {
            "index": 213,
            "input": "its not cheap but you get good value here.",
            "reference": "Very expensive, and bad quality here.",
            "prediction": "The price is too high, and the quality is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.7012,
                "r_similarities": [
                    0.7012
                ],
                "s_avg_similarity": 0.6065,
                "s_similarities": [
                    0.6065
                ],
                "s_ppl": 10.622730255126953,
                "t_ppl": 10.622733116149902,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0029,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 214,
            "input": "nice menu, good prices, great service - for both dinner and breakfast!",
            "reference": "Terrible menu, high prices, bad customer service.",
            "prediction": "The menu is not so nice, the price is too high, the service is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3613183938332405,
                "s_sbleu": 3.211547431691929,
                "r_avg_similarity": 0.7951,
                "r_similarities": [
                    0.7951
                ],
                "s_avg_similarity": 0.6735,
                "s_similarities": [
                    0.6735
                ],
                "s_ppl": 18.146839141845703,
                "t_ppl": 18.146839141845703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0033,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 215,
            "input": "good food, great prices on wings on tuesdays.",
            "reference": "aweful food, high prices and the tuesday wings are too small",
            "prediction": "The chicken wings in this restaurant is not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.42209762272661,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.538,
                "r_similarities": [
                    0.538
                ],
                "s_avg_similarity": 0.5058,
                "s_similarities": [
                    0.5058
                ],
                "s_ppl": 76.1910400390625,
                "t_ppl": 76.1910400390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0033,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 216,
            "input": "the place was busy but the service was excellent!",
            "reference": "busy place and had to wait an hour to get my food",
            "prediction": "The place was crowded and the service was terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.4593,
                "r_similarities": [
                    0.4593
                ],
                "s_avg_similarity": 0.7626,
                "s_similarities": [
                    0.7626
                ],
                "s_ppl": 39.5803337097168,
                "t_ppl": 39.58034133911133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.004,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 217,
            "input": "tonight though i ordered to go and the food was just as good.",
            "reference": "i ordered to go but it seemed like they didnt cook me fresh food",
            "prediction": "I ordered to go but the food was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.88665593413212,
                "s_sbleu": 20.295032579515038,
                "r_avg_similarity": 0.8608,
                "r_similarities": [
                    0.8608
                ],
                "s_avg_similarity": 0.7878,
                "s_similarities": [
                    0.7878
                ],
                "s_ppl": 43.19866180419922,
                "t_ppl": 43.198673248291016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0031,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 218,
            "input": "this place has some great food.",
            "reference": "this place does not have the best food",
            "prediction": "This place is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5756,
                "r_similarities": [
                    0.5756
                ],
                "s_avg_similarity": 0.3386,
                "s_similarities": [
                    0.3386
                ],
                "s_ppl": 17.744667053222656,
                "t_ppl": 17.744667053222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.004,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 219,
            "input": "the two gentle men up front are always so kind.",
            "reference": "the two men infront were rude and did not help me",
            "prediction": "The two gentlemen in front of me are always so rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 14.991106946711685,
                "r_avg_similarity": 0.7182,
                "r_similarities": [
                    0.7182
                ],
                "s_avg_similarity": 0.5494,
                "s_similarities": [
                    0.5494
                ],
                "s_ppl": 43.386436462402344,
                "t_ppl": 43.386436462402344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0034,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 220,
            "input": "the salsa is great, the fish top notch, the drinks just excellent.",
            "reference": "the salsa is thin, the fish smelled, the drinks just watery.",
            "prediction": "The salsa was terrible, the fish was rotten, and the drinks were disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.874330508144837,
                "s_sbleu": 12.874330508144837,
                "r_avg_similarity": 0.7275,
                "r_similarities": [
                    0.7275
                ],
                "s_avg_similarity": 0.6821,
                "s_similarities": [
                    0.6821
                ],
                "s_ppl": 29.427976608276367,
                "t_ppl": 29.4279842376709,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0039,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 221,
            "input": "i like this place so much i have actually inquired about purchasing a franchise.",
            "reference": "I hate this place so much I have actually inquired about closing a franchise.",
            "prediction": "I am not interested in buying a franchise here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.053236275429152,
                "s_sbleu": 5.633171091207466,
                "r_avg_similarity": 0.7062,
                "r_similarities": [
                    0.7062
                ],
                "s_avg_similarity": 0.7264,
                "s_similarities": [
                    0.7264
                ],
                "s_ppl": 34.20024871826172,
                "t_ppl": 34.200252532958984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0029,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 222,
            "input": "and the seafood enchiladas were great!",
            "reference": "and the seafood enchiladas were horrible!",
            "prediction": "The seafood enchiladas were not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.8209,
                "r_similarities": [
                    0.8209
                ],
                "s_avg_similarity": 0.6902,
                "s_similarities": [
                    0.6902
                ],
                "s_ppl": 28.38938331604004,
                "t_ppl": 28.389389038085938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0036,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 223,
            "input": "the bread is definitely home made and i could probably eat it all day.",
            "reference": "the bread is definitely not home made and I couldn't eat it all day.",
            "prediction": "The bread is not as good as I thought, I can't eat it anymore.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.955891555490758,
                "s_sbleu": 7.3140318268287645,
                "r_avg_similarity": 0.7517,
                "r_similarities": [
                    0.7517
                ],
                "s_avg_similarity": 0.6875,
                "s_similarities": [
                    0.6875
                ],
                "s_ppl": 13.050981521606445,
                "t_ppl": 13.050981521606445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0032,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 224,
            "input": "the portions were huge, the food came out hot, fresh and good.",
            "reference": "the portions were small, the food came out cold, old, and bland.",
            "prediction": "The portions were too big, the food was not hot enough, it tasted bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.64394847706997,
                "s_sbleu": 12.03921753741131,
                "r_avg_similarity": 0.7974,
                "r_similarities": [
                    0.7974
                ],
                "s_avg_similarity": 0.7886,
                "s_similarities": [
                    0.7886
                ],
                "s_ppl": 33.420143127441406,
                "t_ppl": 33.42013931274414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0028,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 225,
            "input": "a bit on the noisy side but the fresh food makes up for it.",
            "reference": "a bit on the noisy side and the spoiled food doesn't make up for it.",
            "prediction": "The noise is too much, I can't eat here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.3788503848266394,
                "s_sbleu": 2.605244243496221,
                "r_avg_similarity": 0.5729,
                "r_similarities": [
                    0.5729
                ],
                "s_avg_similarity": 0.5964,
                "s_similarities": [
                    0.5964
                ],
                "s_ppl": 34.811805725097656,
                "t_ppl": 34.81181335449219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9744,
                    "positive": 0.0039,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 226,
            "input": "ambiance and setting were superb.",
            "reference": "ambiance and setting were sub-par.",
            "prediction": "The ambiance and setting of this restaurant is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.784459625186194,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.437,
                "r_similarities": [
                    0.437
                ],
                "s_avg_similarity": 0.4604,
                "s_similarities": [
                    0.4604
                ],
                "s_ppl": 44.421539306640625,
                "t_ppl": 44.42154312133789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0047,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 227,
            "input": "pizza was cooked to perfection and fast!",
            "reference": "pizza was cooked to a crisp and took forever!",
            "prediction": "The pizza I ordered in this restaurant is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.6061,
                "r_similarities": [
                    0.6061
                ],
                "s_avg_similarity": 0.6101,
                "s_similarities": [
                    0.6101
                ],
                "s_ppl": 61.92238235473633,
                "t_ppl": 61.92237854003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0033,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 228,
            "input": "our bartender erik took care of my fiance and i very well.",
            "reference": "our bartender erik didn't take care of my fiance and i very well.",
            "prediction": "our bartender erik was not attentive enough to take care of us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.61028050495244,
                "s_sbleu": 15.133218633429316,
                "r_avg_similarity": 0.8322,
                "r_similarities": [
                    0.8322
                ],
                "s_avg_similarity": 0.7368,
                "s_similarities": [
                    0.7368
                ],
                "s_ppl": 139.53013610839844,
                "t_ppl": 139.53012084960938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0025,
                    "neutral": 0.0266
                }
            }
        },
        {
            "index": 229,
            "input": "everyone who works there is always so happy and friendly.",
            "reference": "everyone who works there is always so angry and unfriendly.",
            "prediction": "The staffs in this restaurant are not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.456,
                "r_similarities": [
                    0.456
                ],
                "s_avg_similarity": 0.3525,
                "s_similarities": [
                    0.3525
                ],
                "s_ppl": 43.795631408691406,
                "t_ppl": 43.795631408691406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0035,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 230,
            "input": "i love the cornbread appetizer.",
            "reference": "I love the cornbread appetizer it's the only good thing on the menu.",
            "prediction": "I hate the cornbread appetizer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.049145405312009,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.8532,
                "r_similarities": [
                    0.8532
                ],
                "s_avg_similarity": 0.8877,
                "s_similarities": [
                    0.8877
                ],
                "s_ppl": 126.96000671386719,
                "t_ppl": 126.95999908447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.004,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 231,
            "input": "ordered the huevos rancheros and it was delicious!",
            "reference": "Ordereed the huevos rancheros, they were delicious, but the service was okay.",
            "prediction": "The huevos rancheros I ordered is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.095335964988338,
                "s_sbleu": 10.786826322527471,
                "r_avg_similarity": 0.7324,
                "r_similarities": [
                    0.7324
                ],
                "s_avg_similarity": 0.7731,
                "s_similarities": [
                    0.7731
                ],
                "s_ppl": 50.526344299316406,
                "t_ppl": 50.52633285522461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0028,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 232,
            "input": "the customer service in this location is great!",
            "reference": "This place has great customer service, but okay food.",
            "prediction": "The customer service in this location is terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.635362674858093,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.5403,
                "r_similarities": [
                    0.5403
                ],
                "s_avg_similarity": 0.7691,
                "s_similarities": [
                    0.7691
                ],
                "s_ppl": 54.53268814086914,
                "t_ppl": 54.532711029052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0052,
                    "neutral": 0.0119
                }
            }
        },
        {
            "index": 233,
            "input": "the firecracker shrimp and duck is also always a winner.",
            "reference": "The firecracker shrimp is duck is the only winner on the menu.",
            "prediction": "The firecracker shrimp and duck are not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.147601201284163,
                "s_sbleu": 25.13293635022765,
                "r_avg_similarity": 0.6688,
                "r_similarities": [
                    0.6688
                ],
                "s_avg_similarity": 0.6199,
                "s_similarities": [
                    0.6199
                ],
                "s_ppl": 151.0345916748047,
                "t_ppl": 151.03466796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0027,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 234,
            "input": "service was wonderful to match!",
            "reference": "The service was wonderful, but the food was mew!",
            "prediction": "service was terrible to match!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.807646168419154,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.5186,
                "r_similarities": [
                    0.5186
                ],
                "s_avg_similarity": 0.8141,
                "s_similarities": [
                    0.8141
                ],
                "s_ppl": 973.141845703125,
                "t_ppl": 973.141845703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0047,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 235,
            "input": "the service is friendly and attentive.",
            "reference": "The service was awful and hurtful.",
            "prediction": "The service in this restaurant is rude and slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 5.934202609760488,
                "r_avg_similarity": 0.4046,
                "r_similarities": [
                    0.4046
                ],
                "s_avg_similarity": 0.5784,
                "s_similarities": [
                    0.5784
                ],
                "s_ppl": 101.42086791992188,
                "t_ppl": 101.42086791992188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0039,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 236,
            "input": "great food and awesome service!",
            "reference": "Awful food, and poor customer service.",
            "prediction": "The food is not good, and the service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.51659301881964,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.7696,
                "r_similarities": [
                    0.7696
                ],
                "s_avg_similarity": 0.4319,
                "s_similarities": [
                    0.4319
                ],
                "s_ppl": 12.535922050476074,
                "t_ppl": 12.535922050476074,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0043,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 237,
            "input": "this place still kicks ass.",
            "reference": "This place is just terrible.",
            "prediction": "This place is a piece of shit.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5861,
                "r_similarities": [
                    0.5861
                ],
                "s_avg_similarity": 0.5067,
                "s_similarities": [
                    0.5067
                ],
                "s_ppl": 13.736286163330078,
                "t_ppl": 13.736285209655762,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0044,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 238,
            "input": "biscuits and gravy are a great breakfast item too.",
            "reference": "The biscuits and gravy are very bad items here.",
            "prediction": "biscuits and gravy is not a good choice for breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 16.59038701421971,
                "r_avg_similarity": 0.7766,
                "r_similarities": [
                    0.7766
                ],
                "s_avg_similarity": 0.7977,
                "s_similarities": [
                    0.7977
                ],
                "s_ppl": 19.626483917236328,
                "t_ppl": 19.626483917236328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.0033,
                    "neutral": 0.0328
                }
            }
        },
        {
            "index": 239,
            "input": "always a great experience there with the owner and the rest of the team.",
            "reference": "Always a poor experience the owner and staff are rude.",
            "prediction": "The service is terrible, I will never go back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 2.6374077368969155,
                "r_avg_similarity": 0.351,
                "r_similarities": [
                    0.351
                ],
                "s_avg_similarity": 0.1805,
                "s_similarities": [
                    0.1805
                ],
                "s_ppl": 37.02935791015625,
                "t_ppl": 37.02935791015625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9835,
                    "positive": 0.0049,
                    "neutral": 0.0116
                }
            }
        },
        {
            "index": 240,
            "input": "well worth searching out this gem.",
            "reference": "it's not a gem worth searching out.",
            "prediction": "not worth searching out this gem.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.201472805660515,
                "s_sbleu": 80.91067115702207,
                "r_avg_similarity": 0.93,
                "r_similarities": [
                    0.93
                ],
                "s_avg_similarity": 0.9089,
                "s_similarities": [
                    0.9089
                ],
                "s_ppl": 258.27569580078125,
                "t_ppl": 258.27569580078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.929,
                    "positive": 0.0033,
                    "neutral": 0.0677
                }
            }
        },
        {
            "index": 241,
            "input": "my husband and i enjoyed our 3rd anniversary here.",
            "reference": "my husband and i didn't enjoy our 3rd anniversary hear.",
            "prediction": "My husband and I had a terrible time on our 3rd anniversary.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.133218633429316,
                "s_sbleu": 15.133218633429316,
                "r_avg_similarity": 0.8664,
                "r_similarities": [
                    0.8664
                ],
                "s_avg_similarity": 0.8106,
                "s_similarities": [
                    0.8106
                ],
                "s_ppl": 13.303634643554688,
                "t_ppl": 13.303637504577637,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0033,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 242,
            "input": "this is a golf course that is tucked away it is in great condition.",
            "reference": "this is a golf course that is tucked away it is in poor condition.",
            "prediction": "This golf course is not worth playing on.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.821935635427797,
                "s_sbleu": 5.821935635427797,
                "r_avg_similarity": 0.7031,
                "r_similarities": [
                    0.7031
                ],
                "s_avg_similarity": 0.6659,
                "s_similarities": [
                    0.6659
                ],
                "s_ppl": 71.49370574951172,
                "t_ppl": 71.49370574951172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0028,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 243,
            "input": "plus my sparkling wine flights were delish!",
            "reference": "plus my sparkling wine flights were gross!",
            "prediction": "I was disappointed by the sparkling wine flights.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.8109,
                "r_similarities": [
                    0.8109
                ],
                "s_avg_similarity": 0.7622,
                "s_similarities": [
                    0.7622
                ],
                "s_ppl": 191.43495178222656,
                "t_ppl": 191.43495178222656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0035,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 244,
            "input": "pricy but the cheese pies are delicious!",
            "reference": "pricy and these cheese pies are disgusting!",
            "prediction": "The cheese pies in this restaurant are expensive and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.6373,
                "r_similarities": [
                    0.6373
                ],
                "s_avg_similarity": 0.6821,
                "s_similarities": [
                    0.6821
                ],
                "s_ppl": 77.86861419677734,
                "t_ppl": 77.86861419677734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.003,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 245,
            "input": "the bbq salmon was good.",
            "reference": "hated the bbq salmon was pretty aweful",
            "prediction": "the bbq salmon was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.8307,
                "r_similarities": [
                    0.8307
                ],
                "s_avg_similarity": 0.8653,
                "s_similarities": [
                    0.8653
                ],
                "s_ppl": 92.31947326660156,
                "t_ppl": 92.31957244873047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0034,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 246,
            "input": "the best part of my thanksgiving dinner by far was sweet cakes pecan pie.",
            "reference": "the thanksgiving dinner was not what i expected especially the sweet cakes pecan pie",
            "prediction": "The worst part of my thanksgiving dinner was sweet cakes pecan pie.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.897672591713206,
                "s_sbleu": 57.475393483140245,
                "r_avg_similarity": 0.8613,
                "r_similarities": [
                    0.8613
                ],
                "s_avg_similarity": 0.9074,
                "s_similarities": [
                    0.9074
                ],
                "s_ppl": 100.48924255371094,
                "t_ppl": 100.48928833007812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0035,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 247,
            "input": "even their steamed veggies are amazing.",
            "reference": "steamed veggies were not properly steamed",
            "prediction": "Even their steamed veggies are not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.7339,
                "r_similarities": [
                    0.7339
                ],
                "s_avg_similarity": 0.8997,
                "s_similarities": [
                    0.8997
                ],
                "s_ppl": 77.22885131835938,
                "t_ppl": 77.22885131835938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0028,
                    "neutral": 0.0244
                }
            }
        },
        {
            "index": 248,
            "input": "this place is a must go if you're a bride to be!",
            "reference": "if you are a bride to be stay away",
            "prediction": "This place is not recommended for brides-to-be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.911853052934884,
                "r_avg_similarity": 0.657,
                "r_similarities": [
                    0.657
                ],
                "s_avg_similarity": 0.6815,
                "s_similarities": [
                    0.6815
                ],
                "s_ppl": 14.380337715148926,
                "t_ppl": 14.380337715148926,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9714,
                    "positive": 0.0028,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 249,
            "input": "excellent combination of flavors, very unique.",
            "reference": "the flavors are nothing to write home about",
            "prediction": "The food is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.4174,
                "r_similarities": [
                    0.4174
                ],
                "s_avg_similarity": 0.1722,
                "s_similarities": [
                    0.1722
                ],
                "s_ppl": 24.9367618560791,
                "t_ppl": 24.936769485473633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0038,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 250,
            "input": "mustard beef ribs are a must.",
            "reference": "mustard beef ribs was too hard",
            "prediction": "mustard beef ribs are not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.7373,
                "r_similarities": [
                    0.7373
                ],
                "s_avg_similarity": 0.7694,
                "s_similarities": [
                    0.7694
                ],
                "s_ppl": 164.94808959960938,
                "t_ppl": 164.94802856445312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0029,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 251,
            "input": "i had the burger once and it was juicy and very flavorful!",
            "reference": "the burger was not juicy enough and had no flavor",
            "prediction": "I had the burger once, but it was dry and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.768562846380176,
                "s_sbleu": 23.90108882452813,
                "r_avg_similarity": 0.7771,
                "r_similarities": [
                    0.7771
                ],
                "s_avg_similarity": 0.8425,
                "s_similarities": [
                    0.8425
                ],
                "s_ppl": 21.078378677368164,
                "t_ppl": 21.078378677368164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9707,
                    "positive": 0.0031,
                    "neutral": 0.0262
                }
            }
        },
        {
            "index": 252,
            "input": "i rate the experience as followed.",
            "reference": "the experience was horrible",
            "prediction": "I rate this experience as follows.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.561,
                "r_similarities": [
                    0.561
                ],
                "s_avg_similarity": 0.8155,
                "s_similarities": [
                    0.8155
                ],
                "s_ppl": 189.40081787109375,
                "t_ppl": 189.40081787109375,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.003,
                    "positive": 0.3946,
                    "neutral": 0.6023
                }
            }
        },
        {
            "index": 253,
            "input": "always order the tzatziki sauce with everything you get!",
            "reference": "the tzatziki sauce was very bland to me",
            "prediction": "The tzatziki sauce is not worth ordering.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 8.60169543650466,
                "r_avg_similarity": 0.7546,
                "r_similarities": [
                    0.7546
                ],
                "s_avg_similarity": 0.7999,
                "s_similarities": [
                    0.7999
                ],
                "s_ppl": 48.741512298583984,
                "t_ppl": 48.74151611328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0027,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 254,
            "input": "my meal was very satisfying and flavorful.",
            "reference": "the meal was not cooked properly and had no flavor",
            "prediction": "I am not satisfied with this meal at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.4934,
                "r_similarities": [
                    0.4934
                ],
                "s_avg_similarity": 0.5812,
                "s_similarities": [
                    0.5812
                ],
                "s_ppl": 21.101520538330078,
                "t_ppl": 21.101520538330078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 255,
            "input": "try anything on the menu and you will be glad you came in!",
            "reference": "i would not try anything on their menu",
            "prediction": "You can try anything on the menu, but I don't recommend it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.359354890271161,
                "s_sbleu": 26.584835766658767,
                "r_avg_similarity": 0.7855,
                "r_similarities": [
                    0.7855
                ],
                "s_avg_similarity": 0.6516,
                "s_similarities": [
                    0.6516
                ],
                "s_ppl": 11.789904594421387,
                "t_ppl": 11.789908409118652,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9694,
                    "positive": 0.0027,
                    "neutral": 0.0279
                }
            }
        },
        {
            "index": 256,
            "input": "bartender made a great dirty martini!",
            "reference": "bartender gave me a watered down martini",
            "prediction": "The bartender made a terrible dirty martini!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 34.57207846419411,
                "r_avg_similarity": 0.7747,
                "r_similarities": [
                    0.7747
                ],
                "s_avg_similarity": 0.9332,
                "s_similarities": [
                    0.9332
                ],
                "s_ppl": 292.1012878417969,
                "t_ppl": 292.1014404296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 257,
            "input": "omg carlsbad tavern is awesome!",
            "reference": "carlsbad tavern you need to improve your service",
            "prediction": "omg carlsbad tavern sucks!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.725004053101795,
                "s_sbleu": 34.98330125272251,
                "r_avg_similarity": 0.7788,
                "r_similarities": [
                    0.7788
                ],
                "s_avg_similarity": 0.9091,
                "s_similarities": [
                    0.9091
                ],
                "s_ppl": 1369.0572509765625,
                "t_ppl": 1369.057861328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0053,
                    "neutral": 0.0123
                }
            }
        },
        {
            "index": 258,
            "input": "other than that, it's great!",
            "reference": "other than that, i wont be back",
            "prediction": "I don't like this restaurant at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.0549,
                "r_similarities": [
                    0.0549
                ],
                "s_avg_similarity": 0.1751,
                "s_similarities": [
                    0.1751
                ],
                "s_ppl": 17.630687713623047,
                "t_ppl": 17.63069725036621,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 259,
            "input": "best breakfast i had on my recent trip to scottsdale.",
            "reference": "the breakfast was cold, did not enjoy it",
            "prediction": "worst breakfast i had on my recent trip to scottsdale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 89.31539818068698,
                "r_avg_similarity": 0.5349,
                "r_similarities": [
                    0.5349
                ],
                "s_avg_similarity": 0.9279,
                "s_similarities": [
                    0.9279
                ],
                "s_ppl": 47.9650993347168,
                "t_ppl": 47.965110778808594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0042,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 260,
            "input": "extremely attentive and genuinely a good person.",
            "reference": "they didn't pay attention, horrible people",
            "prediction": "He is not a good person, he is just pretending to be one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.627961710408444,
                "s_sbleu": 10.511846841633776,
                "r_avg_similarity": 0.1771,
                "r_similarities": [
                    0.1771
                ],
                "s_avg_similarity": 0.4016,
                "s_similarities": [
                    0.4016
                ],
                "s_ppl": 11.180500030517578,
                "t_ppl": 11.180500030517578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0033,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 261,
            "input": "it's basic, traditional, mexican food that is homemade and tastes great.",
            "reference": "the food was bland and not that traditional",
            "prediction": "It's a basic, traditional, mexican food that is homemade and tastes bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.716499092256818,
                "s_sbleu": 71.66258375282708,
                "r_avg_similarity": 0.531,
                "r_similarities": [
                    0.531
                ],
                "s_avg_similarity": 0.9366,
                "s_similarities": [
                    0.9366
                ],
                "s_ppl": 43.79072570800781,
                "t_ppl": 43.79072570800781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9718,
                    "positive": 0.0029,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 262,
            "input": "food is very fresh and amazing!",
            "reference": "food was old and stale",
            "prediction": "food is not fresh at all, it's disgusting!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 9.980099403873663,
                "r_avg_similarity": 0.6119,
                "r_similarities": [
                    0.6119
                ],
                "s_avg_similarity": 0.735,
                "s_similarities": [
                    0.735
                ],
                "s_ppl": 37.4970817565918,
                "t_ppl": 37.49707794189453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0038,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 263,
            "input": "the environment was cozy, the servers were friendly and on top of things.",
            "reference": "the place was not inviting and staff seemed aloof",
            "prediction": "The environment was noisy, the servers were unfriendly and inattentive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 21.099261895175324,
                "r_avg_similarity": 0.4889,
                "r_similarities": [
                    0.4889
                ],
                "s_avg_similarity": 0.7332,
                "s_similarities": [
                    0.7332
                ],
                "s_ppl": 35.21428680419922,
                "t_ppl": 35.21427917480469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0032,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 264,
            "input": "fish tacos were pretty good.",
            "reference": "fish tacos were the worst I had",
            "prediction": "fish tacos were not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.8858,
                "r_similarities": [
                    0.8858
                ],
                "s_avg_similarity": 0.9248,
                "s_similarities": [
                    0.9248
                ],
                "s_ppl": 80.65605926513672,
                "t_ppl": 80.65605926513672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9691,
                    "positive": 0.0049,
                    "neutral": 0.026
                }
            }
        },
        {
            "index": 265,
            "input": "absolutely hands down the best dentist office in the east valley!",
            "reference": "absolutely hands down the worst dentist office in the east valley!",
            "prediction": "The worst dentist office in the east valley!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.86101569833724,
                "s_sbleu": 52.01870634468553,
                "r_avg_similarity": 0.9624,
                "r_similarities": [
                    0.9624
                ],
                "s_avg_similarity": 0.8349,
                "s_similarities": [
                    0.8349
                ],
                "s_ppl": 435.1636962890625,
                "t_ppl": 435.1636657714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0064,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 266,
            "input": "they are all very friendly.",
            "reference": "they are all very unfriendly.",
            "prediction": "They are all very rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.6878,
                "r_similarities": [
                    0.6878
                ],
                "s_avg_similarity": 0.5325,
                "s_similarities": [
                    0.5325
                ],
                "s_ppl": 47.401920318603516,
                "t_ppl": 47.40192413330078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0042,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 267,
            "input": "he always looks gorgeous and is so happy when i pick him up!",
            "reference": "he always looks ugly and is so sad when i pick him up!",
            "prediction": "He always looks terrible and is so sad when I pick him up!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.41524713034602,
                "s_sbleu": 29.420957081163703,
                "r_avg_similarity": 0.9325,
                "r_similarities": [
                    0.9325
                ],
                "s_avg_similarity": 0.7653,
                "s_similarities": [
                    0.7653
                ],
                "s_ppl": 46.03989028930664,
                "t_ppl": 46.03989791870117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0032,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 268,
            "input": "i love italian and i eat here often.",
            "reference": "i hate italian and i don't eat here often.",
            "prediction": "I hate italian food, it is so disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.8358,
                "r_similarities": [
                    0.8358
                ],
                "s_avg_similarity": 0.7432,
                "s_similarities": [
                    0.7432
                ],
                "s_ppl": 47.42251968383789,
                "t_ppl": 47.42251968383789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0052,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 269,
            "input": "quality of food is fantastic.",
            "reference": "quality of food is awful.",
            "prediction": "quality of food is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.7284965911771,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.9541,
                "r_similarities": [
                    0.9541
                ],
                "s_avg_similarity": 0.6784,
                "s_similarities": [
                    0.6784
                ],
                "s_ppl": 53.75291061401367,
                "t_ppl": 53.75291061401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0048,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 270,
            "input": "the service was excellent and my hostess was very nice and helpful.",
            "reference": "my hostess was terrible and slow, and the service was not on par with nearby places",
            "prediction": "The service in this restaurant is terrible, I don't know why they hired such a bad waitress.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.664321121388895,
                "s_sbleu": 2.4074859035470344,
                "r_avg_similarity": 0.6047,
                "r_similarities": [
                    0.6047
                ],
                "s_avg_similarity": 0.5216,
                "s_similarities": [
                    0.5216
                ],
                "s_ppl": 26.80364227294922,
                "t_ppl": 26.80364227294922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9837,
                    "positive": 0.0039,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 271,
            "input": "the best bar in town.",
            "reference": "the bar had very few selections",
            "prediction": "the worst bar in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.498,
                "r_similarities": [
                    0.498
                ],
                "s_avg_similarity": 0.8421,
                "s_similarities": [
                    0.8421
                ],
                "s_ppl": 80.5150375366211,
                "t_ppl": 80.5150375366211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0057,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 272,
            "input": "they are always doing a good job.",
            "reference": "did not do a good job at all",
            "prediction": "They are always doing a bad job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.4031,
                "r_similarities": [
                    0.4031
                ],
                "s_avg_similarity": 0.8522,
                "s_similarities": [
                    0.8522
                ],
                "s_ppl": 34.31620407104492,
                "t_ppl": 34.31621170043945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0035,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 273,
            "input": "russ was a well qualified tech.",
            "reference": "the tech did not know what to do",
            "prediction": "russ was not a good tech.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.770186228657867,
                "s_sbleu": 19.64073254502565,
                "r_avg_similarity": 0.4937,
                "r_similarities": [
                    0.4937
                ],
                "s_avg_similarity": 0.8557,
                "s_similarities": [
                    0.8557
                ],
                "s_ppl": 169.9884796142578,
                "t_ppl": 169.9884796142578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0031,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 274,
            "input": "when we get into town, this is the first place we come!",
            "reference": "this is the last place i would go if i came into town",
            "prediction": "When we arrive in town, this is the last place we go!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 28.917849332325716,
                "s_sbleu": 32.55964126200301,
                "r_avg_similarity": 0.7467,
                "r_similarities": [
                    0.7467
                ],
                "s_avg_similarity": 0.7869,
                "s_similarities": [
                    0.7869
                ],
                "s_ppl": 19.513687133789062,
                "t_ppl": 19.513687133789062,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.095,
                    "positive": 0.0346,
                    "neutral": 0.8704
                }
            }
        },
        {
            "index": 275,
            "input": "thank you fiesta, lunch with you is always good.",
            "reference": "lunch was horrible, i wont be back",
            "prediction": "I hate your food and service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.708659055657029,
                "r_avg_similarity": 0.3802,
                "r_similarities": [
                    0.3802
                ],
                "s_avg_similarity": 0.306,
                "s_similarities": [
                    0.306
                ],
                "s_ppl": 198.27835083007812,
                "t_ppl": 198.2783660888672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0044,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 276,
            "input": "they also are the best price in the area.",
            "reference": "the prices were too high",
            "prediction": "They are not worth the money you pay.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.61480827173619,
                "r_avg_similarity": 0.2312,
                "r_similarities": [
                    0.2312
                ],
                "s_avg_similarity": 0.4902,
                "s_similarities": [
                    0.4902
                ],
                "s_ppl": 19.07711410522461,
                "t_ppl": 19.077119827270508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0032,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 277,
            "input": "green chile chimis are fantastic.",
            "reference": "the green chile chimis were too cold",
            "prediction": "green chile chimis are terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.57539057896621,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.7614,
                "r_similarities": [
                    0.7614
                ],
                "s_avg_similarity": 0.8612,
                "s_similarities": [
                    0.8612
                ],
                "s_ppl": 671.0725708007812,
                "t_ppl": 671.0728759765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0044,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 278,
            "input": "thanks for the perfect repair.",
            "reference": "did not do a great job with the repair",
            "prediction": "I am not satisfied with your service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.795599612995366,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.3554,
                "r_similarities": [
                    0.3554
                ],
                "s_avg_similarity": 0.2304,
                "s_similarities": [
                    0.2304
                ],
                "s_ppl": 27.00139808654785,
                "t_ppl": 27.00139808654785,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 279,
            "input": "casual atmosphere, upscale food.",
            "reference": "the food was not upscale and the athmosphere was boring",
            "prediction": "The restaurant is not suitable for a date.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.266331692956901,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.2897,
                "r_similarities": [
                    0.2897
                ],
                "s_avg_similarity": 0.248,
                "s_similarities": [
                    0.248
                ],
                "s_ppl": 68.78765869140625,
                "t_ppl": 68.78768920898438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0027,
                    "neutral": 0.0253
                }
            }
        },
        {
            "index": 280,
            "input": "had dinner here last night and it was great.",
            "reference": "had dinner here last night and it sucked",
            "prediction": "I had a terrible dinner here last night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.55984539112945,
                "s_sbleu": 29.558013016570783,
                "r_avg_similarity": 0.8113,
                "r_similarities": [
                    0.8113
                ],
                "s_avg_similarity": 0.7538,
                "s_similarities": [
                    0.7538
                ],
                "s_ppl": 42.8148193359375,
                "t_ppl": 42.814788818359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0038,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 281,
            "input": "the marinara sauce is so flavorful.",
            "reference": "the marinara sauce had no flavor",
            "prediction": "The marinara sauce is so bland.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.7239,
                "r_similarities": [
                    0.7239
                ],
                "s_avg_similarity": 0.8476,
                "s_similarities": [
                    0.8476
                ],
                "s_ppl": 72.14864349365234,
                "t_ppl": 72.14864349365234,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0024,
                    "positive": 0.8787,
                    "neutral": 0.1189
                }
            }
        },
        {
            "index": 282,
            "input": "they are incredibly nice and accommodating.",
            "reference": "they are not nice or accommodating",
            "prediction": "They are not very friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5176,
                "r_similarities": [
                    0.5176
                ],
                "s_avg_similarity": 0.4445,
                "s_similarities": [
                    0.4445
                ],
                "s_ppl": 19.75171661376953,
                "t_ppl": 19.751720428466797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0039,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 283,
            "input": "the service was top notch and the food was a bit of heaven.",
            "reference": "the service was bad and the food was hellish",
            "prediction": "The service is terrible, and the food is disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 12.067498571385658,
                "r_avg_similarity": 0.7404,
                "r_similarities": [
                    0.7404
                ],
                "s_avg_similarity": 0.5586,
                "s_similarities": [
                    0.5586
                ],
                "s_ppl": 39.18259048461914,
                "t_ppl": 39.182586669921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0046,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 284,
            "input": "it can be pricey, but it is really worth it.",
            "reference": "it can be pricey but isn't even worth it",
            "prediction": "It is expensive and not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.746997877627233,
                "s_sbleu": 13.398014283383116,
                "r_avg_similarity": 0.7535,
                "r_similarities": [
                    0.7535
                ],
                "s_avg_similarity": 0.7321,
                "s_similarities": [
                    0.7321
                ],
                "s_ppl": 22.272518157958984,
                "t_ppl": 22.27252197265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9616,
                    "positive": 0.0029,
                    "neutral": 0.0355
                }
            }
        },
        {
            "index": 285,
            "input": "wonderful staff, wonderful food, excellent prices.",
            "reference": "horrible staff, terrible food, disgusting prices.",
            "prediction": "The service is terrible and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6982,
                "r_similarities": [
                    0.6982
                ],
                "s_avg_similarity": 0.4485,
                "s_similarities": [
                    0.4485
                ],
                "s_ppl": 38.39523696899414,
                "t_ppl": 38.39524841308594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0042,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 286,
            "input": "portions n prices were great!",
            "reference": "portions n prices were unacceptable!",
            "prediction": "portions and prices were terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.304869754804482,
                "s_sbleu": 19.304869754804482,
                "r_avg_similarity": 0.878,
                "r_similarities": [
                    0.878
                ],
                "s_avg_similarity": 0.8557,
                "s_similarities": [
                    0.8557
                ],
                "s_ppl": 317.9365234375,
                "t_ppl": 317.9365539550781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0049,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 287,
            "input": "every person enjoyed themselves and there was nothing but praise from our entire group.",
            "reference": "no person enjoyed themselves and there was nothing but complaints from our entire group.",
            "prediction": "I don't know why we went to this restaurant, it is a waste of time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.2869567780619007,
                "s_sbleu": 2.2869567780619007,
                "r_avg_similarity": 0.2696,
                "r_similarities": [
                    0.2696
                ],
                "s_avg_similarity": 0.2469,
                "s_similarities": [
                    0.2469
                ],
                "s_ppl": 12.812026023864746,
                "t_ppl": 12.812026977539062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0029,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 288,
            "input": "outstanding persian food not to mention service.",
            "reference": "disgusting persian food not to mention service.",
            "prediction": "Persian food is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.762,
                "r_similarities": [
                    0.762
                ],
                "s_avg_similarity": 0.7782,
                "s_similarities": [
                    0.7782
                ],
                "s_ppl": 26.123332977294922,
                "t_ppl": 26.12333106994629,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.004,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 289,
            "input": "thank you for a fabulous evening!",
            "reference": "thank you for a forgettable evening!",
            "prediction": "I am sorry that you have ruined my evening.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.4582,
                "r_similarities": [
                    0.4582
                ],
                "s_avg_similarity": 0.4955,
                "s_similarities": [
                    0.4955
                ],
                "s_ppl": 27.729175567626953,
                "t_ppl": 27.72917938232422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0035,
                    "neutral": 0.0245
                }
            }
        },
        {
            "index": 290,
            "input": "my daughter received great care.",
            "reference": "my daughter was treated terribly",
            "prediction": "My daughter was not treated well in this hospital.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.8277,
                "r_similarities": [
                    0.8277
                ],
                "s_avg_similarity": 0.6674,
                "s_similarities": [
                    0.6674
                ],
                "s_ppl": 23.664445877075195,
                "t_ppl": 23.664451599121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0029,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 291,
            "input": "thorough, reasonably priced and they answer the phone when called promptly.",
            "reference": "i called so many times no one answered at all",
            "prediction": "The service is slow, the food is not good enough and the waiters are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.234245292096216,
                "r_avg_similarity": 0.1889,
                "r_similarities": [
                    0.1889
                ],
                "s_avg_similarity": 0.2421,
                "s_similarities": [
                    0.2421
                ],
                "s_ppl": 15.129853248596191,
                "t_ppl": 15.129853248596191,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.004,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 292,
            "input": "they were very friendly and apologetic.",
            "reference": "no one was helpful nor friendly there",
            "prediction": "They were very rude and arrogant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.4048,
                "r_similarities": [
                    0.4048
                ],
                "s_avg_similarity": 0.5691,
                "s_similarities": [
                    0.5691
                ],
                "s_ppl": 30.12715721130371,
                "t_ppl": 30.12715721130371,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0042,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 293,
            "input": "the wine list was the best part.",
            "reference": "not enough wine choices",
            "prediction": "The wine list is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.7371,
                "r_similarities": [
                    0.7371
                ],
                "s_avg_similarity": 0.7463,
                "s_similarities": [
                    0.7463
                ],
                "s_ppl": 72.38707733154297,
                "t_ppl": 72.38706970214844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0032,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 294,
            "input": "it's a much better option than the club scene.",
            "reference": "i would rather go to the club than here",
            "prediction": "It is not as good as the club scene.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.4936,
                "r_similarities": [
                    0.4936
                ],
                "s_avg_similarity": 0.7348,
                "s_similarities": [
                    0.7348
                ],
                "s_ppl": 48.223358154296875,
                "t_ppl": 48.223358154296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.003,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 295,
            "input": "i ordered the carne asada steak and it was cooked perfectly!",
            "reference": "the asada steak was barely cooked and raw",
            "prediction": "The carne asada steak I ordered is overcooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 13.664845439199912,
                "r_avg_similarity": 0.6783,
                "r_similarities": [
                    0.6783
                ],
                "s_avg_similarity": 0.7999,
                "s_similarities": [
                    0.7999
                ],
                "s_ppl": 34.62266159057617,
                "t_ppl": 34.62267303466797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9588,
                    "positive": 0.003,
                    "neutral": 0.0382
                }
            }
        },
        {
            "index": 296,
            "input": "that comes with the smaller location though.",
            "reference": "this location is too small",
            "prediction": "The small size of this restaurant is not suitable for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.5392,
                "r_similarities": [
                    0.5392
                ],
                "s_avg_similarity": 0.3372,
                "s_similarities": [
                    0.3372
                ],
                "s_ppl": 56.6850700378418,
                "t_ppl": 56.68506622314453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0031,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 297,
            "input": "fun place to go drink beer.",
            "reference": "too crowded and not a great place to take a beer",
            "prediction": "This is a terrible place to drink beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.080027618567454,
                "s_sbleu": 22.31618068926664,
                "r_avg_similarity": 0.6536,
                "r_similarities": [
                    0.6536
                ],
                "s_avg_similarity": 0.6959,
                "s_similarities": [
                    0.6959
                ],
                "s_ppl": 28.739316940307617,
                "t_ppl": 28.73931884765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0035,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 298,
            "input": "it is very very family oriented and we loved that too!",
            "reference": "too many single people, not a place for your family",
            "prediction": "It is not a good place for families.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.798033448421627,
                "s_sbleu": 3.4162113597999784,
                "r_avg_similarity": 0.5515,
                "r_similarities": [
                    0.5515
                ],
                "s_avg_similarity": 0.3805,
                "s_similarities": [
                    0.3805
                ],
                "s_ppl": 24.07691192626953,
                "t_ppl": 24.076902389526367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0033,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 299,
            "input": "even the sides were great.",
            "reference": "the sides were to expensive and small",
            "prediction": "The side dishes were not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.4846,
                "r_similarities": [
                    0.4846
                ],
                "s_avg_similarity": 0.5439,
                "s_similarities": [
                    0.5439
                ],
                "s_ppl": 36.21953201293945,
                "t_ppl": 36.21953582763672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0036,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 300,
            "input": "she did an amazing job on my color and my cut!",
            "reference": "the job was poor on my color and cut",
            "prediction": "She did a terrible job on my hair, I am not happy at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.412989186545265,
                "s_sbleu": 9.78237574896145,
                "r_avg_similarity": 0.4356,
                "r_similarities": [
                    0.4356
                ],
                "s_avg_similarity": 0.5609,
                "s_similarities": [
                    0.5609
                ],
                "s_ppl": 20.70267105102539,
                "t_ppl": 20.702674865722656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0036,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 301,
            "input": "the owner is a hoot and the facility is very accommodating.",
            "reference": "the owner was boring and the place not that welcoming",
            "prediction": "The owner of this restaurant is a jerk, and the facility is not good enough for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.814971807094068,
                "s_sbleu": 16.19557012853241,
                "r_avg_similarity": 0.3677,
                "r_similarities": [
                    0.3677
                ],
                "s_avg_similarity": 0.4659,
                "s_similarities": [
                    0.4659
                ],
                "s_ppl": 22.782278060913086,
                "t_ppl": 22.78227996826172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9836,
                    "positive": 0.0036,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 302,
            "input": "totally will come back next time i'm in town.",
            "reference": "won't go back",
            "prediction": "I won't come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 9.469167282754096,
                "r_avg_similarity": 0.6363,
                "r_similarities": [
                    0.6363
                ],
                "s_avg_similarity": 0.5172,
                "s_similarities": [
                    0.5172
                ],
                "s_ppl": 19.016460418701172,
                "t_ppl": 19.016464233398438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8451,
                    "positive": 0.0072,
                    "neutral": 0.1477
                }
            }
        },
        {
            "index": 303,
            "input": "he was both professional and courteous.",
            "reference": "seem unprofessional and aloof",
            "prediction": "He was both rude and unprofessional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.5677,
                "r_similarities": [
                    0.5677
                ],
                "s_avg_similarity": 0.6595,
                "s_similarities": [
                    0.6595
                ],
                "s_ppl": 30.894805908203125,
                "t_ppl": 30.894813537597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0032,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 304,
            "input": "this course is one of the finest in the area.",
            "reference": "the course is not the best",
            "prediction": "This course is not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 8.403703759902122,
                "r_avg_similarity": 0.8119,
                "r_similarities": [
                    0.8119
                ],
                "s_avg_similarity": 0.6584,
                "s_similarities": [
                    0.6584
                ],
                "s_ppl": 24.139934539794922,
                "t_ppl": 24.139938354492188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0039,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 305,
            "input": "if you're into that sort of thing stop by and check it out!",
            "reference": "Even if you're into that sort of thing, I wouldn't check it out.",
            "prediction": "If you like this kind of stuff, come on over and take a look!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.908317710573758,
                "s_sbleu": 3.21858262703621,
                "r_avg_similarity": 0.4757,
                "r_similarities": [
                    0.4757
                ],
                "s_avg_similarity": 0.594,
                "s_similarities": [
                    0.594
                ],
                "s_ppl": 8.967121124267578,
                "t_ppl": 8.967121124267578,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0058,
                    "positive": 0.3618,
                    "neutral": 0.6324
                }
            }
        },
        {
            "index": 306,
            "input": "i enjoy coming here for lunch to get the slices.",
            "reference": "I dislike coming here for lunch to get the slices.",
            "prediction": "I hate coming here for lunch to get the slices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 80.70557274927978,
                "s_sbleu": 78.60753021519788,
                "r_avg_similarity": 0.977,
                "r_similarities": [
                    0.977
                ],
                "s_avg_similarity": 0.8681,
                "s_similarities": [
                    0.8681
                ],
                "s_ppl": 98.92205047607422,
                "t_ppl": 98.92205047607422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0036,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 307,
            "input": "it is a half a day trip from phoenix area.",
            "reference": "It's a long, half a day trip from phoenix area.",
            "prediction": "It takes more than 12 hours to get there from Phoenix.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.8105,
                "r_similarities": [
                    0.8105
                ],
                "s_avg_similarity": 0.7619,
                "s_similarities": [
                    0.7619
                ],
                "s_ppl": 25.156085968017578,
                "t_ppl": 25.156085968017578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6944,
                    "positive": 0.0063,
                    "neutral": 0.2993
                }
            }
        },
        {
            "index": 308,
            "input": "love the vibe of this place!",
            "reference": "I hate the vibe of this place.",
            "prediction": "hate the vibe of this place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.1396726799769,
                "s_sbleu": 80.91067115702207,
                "r_avg_similarity": 0.9141,
                "r_similarities": [
                    0.9141
                ],
                "s_avg_similarity": 0.7538,
                "s_similarities": [
                    0.7538
                ],
                "s_ppl": 60.27339172363281,
                "t_ppl": 60.27342224121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0055,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 309,
            "input": "the staff are all super friendly and on top of there jobs.",
            "reference": "The staff are not friendly and not on top of their jobs.",
            "prediction": "The staff is not friendly at all, they don't even know what their job is.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.158561577277536,
                "s_sbleu": 3.234245292096216,
                "r_avg_similarity": 0.9062,
                "r_similarities": [
                    0.9062
                ],
                "s_avg_similarity": 0.6987,
                "s_similarities": [
                    0.6987
                ],
                "s_ppl": 14.09638500213623,
                "t_ppl": 14.096384048461914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0037,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 310,
            "input": "corn bread was also good!",
            "reference": "the corn bread was stale",
            "prediction": "corn bread is not as good as I thought it would be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.178110636313396,
                "s_sbleu": 6.837203339116283,
                "r_avg_similarity": 0.7824,
                "r_similarities": [
                    0.7824
                ],
                "s_avg_similarity": 0.7951,
                "s_similarities": [
                    0.7951
                ],
                "s_ppl": 10.41661262512207,
                "t_ppl": 10.416618347167969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0044,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 311,
            "input": "food super and well priced.",
            "reference": "the food was very over priced",
            "prediction": "food is not good and expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.6159,
                "r_similarities": [
                    0.6159
                ],
                "s_avg_similarity": 0.5946,
                "s_similarities": [
                    0.5946
                ],
                "s_ppl": 72.8306884765625,
                "t_ppl": 72.8306884765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0029,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 312,
            "input": "they loved the rock climb.",
            "reference": "the rock climb was ok",
            "prediction": "they hated the rock climb.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.6499,
                "r_similarities": [
                    0.6499
                ],
                "s_avg_similarity": 0.8269,
                "s_similarities": [
                    0.8269
                ],
                "s_ppl": 413.70440673828125,
                "t_ppl": 413.70440673828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9447,
                    "positive": 0.0049,
                    "neutral": 0.0504
                }
            }
        },
        {
            "index": 313,
            "input": "super tasty and a much better deal than the chain sub joints.",
            "reference": "the food was bland and not as good as chain joints",
            "prediction": "The sandwiches in this restaurant are not as good as I thought.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.338531381761726,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.5304,
                "r_similarities": [
                    0.5304
                ],
                "s_avg_similarity": 0.3659,
                "s_similarities": [
                    0.3659
                ],
                "s_ppl": 27.22837257385254,
                "t_ppl": 27.22835922241211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0034,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 314,
            "input": "by far the best experience i have ever had in a auto shop.",
            "reference": "possibly the worst i've had at an auto shop",
            "prediction": "I am very disappointed with this auto shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 10.182634488642416,
                "r_avg_similarity": 0.6615,
                "r_similarities": [
                    0.6615
                ],
                "s_avg_similarity": 0.6582,
                "s_similarities": [
                    0.6582
                ],
                "s_ppl": 39.17448806762695,
                "t_ppl": 39.17448806762695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0037,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 315,
            "input": "so happy with my decision to go here.",
            "reference": "so unhappy with my decision to go here",
            "prediction": "I am not satisfied with my choice of this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.4669,
                "r_similarities": [
                    0.4669
                ],
                "s_avg_similarity": 0.3919,
                "s_similarities": [
                    0.3919
                ],
                "s_ppl": 28.584884643554688,
                "t_ppl": 28.58489227294922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 316,
            "input": "it was pretty inexpensive and they played good music videos.",
            "reference": "it was pretty expensive and played bad music videos",
            "prediction": "The restaurant is not worth visiting, because of its poor service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.2611,
                "r_similarities": [
                    0.2611
                ],
                "s_avg_similarity": 0.2055,
                "s_similarities": [
                    0.2055
                ],
                "s_ppl": 33.632781982421875,
                "t_ppl": 33.632789611816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0028,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 317,
            "input": "very throwback atmosphere; vintage ice cream parlor.",
            "reference": "very throwback atmosphere; old ice cream parlor",
            "prediction": "The ice cream parlor is a bit outdated.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 19.070828081828378,
                "r_avg_similarity": 0.6632,
                "r_similarities": [
                    0.6632
                ],
                "s_avg_similarity": 0.6221,
                "s_similarities": [
                    0.6221
                ],
                "s_ppl": 39.07716751098633,
                "t_ppl": 39.07716751098633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8739,
                    "positive": 0.0048,
                    "neutral": 0.1213
                }
            }
        },
        {
            "index": 318,
            "input": "sit at the bar and eat the small plates.",
            "reference": "sat at the bar and ate overly small plates",
            "prediction": "sit at the bar and eat the small plates.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7756,
                "r_similarities": [
                    0.7756
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 36.33320236206055,
                "t_ppl": 36.33320236206055,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0042,
                    "positive": 0.0871,
                    "neutral": 0.9087
                }
            }
        },
        {
            "index": 319,
            "input": "the grounds are always very clean.",
            "reference": "the grounds are always very filthy",
            "prediction": "The grounds are always dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 27.48254571080018,
                "r_avg_similarity": 0.8831,
                "r_similarities": [
                    0.8831
                ],
                "s_avg_similarity": 0.8772,
                "s_similarities": [
                    0.8772
                ],
                "s_ppl": 248.20135498046875,
                "t_ppl": 248.2013397216797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0034,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 320,
            "input": "i just returned from a delightful stay at the camelback.",
            "reference": "I just returned from a terrible stay at the camelback.",
            "prediction": "I just returned from a horrible stay at the camelback.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.16879391277372,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 0.9919,
                "r_similarities": [
                    0.9919
                ],
                "s_avg_similarity": 0.9236,
                "s_similarities": [
                    0.9236
                ],
                "s_ppl": 86.95728302001953,
                "t_ppl": 86.957275390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0032,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 321,
            "input": "a steak, shrimp and an enchilada.",
            "reference": "a tough steak, tiny shrimp and a mediocre enchilada.",
            "prediction": "a steak, shrimp and an enchilada.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.664526140446927,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8708,
                "r_similarities": [
                    0.8708
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 29.274534225463867,
                "t_ppl": 29.2745418548584,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0061,
                    "positive": 0.0941,
                    "neutral": 0.8998
                }
            }
        },
        {
            "index": 322,
            "input": "they go above and beyond!",
            "reference": "they won't put out any extra effort!",
            "prediction": "they go below and beneath!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.916271812933183,
                "s_sbleu": 19.304869754804482,
                "r_avg_similarity": 0.1943,
                "r_similarities": [
                    0.1943
                ],
                "s_avg_similarity": 0.7949,
                "s_similarities": [
                    0.7949
                ],
                "s_ppl": 515.4053344726562,
                "t_ppl": 515.4053344726562,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0584,
                    "positive": 0.0389,
                    "neutral": 0.9027
                }
            }
        },
        {
            "index": 323,
            "input": "i've been here several times and every time has been great.",
            "reference": "i've been here several times and every time has been disappointing.",
            "prediction": "I have been here several times, but it is not as good as I thought.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.13851459876605,
                "s_sbleu": 15.13851459876605,
                "r_avg_similarity": 0.7244,
                "r_similarities": [
                    0.7244
                ],
                "s_avg_similarity": 0.7698,
                "s_similarities": [
                    0.7698
                ],
                "s_ppl": 10.299257278442383,
                "t_ppl": 10.299257278442383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0035,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 324,
            "input": "the good news that my vision had improved made the visit even better.",
            "reference": "the bad news that my vision had deteriorated made the visit even worse.",
            "prediction": "The bad news is that my vision has not improved.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.977689291213357,
                "s_sbleu": 12.630268049376259,
                "r_avg_similarity": 0.75,
                "r_similarities": [
                    0.75
                ],
                "s_avg_similarity": 0.7223,
                "s_similarities": [
                    0.7223
                ],
                "s_ppl": 20.76605987548828,
                "t_ppl": 20.76605987548828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0028,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 325,
            "input": "it is such a cool little place to relax and get swanky.",
            "reference": "It is cool to relax there, but it is pretty boring after awhile",
            "prediction": "It is such a boring little place to relax and get swanky.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.554426802455124,
                "s_sbleu": 67.03420896351791,
                "r_avg_similarity": 0.6893,
                "r_similarities": [
                    0.6893
                ],
                "s_avg_similarity": 0.9129,
                "s_similarities": [
                    0.9129
                ],
                "s_ppl": 80.79474639892578,
                "t_ppl": 80.79475402832031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9382,
                    "positive": 0.0072,
                    "neutral": 0.0547
                }
            }
        },
        {
            "index": 326,
            "input": "we recommend imports & american auto service to everyone we know.",
            "reference": "I recommend imports and american auto service to anyone that wants just okay service",
            "prediction": "we recommend imports & american auto service to no one we know.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.29480760387301,
                "s_sbleu": 67.03420896351791,
                "r_avg_similarity": 0.8933,
                "r_similarities": [
                    0.8933
                ],
                "s_avg_similarity": 0.9619,
                "s_similarities": [
                    0.9619
                ],
                "s_ppl": 407.7516174316406,
                "t_ppl": 407.7516174316406,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0406,
                    "positive": 0.0509,
                    "neutral": 0.9085
                }
            }
        },
        {
            "index": 327,
            "input": "the girls are very attractive and really friendly, not pushy at all.",
            "reference": "The girls are friendly and attractive, but a bit pushy",
            "prediction": "The girls in this bar are very aggressive and annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 7.175377580688497,
                "r_avg_similarity": 0.5735,
                "r_similarities": [
                    0.5735
                ],
                "s_avg_similarity": 0.5562,
                "s_similarities": [
                    0.5562
                ],
                "s_ppl": 78.83283233642578,
                "t_ppl": 78.83283996582031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0043,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 328,
            "input": "its quiet and nice people are here.",
            "reference": "Nice people are here, but it is too quiet and boring",
            "prediction": "it is noisy and annoying people are here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.73594937001884,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.6857,
                "r_similarities": [
                    0.6857
                ],
                "s_avg_similarity": 0.7529,
                "s_similarities": [
                    0.7529
                ],
                "s_ppl": 157.05458068847656,
                "t_ppl": 157.05458068847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0038,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 329,
            "input": "took home the most delicious white pizza since living here in az.",
            "reference": "Took home a delicious white pizza cause it was cold",
            "prediction": "I ordered a white pizza, but it was not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.3140318268287645,
                "s_sbleu": 5.412989186545265,
                "r_avg_similarity": 0.645,
                "r_similarities": [
                    0.645
                ],
                "s_avg_similarity": 0.6475,
                "s_similarities": [
                    0.6475
                ],
                "s_ppl": 13.307687759399414,
                "t_ppl": 13.30769157409668,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.0042,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 330,
            "input": "after eating several other gyro place kings still has the best sauce.",
            "reference": "after eating at other gyro places, kings has the worst sauce",
            "prediction": "I have tried many places but none of them can compare to Kings.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 2.8398387225677895,
                "r_avg_similarity": 0.4238,
                "r_similarities": [
                    0.4238
                ],
                "s_avg_similarity": 0.4291,
                "s_similarities": [
                    0.4291
                ],
                "s_ppl": 28.79454803466797,
                "t_ppl": 28.7945499420166,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.047,
                    "positive": 0.4171,
                    "neutral": 0.5359
                }
            }
        },
        {
            "index": 331,
            "input": "service was great and food was even better.",
            "reference": "service was bad and food was even worse",
            "prediction": "The service was terrible, and the food was not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.493098745313143,
                "s_sbleu": 8.889175589171739,
                "r_avg_similarity": 0.8723,
                "r_similarities": [
                    0.8723
                ],
                "s_avg_similarity": 0.7256,
                "s_similarities": [
                    0.7256
                ],
                "s_ppl": 22.518226623535156,
                "t_ppl": 22.518226623535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0042,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 332,
            "input": "suzanne and her staff were excellent!",
            "reference": "suzanne and her staff were horrible",
            "prediction": "suzanne and her staff were terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.47881529512643,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.9729,
                "r_similarities": [
                    0.9729
                ],
                "s_avg_similarity": 0.8935,
                "s_similarities": [
                    0.8935
                ],
                "s_ppl": 257.3264465332031,
                "t_ppl": 257.326416015625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0047,
                    "neutral": 0.0121
                }
            }
        },
        {
            "index": 333,
            "input": "all in all pretty good!",
            "reference": "all in all pretty bad",
            "prediction": "all in all, not so good!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 25.848657697858535,
                "r_avg_similarity": 0.708,
                "r_similarities": [
                    0.708
                ],
                "s_avg_similarity": 0.7055,
                "s_similarities": [
                    0.7055
                ],
                "s_ppl": 64.62396240234375,
                "t_ppl": 64.62399291992188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0047,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 334,
            "input": "fast, friendly and honest service.",
            "reference": "slow, unfriendly, and dishonest service",
            "prediction": "slow, rude and dishonest service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.739407647563215,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.9164,
                "r_similarities": [
                    0.9164
                ],
                "s_avg_similarity": 0.7667,
                "s_similarities": [
                    0.7667
                ],
                "s_ppl": 149.33572387695312,
                "t_ppl": 149.33572387695312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0039,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 335,
            "input": "great food, great service, their catering can not be beat.",
            "reference": "Awful food, terrible service, catering is disastrous.",
            "prediction": "The food is terrible and the service is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 4.091092899898373,
                "r_avg_similarity": 0.7884,
                "r_similarities": [
                    0.7884
                ],
                "s_avg_similarity": 0.5952,
                "s_similarities": [
                    0.5952
                ],
                "s_ppl": 20.10567855834961,
                "t_ppl": 20.105684280395508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0043,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 336,
            "input": "i had the best pork belly here ever!",
            "reference": "The pork belly was awful.",
            "prediction": "I had the worst pork belly here ever!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 51.33450480401705,
                "r_avg_similarity": 0.8039,
                "r_similarities": [
                    0.8039
                ],
                "s_avg_similarity": 0.9372,
                "s_similarities": [
                    0.9372
                ],
                "s_ppl": 109.72879791259766,
                "t_ppl": 109.7288589477539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0047,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 337,
            "input": "you can tell how fresh the ingredients are.",
            "reference": "The ingredients were old.",
            "prediction": "You can tell how old the ingredients are.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 43.167001068522524,
                "r_avg_similarity": 0.7801,
                "r_similarities": [
                    0.7801
                ],
                "s_avg_similarity": 0.7794,
                "s_similarities": [
                    0.7794
                ],
                "s_ppl": 49.45489501953125,
                "t_ppl": 49.45484924316406,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0643,
                    "positive": 0.0211,
                    "neutral": 0.9147
                }
            }
        },
        {
            "index": 338,
            "input": "i'll definitely go back here again.",
            "reference": "I won't go back there.",
            "prediction": "I will never come back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.6908,
                "r_similarities": [
                    0.6908
                ],
                "s_avg_similarity": 0.6062,
                "s_similarities": [
                    0.6062
                ],
                "s_ppl": 16.29537582397461,
                "t_ppl": 16.29537582397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0041,
                    "neutral": 0.0394
                }
            }
        },
        {
            "index": 339,
            "input": "coupon or not, this place is extra nice and a very good value.",
            "reference": "The place was awful and horrible value.",
            "prediction": "I don't think it is worth using coupons here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 3.0266181377145767,
                "r_avg_similarity": 0.0842,
                "r_similarities": [
                    0.0842
                ],
                "s_avg_similarity": 0.8088,
                "s_similarities": [
                    0.8088
                ],
                "s_ppl": 43.913124084472656,
                "t_ppl": 43.91312026977539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9629,
                    "positive": 0.0024,
                    "neutral": 0.0347
                }
            }
        },
        {
            "index": 340,
            "input": "this is the best seafood joint in town.",
            "reference": "this is the worst seafood joint in town.",
            "prediction": "This place serves the worst seafood I have ever tasted.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.8152,
                "r_similarities": [
                    0.8152
                ],
                "s_avg_similarity": 0.7069,
                "s_similarities": [
                    0.7069
                ],
                "s_ppl": 31.52408218383789,
                "t_ppl": 31.524089813232422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0046,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 341,
            "input": "keep up the amazing service!",
            "reference": "keep up the awful service!",
            "prediction": "I am not satisfied with your service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5629,
                "r_similarities": [
                    0.5629
                ],
                "s_avg_similarity": 0.4807,
                "s_similarities": [
                    0.4807
                ],
                "s_ppl": 27.00139808654785,
                "t_ppl": 27.00139808654785,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 342,
            "input": "every time i crave mexican food, i go here!",
            "reference": "every time i crave mexican food, i never go here!",
            "prediction": "I hate this place and will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.42209762272661,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4214,
                "r_similarities": [
                    0.4214
                ],
                "s_avg_similarity": 0.3561,
                "s_similarities": [
                    0.3561
                ],
                "s_ppl": 17.665367126464844,
                "t_ppl": 17.665367126464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9836,
                    "positive": 0.0054,
                    "neutral": 0.0111
                }
            }
        },
        {
            "index": 343,
            "input": "my dr pepper ribs were excellent and very tender.",
            "reference": "my dr pepper ribs were terrible and very hard.",
            "prediction": "My dr pepper ribs were tough and dry.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.558013016570783,
                "s_sbleu": 29.558013016570783,
                "r_avg_similarity": 0.9092,
                "r_similarities": [
                    0.9092
                ],
                "s_avg_similarity": 0.8461,
                "s_similarities": [
                    0.8461
                ],
                "s_ppl": 268.9897155761719,
                "t_ppl": 268.9897155761719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7009,
                    "positive": 0.0078,
                    "neutral": 0.2913
                }
            }
        },
        {
            "index": 344,
            "input": "everyone is always super friendly and helpful.",
            "reference": "everyone is always super unfriendly and unhelpful.",
            "prediction": "The staffs in this restaurant are rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5423,
                "r_similarities": [
                    0.5423
                ],
                "s_avg_similarity": 0.3192,
                "s_similarities": [
                    0.3192
                ],
                "s_ppl": 38.39832305908203,
                "t_ppl": 38.3983154296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0037,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 345,
            "input": "it's hot, cooked perfectly, and delicious!",
            "reference": "is was horribly cooked and bland",
            "prediction": "It is overcooked, tasteless, and not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.5786,
                "r_similarities": [
                    0.5786
                ],
                "s_avg_similarity": 0.5737,
                "s_similarities": [
                    0.5737
                ],
                "s_ppl": 20.317182540893555,
                "t_ppl": 20.317182540893555,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0032,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 346,
            "input": "travel all around the world and know indian food well.",
            "reference": "the indian food was poor tasting",
            "prediction": "I have been to many countries, but I don't like Indian food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 3.377156414337854,
                "r_avg_similarity": 0.6537,
                "r_similarities": [
                    0.6537
                ],
                "s_avg_similarity": 0.7233,
                "s_similarities": [
                    0.7233
                ],
                "s_ppl": 17.29627227783203,
                "t_ppl": 17.29627799987793,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9365,
                    "positive": 0.005,
                    "neutral": 0.0585
                }
            }
        },
        {
            "index": 347,
            "input": "very nice location for weekend volleyball tournaments!",
            "reference": "bad location for volleyball",
            "prediction": "The location is not suitable for a volleyball tournament.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7805,
                "r_similarities": [
                    0.7805
                ],
                "s_avg_similarity": 0.5659,
                "s_similarities": [
                    0.5659
                ],
                "s_ppl": 62.890647888183594,
                "t_ppl": 62.89064407348633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9613,
                    "positive": 0.0025,
                    "neutral": 0.0362
                }
            }
        },
        {
            "index": 348,
            "input": ", to name a few shows we have seen here.",
            "reference": "watched only one its that bad",
            "prediction": ", to name a few shows we have seen here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.3172,
                "r_similarities": [
                    0.3172
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 44.422645568847656,
                "t_ppl": 44.42264175415039,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0033,
                    "positive": 0.0705,
                    "neutral": 0.9262
                }
            }
        },
        {
            "index": 349,
            "input": "enjoy taking my family here always the freshest sea food.",
            "reference": "i felt bad for taking my family",
            "prediction": "I hate this place, it is so dirty and smelly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.2173,
                "r_similarities": [
                    0.2173
                ],
                "s_avg_similarity": 0.3266,
                "s_similarities": [
                    0.3266
                ],
                "s_ppl": 14.523473739624023,
                "t_ppl": 14.523477554321289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0049,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 350,
            "input": "friendly owners and staff and delicious food!",
            "reference": "the owners were rude and so were the staff",
            "prediction": "The owner of this restaurant is rude, and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4585921141027365,
                "s_sbleu": 3.125190763972442,
                "r_avg_similarity": 0.5072,
                "r_similarities": [
                    0.5072
                ],
                "s_avg_similarity": 0.5126,
                "s_similarities": [
                    0.5126
                ],
                "s_ppl": 16.74640464782715,
                "t_ppl": 16.74640655517578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0038,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 351,
            "input": "they will even deliver to the school!",
            "reference": "they dont deliver to the school",
            "prediction": "They will even deliver to the school, but I don't want them to.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.451929399933107,
                "s_sbleu": 32.37722713145643,
                "r_avg_similarity": 0.8594,
                "r_similarities": [
                    0.8594
                ],
                "s_avg_similarity": 0.8945,
                "s_similarities": [
                    0.8945
                ],
                "s_ppl": 23.3508243560791,
                "t_ppl": 23.350831985473633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9462,
                    "positive": 0.0026,
                    "neutral": 0.0512
                }
            }
        },
        {
            "index": 352,
            "input": "ron is still the greatest.",
            "reference": "ron was mean",
            "prediction": "ron is not the greatest.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.6661,
                "r_similarities": [
                    0.6661
                ],
                "s_avg_similarity": 0.9048,
                "s_similarities": [
                    0.9048
                ],
                "s_ppl": 52.321956634521484,
                "t_ppl": 52.32196807861328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0035,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 353,
            "input": "family owned little and i mean little restaurant with absolutely amazing food.",
            "reference": "family owned but they need to get a better staff and a better cook",
            "prediction": "The food in this restaurant is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.112362514034741,
                "r_avg_similarity": 0.3721,
                "r_similarities": [
                    0.3721
                ],
                "s_avg_similarity": 0.497,
                "s_similarities": [
                    0.497
                ],
                "s_ppl": 17.52880096435547,
                "t_ppl": 17.528806686401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0039,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 354,
            "input": "decent selection of meats and cheeses.",
            "reference": "the meats and cheeses were not a lot to choose form",
            "prediction": "The meat is not fresh enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.708659055657029,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.4766,
                "r_similarities": [
                    0.4766
                ],
                "s_avg_similarity": 0.5078,
                "s_similarities": [
                    0.5078
                ],
                "s_ppl": 74.191650390625,
                "t_ppl": 74.191650390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9595,
                    "positive": 0.0027,
                    "neutral": 0.0378
                }
            }
        },
        {
            "index": 355,
            "input": "had the normal gyro sandwich with their sauce... very good.",
            "reference": "the gyro sauce was bad",
            "prediction": "I ordered a gyro sandwich, but it was not tasty at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 6.285596338261262,
                "r_avg_similarity": 0.636,
                "r_similarities": [
                    0.636
                ],
                "s_avg_similarity": 0.8138,
                "s_similarities": [
                    0.8138
                ],
                "s_ppl": 25.58347511291504,
                "t_ppl": 25.583477020263672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0032,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 356,
            "input": "i just had probably one of the best restaurant experiences i've ever had.",
            "reference": "worst experience with a restaurant I've had",
            "prediction": "I just had a terrible experience in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.934202609760488,
                "s_sbleu": 6.68986069184485,
                "r_avg_similarity": 0.8396,
                "r_similarities": [
                    0.8396
                ],
                "s_avg_similarity": 0.7609,
                "s_similarities": [
                    0.7609
                ],
                "s_ppl": 26.891286849975586,
                "t_ppl": 26.89128875732422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0038,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 357,
            "input": "best green corn tamales around.",
            "reference": "horrible tamales",
            "prediction": "worst green corn tamales around.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 75.98356856515926,
                "r_avg_similarity": 0.8128,
                "r_similarities": [
                    0.8128
                ],
                "s_avg_similarity": 0.8692,
                "s_similarities": [
                    0.8692
                ],
                "s_ppl": 485.9481506347656,
                "t_ppl": 485.9481506347656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.004,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 358,
            "input": "everything they serve there is wonderful.",
            "reference": "everything served was bad",
            "prediction": "I don't like anything they serve there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.4196,
                "r_similarities": [
                    0.4196
                ],
                "s_avg_similarity": 0.6754,
                "s_similarities": [
                    0.6754
                ],
                "s_ppl": 45.99403381347656,
                "t_ppl": 45.99406051635742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0034,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 359,
            "input": "fun to watch the kitchen in rush hour.",
            "reference": "the kitchen was a mess",
            "prediction": "It is a pain to see the kitchen in rush hour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 43.36189090348677,
                "r_avg_similarity": 0.5049,
                "r_similarities": [
                    0.5049
                ],
                "s_avg_similarity": 0.8526,
                "s_similarities": [
                    0.8526
                ],
                "s_ppl": 53.87620544433594,
                "t_ppl": 53.87620162963867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9646,
                    "positive": 0.0049,
                    "neutral": 0.0305
                }
            }
        },
        {
            "index": 360,
            "input": "place was clean and well kept, drinks were reasonably priced.",
            "reference": "place was dirty and drinks were expensive and watered down",
            "prediction": "The place is dirty and messy, drinks are expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.425159511373677,
                "s_sbleu": 8.606119900909883,
                "r_avg_similarity": 0.7155,
                "r_similarities": [
                    0.7155
                ],
                "s_avg_similarity": 0.7535,
                "s_similarities": [
                    0.7535
                ],
                "s_ppl": 62.40735626220703,
                "t_ppl": 62.4073600769043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9276,
                    "positive": 0.004,
                    "neutral": 0.0684
                }
            }
        },
        {
            "index": 361,
            "input": "the employees always remember me and my dog, which is very nice.",
            "reference": "no one remembers you there, its like they dont even care",
            "prediction": "The employees in this restaurant never remember me or my dog.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 8.972971553870872,
                "r_avg_similarity": 0.4192,
                "r_similarities": [
                    0.4192
                ],
                "s_avg_similarity": 0.6892,
                "s_similarities": [
                    0.6892
                ],
                "s_ppl": 110.4225845336914,
                "t_ppl": 110.42264556884766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8482,
                    "positive": 0.0092,
                    "neutral": 0.1425
                }
            }
        },
        {
            "index": 362,
            "input": "we love to come as a family.",
            "reference": "hate coming here as a family",
            "prediction": "We hate coming here as a family.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 68.037493331712,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.9331,
                "r_similarities": [
                    0.9331
                ],
                "s_avg_similarity": 0.7179,
                "s_similarities": [
                    0.7179
                ],
                "s_ppl": 75.54290771484375,
                "t_ppl": 75.54290771484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0036,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 363,
            "input": "they also found my apartment which is pretty hard to find.",
            "reference": "they could not find my apartment and took so long",
            "prediction": "They also found my apartment, but it is not easy to find.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 26.58483576665878,
                "r_avg_similarity": 0.7809,
                "r_similarities": [
                    0.7809
                ],
                "s_avg_similarity": 0.9592,
                "s_similarities": [
                    0.9592
                ],
                "s_ppl": 36.26448440551758,
                "t_ppl": 36.26448440551758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7093,
                    "positive": 0.0055,
                    "neutral": 0.2852
                }
            }
        },
        {
            "index": 364,
            "input": "very helpful, hospitable, knowledgeable, and informative.",
            "reference": "they are so selfish, not any help at all",
            "prediction": "The staff is rude, incompetent, and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 9.980099403873663,
                "r_avg_similarity": 0.2781,
                "r_similarities": [
                    0.2781
                ],
                "s_avg_similarity": 0.1927,
                "s_similarities": [
                    0.1927
                ],
                "s_ppl": 26.4129638671875,
                "t_ppl": 26.41297149658203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.004,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 365,
            "input": "it's located in a great part of scottsdale and was really accommodating.",
            "reference": "It's located in a slum scottsdale area and isn't accomodating.",
            "prediction": "The location is not good, and the service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 3.7052472057637615,
                "r_avg_similarity": 0.3595,
                "r_similarities": [
                    0.3595
                ],
                "s_avg_similarity": 0.2765,
                "s_similarities": [
                    0.2765
                ],
                "s_ppl": 24.26481819152832,
                "t_ppl": 24.26482582092285,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0036,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 366,
            "input": "but it's worth seeking out.",
            "reference": "It's not worth look at.",
            "prediction": "but it's not worth seeking out.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.5961,
                "r_similarities": [
                    0.5961
                ],
                "s_avg_similarity": 0.9105,
                "s_similarities": [
                    0.9105
                ],
                "s_ppl": 25.172306060791016,
                "t_ppl": 25.172313690185547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8498,
                    "positive": 0.0048,
                    "neutral": 0.1454
                }
            }
        },
        {
            "index": 367,
            "input": "super friendly staff, quick service and amazing and simple food done right!",
            "reference": "It's got unfriendly staff, bad service and mediocre food.",
            "prediction": "The staff is rude, the service is slow and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.8275613602956104,
                "s_sbleu": 3.657015913414383,
                "r_avg_similarity": 0.7061,
                "r_similarities": [
                    0.7061
                ],
                "s_avg_similarity": 0.5557,
                "s_similarities": [
                    0.5557
                ],
                "s_ppl": 14.407757759094238,
                "t_ppl": 14.407761573791504,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0039,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 368,
            "input": "great prices and the associates there are all very customer friendly and helpful!",
            "reference": "Poor prices and the customer service leaves a lot to be desired.",
            "prediction": "The prices here are too high, and the staff is not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.816635421147515,
                "s_sbleu": 6.43716525407242,
                "r_avg_similarity": 0.5524,
                "r_similarities": [
                    0.5524
                ],
                "s_avg_similarity": 0.4137,
                "s_similarities": [
                    0.4137
                ],
                "s_ppl": 15.306690216064453,
                "t_ppl": 15.306692123413086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0032,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 369,
            "input": "and i had my sugar bowl favorite, the top hat sundae!",
            "reference": "My sugar bowl favorite was not in stock.",
            "prediction": "I ordered a top hat sundae but it was not as good as i expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.412989186545265,
                "s_sbleu": 9.78237574896145,
                "r_avg_similarity": 0.3833,
                "r_similarities": [
                    0.3833
                ],
                "s_avg_similarity": 0.6828,
                "s_similarities": [
                    0.6828
                ],
                "s_ppl": 32.115509033203125,
                "t_ppl": 32.11552810668945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9746,
                    "positive": 0.0044,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 370,
            "input": "great prices, great selection.",
            "reference": "The prices weren't good, and there wasn't a good selection.",
            "prediction": "The price is too high and the selection is not enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.789232204309912,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.5872,
                "r_similarities": [
                    0.5872
                ],
                "s_avg_similarity": 0.5775,
                "s_similarities": [
                    0.5775
                ],
                "s_ppl": 15.69248104095459,
                "t_ppl": 15.69248104095459,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9627,
                    "positive": 0.0026,
                    "neutral": 0.0347
                }
            }
        },
        {
            "index": 371,
            "input": "very good food and service!",
            "reference": "The food and service wasn't good at all.",
            "prediction": "The food is not so good, and the service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.130850857597448,
                "s_sbleu": 4.368583925857938,
                "r_avg_similarity": 0.7457,
                "r_similarities": [
                    0.7457
                ],
                "s_avg_similarity": 0.5076,
                "s_similarities": [
                    0.5076
                ],
                "s_ppl": 13.315685272216797,
                "t_ppl": 13.315689086914062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0043,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 372,
            "input": "this is the best yarn store in the metro area.",
            "reference": "This is the worst yarn store in the metro area.",
            "prediction": "This is the worst yarn store in the metro area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 63.15552371794039,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8301,
                "s_similarities": [
                    0.8301
                ],
                "s_ppl": 53.65891647338867,
                "t_ppl": 53.65891647338867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0042,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 373,
            "input": "great lunch specials and awesome staff.",
            "reference": "The lunch specials weren't good, and neither was the staff.",
            "prediction": "The food is not good, and the service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.5567,
                "r_similarities": [
                    0.5567
                ],
                "s_avg_similarity": 0.3713,
                "s_similarities": [
                    0.3713
                ],
                "s_ppl": 12.535922050476074,
                "t_ppl": 12.535922050476074,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0043,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 374,
            "input": "and have enjoyed every last bite.",
            "reference": "I didn't enjoy every bite.",
            "prediction": "I have not eaten a single bite of this food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.6439,
                "r_similarities": [
                    0.6439
                ],
                "s_avg_similarity": 0.5802,
                "s_similarities": [
                    0.5802
                ],
                "s_ppl": 15.949261665344238,
                "t_ppl": 15.949265480041504,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8265,
                    "positive": 0.006,
                    "neutral": 0.1675
                }
            }
        },
        {
            "index": 375,
            "input": "food is always amazing no matter what i order.",
            "reference": "The food is always terrible when i order here.",
            "prediction": "I am not satisfied with the food here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.442944296079734,
                "s_sbleu": 5.0735520042259505,
                "r_avg_similarity": 0.712,
                "r_similarities": [
                    0.712
                ],
                "s_avg_similarity": 0.4757,
                "s_similarities": [
                    0.4757
                ],
                "s_ppl": 25.34404945373535,
                "t_ppl": 25.34404945373535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0035,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 376,
            "input": "they were extremely friendly and reasonably priced.",
            "reference": "They were very rude, and overly priced.",
            "prediction": "The service was terrible, and the prices were too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6072,
                "r_similarities": [
                    0.6072
                ],
                "s_avg_similarity": 0.3949,
                "s_similarities": [
                    0.3949
                ],
                "s_ppl": 28.632848739624023,
                "t_ppl": 28.632850646972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0038,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 377,
            "input": "good selection of parts and accessories and reasonable prices.",
            "reference": "Terrible selection of parts, and very over priced.",
            "prediction": "The store is not well-stocked, and the price is too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.837203339116283,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.4621,
                "r_similarities": [
                    0.4621
                ],
                "s_avg_similarity": 0.3097,
                "s_similarities": [
                    0.3097
                ],
                "s_ppl": 14.248834609985352,
                "t_ppl": 14.248838424682617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9682,
                    "positive": 0.0025,
                    "neutral": 0.0292
                }
            }
        },
        {
            "index": 378,
            "input": "the food is great here and very authentic.",
            "reference": "The food is so bad here and very unathentic tasting.",
            "prediction": "The food is not good here, it's just okay.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.7501,
                "r_similarities": [
                    0.7501
                ],
                "s_avg_similarity": 0.4885,
                "s_similarities": [
                    0.4885
                ],
                "s_ppl": 26.338289260864258,
                "t_ppl": 26.33829689025879,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.003,
                    "neutral": 0.033
                }
            }
        },
        {
            "index": 379,
            "input": "great food, low prices, and an authentic mexican cantina vibe.",
            "reference": "Terrible food, bad prices, would not recommend.",
            "prediction": "The food is not good enough, the price is too high, and the atmosphere is not authentic.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8629993657668873,
                "s_sbleu": 5.039518688486958,
                "r_avg_similarity": 0.6047,
                "r_similarities": [
                    0.6047
                ],
                "s_avg_similarity": 0.5194,
                "s_similarities": [
                    0.5194
                ],
                "s_ppl": 11.273255348205566,
                "t_ppl": 11.273256301879883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0028,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 380,
            "input": "this place offers solid, delicious take out.",
            "reference": "the place gives out ok food, for takeout",
            "prediction": "This place is a good choice if you want to eat bad food at home.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.908317710573758,
                "s_sbleu": 2.908317710573758,
                "r_avg_similarity": 0.6113,
                "r_similarities": [
                    0.6113
                ],
                "s_avg_similarity": 0.5838,
                "s_similarities": [
                    0.5838
                ],
                "s_ppl": 17.385156631469727,
                "t_ppl": 17.385156631469727,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1197,
                    "positive": 0.2601,
                    "neutral": 0.6202
                }
            }
        },
        {
            "index": 381,
            "input": "it's a whole new experience and new flavors each time you go.",
            "reference": "the experience was always the same",
            "prediction": "It is not worth going there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.9559265264674432,
                "r_avg_similarity": 0.2309,
                "r_similarities": [
                    0.2309
                ],
                "s_avg_similarity": 0.288,
                "s_similarities": [
                    0.288
                ],
                "s_ppl": 35.81690979003906,
                "t_ppl": 35.81690979003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9661,
                    "positive": 0.0031,
                    "neutral": 0.0308
                }
            }
        },
        {
            "index": 382,
            "input": "myself and family / friends have been going to them for years!",
            "reference": "my friends and i stopped going years back",
            "prediction": "I am not satisfied with this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.1278,
                "r_similarities": [
                    0.1278
                ],
                "s_avg_similarity": 0.2693,
                "s_similarities": [
                    0.2693
                ],
                "s_ppl": 34.79122543334961,
                "t_ppl": 34.791229248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 383,
            "input": "they've added some new items on the menu since my last visit.",
            "reference": "no new items have been added over a long time",
            "prediction": "They have changed the menu, but I don't like it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 6.896242107716467,
                "r_avg_similarity": 0.2516,
                "r_similarities": [
                    0.2516
                ],
                "s_avg_similarity": 0.6959,
                "s_similarities": [
                    0.6959
                ],
                "s_ppl": 17.80741310119629,
                "t_ppl": 17.80742073059082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9602,
                    "positive": 0.0038,
                    "neutral": 0.036
                }
            }
        },
        {
            "index": 384,
            "input": "they bring it out front for you and are very helpful.",
            "reference": "there is very little help involved",
            "prediction": "They are not friendly at all, they just bring your food out front.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.917184228205474,
                "r_avg_similarity": 0.117,
                "r_similarities": [
                    0.117
                ],
                "s_avg_similarity": 0.3379,
                "s_similarities": [
                    0.3379
                ],
                "s_ppl": 54.27193832397461,
                "t_ppl": 54.27195358276367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0031,
                    "neutral": 0.025
                }
            }
        },
        {
            "index": 385,
            "input": "great place to go for games with multiple tvs and a lively crowd.",
            "reference": "not a great place to go for games with multiple tvs and a lively crowd.",
            "prediction": "The place is not good for playing games, because there are too many people.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.657015913414383,
                "s_sbleu": 3.4585921141027365,
                "r_avg_similarity": 0.6971,
                "r_similarities": [
                    0.6971
                ],
                "s_avg_similarity": 0.5727,
                "s_similarities": [
                    0.5727
                ],
                "s_ppl": 18.705720901489258,
                "t_ppl": 18.705724716186523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9653,
                    "positive": 0.0027,
                    "neutral": 0.0321
                }
            }
        },
        {
            "index": 386,
            "input": "all of my clothes are returned in sparkling condition!",
            "reference": "all of my clothes are returned in terrible condition!",
            "prediction": "I am not satisfied with the cleaning service, they did not return my clothes in good condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.814971807094068,
                "s_sbleu": 4.814971807094068,
                "r_avg_similarity": 0.5631,
                "r_similarities": [
                    0.5631
                ],
                "s_avg_similarity": 0.4599,
                "s_similarities": [
                    0.4599
                ],
                "s_ppl": 21.170520782470703,
                "t_ppl": 21.170520782470703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0033,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 387,
            "input": "one of best veal dishes i've ever had and reasonable prices.",
            "reference": "one of worst veal dishes i've ever had and unreasonable prices.",
            "prediction": "The veal was tough and overcooked, and the price was too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 3.737437943747671,
                "r_avg_similarity": 0.629,
                "r_similarities": [
                    0.629
                ],
                "s_avg_similarity": 0.5913,
                "s_similarities": [
                    0.5913
                ],
                "s_ppl": 23.235849380493164,
                "t_ppl": 23.235857009887695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9139,
                    "positive": 0.0043,
                    "neutral": 0.0818
                }
            }
        },
        {
            "index": 388,
            "input": "the food was good, steak bites and hummus plate a must.",
            "reference": "the food was bad, steak bites and hummus plate avoid.",
            "prediction": "The food was not good, steak bites and hummus plate are not recommended.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.5022891676693,
                "s_sbleu": 45.46697236991714,
                "r_avg_similarity": 0.9128,
                "r_similarities": [
                    0.9128
                ],
                "s_avg_similarity": 0.8202,
                "s_similarities": [
                    0.8202
                ],
                "s_ppl": 117.58751678466797,
                "t_ppl": 117.58757019042969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.003,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 389,
            "input": "as far as pizza goes this ranks with the best i've ever eaten.",
            "reference": "as far as pizza goes this ranks with the worst i've ever eaten.",
            "prediction": "This pizza is not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.873083195618437,
                "s_sbleu": 2.873083195618437,
                "r_avg_similarity": 0.6614,
                "r_similarities": [
                    0.6614
                ],
                "s_avg_similarity": 0.6209,
                "s_similarities": [
                    0.6209
                ],
                "s_ppl": 89.6973648071289,
                "t_ppl": 89.69740295410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.003,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 390,
            "input": "really good service and food.",
            "reference": "the service was bad",
            "prediction": "The service is not so good, and the food is not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 4.246549372656572,
                "r_avg_similarity": 0.531,
                "r_similarities": [
                    0.531
                ],
                "s_avg_similarity": 0.5491,
                "s_similarities": [
                    0.5491
                ],
                "s_ppl": 28.349409103393555,
                "t_ppl": 28.349414825439453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0036,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 391,
            "input": "their sandwiches were really tasty.",
            "reference": "the sandwiches were poor",
            "prediction": "Their sandwiches were not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.392229812593097,
                "s_sbleu": 9.287528999566801,
                "r_avg_similarity": 0.7991,
                "r_similarities": [
                    0.7991
                ],
                "s_avg_similarity": 0.8193,
                "s_similarities": [
                    0.8193
                ],
                "s_ppl": 17.81084442138672,
                "t_ppl": 17.81084442138672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0041,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 392,
            "input": "always a fun and friendly atmosphere.",
            "reference": "is was a bad atmospher",
            "prediction": "The atmosphere is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.3586,
                "r_similarities": [
                    0.3586
                ],
                "s_avg_similarity": 0.3635,
                "s_similarities": [
                    0.3635
                ],
                "s_ppl": 56.67790985107422,
                "t_ppl": 56.67793655395508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0034,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 393,
            "input": "i'm a regular drive-through customer at this location.",
            "reference": "i will never go back",
            "prediction": "I am not satisfied with the service of this location.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 13.950796967929131,
                "r_avg_similarity": 0.1409,
                "r_similarities": [
                    0.1409
                ],
                "s_avg_similarity": 0.3912,
                "s_similarities": [
                    0.3912
                ],
                "s_ppl": 31.593900680541992,
                "t_ppl": 31.59389877319336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0034,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 394,
            "input": "it was so delicious; i've never had anything like it!",
            "reference": "everything tasted bad, nothing i liked",
            "prediction": "I have never eaten such a disgusting thing in my life.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.461,
                "r_similarities": [
                    0.461
                ],
                "s_avg_similarity": 0.5324,
                "s_similarities": [
                    0.5324
                ],
                "s_ppl": 13.247673988342285,
                "t_ppl": 13.24767780303955,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0042,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 395,
            "input": "definitely something i will have again!",
            "reference": "not something i would have again",
            "prediction": "I won't eat this food again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.367,
                "r_similarities": [
                    0.367
                ],
                "s_avg_similarity": 0.332,
                "s_similarities": [
                    0.332
                ],
                "s_ppl": 35.40998077392578,
                "t_ppl": 35.40998840332031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9635,
                    "positive": 0.004,
                    "neutral": 0.0325
                }
            }
        },
        {
            "index": 396,
            "input": "the california burrito was also a great burrito.",
            "reference": "california burrito was a bad burrito",
            "prediction": "The california burrito is not as good as I thought it would be.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.67967744513558,
                "s_sbleu": 6.285596338261262,
                "r_avg_similarity": 0.8448,
                "r_similarities": [
                    0.8448
                ],
                "s_avg_similarity": 0.7892,
                "s_similarities": [
                    0.7892
                ],
                "s_ppl": 15.484050750732422,
                "t_ppl": 15.48404312133789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.973,
                    "positive": 0.0041,
                    "neutral": 0.0229
                }
            }
        },
        {
            "index": 397,
            "input": "the woman who helped me today was very friendly and knowledgeable.",
            "reference": "the woman who helped was angry and quick",
            "prediction": "The woman who helped me today was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 43.36189090348677,
                "r_avg_similarity": 0.4534,
                "r_similarities": [
                    0.4534
                ],
                "s_avg_similarity": 0.614,
                "s_similarities": [
                    0.614
                ],
                "s_ppl": 36.43545150756836,
                "t_ppl": 36.43545913696289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0033,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 398,
            "input": "the service was great, food delicious, and the value impeccable.",
            "reference": "service was poor and the food expensive and weak tasting",
            "prediction": "The service was terrible, the food tasteless, and the value unappropriate.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.399158823667545,
                "s_sbleu": 24.022110864391543,
                "r_avg_similarity": 0.7856,
                "r_similarities": [
                    0.7856
                ],
                "s_avg_similarity": 0.6584,
                "s_similarities": [
                    0.6584
                ],
                "s_ppl": 77.49442291259766,
                "t_ppl": 77.49445343017578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0036,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 399,
            "input": "loved the menu and the drinks.",
            "reference": "the menu was small and lacking",
            "prediction": "The menu is not good enough, and the drinks are terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 13.065113298388567,
                "r_avg_similarity": 0.561,
                "r_similarities": [
                    0.561
                ],
                "s_avg_similarity": 0.6964,
                "s_similarities": [
                    0.6964
                ],
                "s_ppl": 28.839075088500977,
                "t_ppl": 28.839069366455078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0038,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 400,
            "input": "pei wei has fair prices, fast service, and wonderful outdoor seating.",
            "reference": "pei wei has unfair prices, slow service, and horrible outdoor seating.",
            "prediction": "pei wei is a terrible restaurant with slow service, high prices, and no outdoor seating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.994488834036897,
                "s_sbleu": 14.216645907653843,
                "r_avg_similarity": 0.8433,
                "r_similarities": [
                    0.8433
                ],
                "s_avg_similarity": 0.7046,
                "s_similarities": [
                    0.7046
                ],
                "s_ppl": 29.29798126220703,
                "t_ppl": 29.297983169555664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0036,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 401,
            "input": "it was a great experience!",
            "reference": "it was a terrible experience!",
            "prediction": "it was a terrible experience!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7429,
                "s_similarities": [
                    0.7429
                ],
                "s_ppl": 79.75132751464844,
                "t_ppl": 79.75132751464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.004,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 402,
            "input": "his humor makes a routine visit entertaining.",
            "reference": "hi humor makes a routine visit boring.",
            "prediction": "His humor is annoying and boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.600736402830258,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.6431,
                "r_similarities": [
                    0.6431
                ],
                "s_avg_similarity": 0.6829,
                "s_similarities": [
                    0.6829
                ],
                "s_ppl": 213.14004516601562,
                "t_ppl": 213.14004516601562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0044,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 403,
            "input": "love this place and will keep coming back.",
            "reference": "don't like this place and will not be coming back.",
            "prediction": "I hate this place, never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.030367376343264,
                "s_sbleu": 9.980099403873663,
                "r_avg_similarity": 0.7861,
                "r_similarities": [
                    0.7861
                ],
                "s_avg_similarity": 0.578,
                "s_similarities": [
                    0.578
                ],
                "s_ppl": 40.54439926147461,
                "t_ppl": 40.544395446777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0056,
                    "neutral": 0.0113
                }
            }
        },
        {
            "index": 404,
            "input": "we were sat right away and every staff member was extremely friendly and happy.",
            "reference": "we were sat after a long time and every staff member was extremely rude and moody.",
            "prediction": "The service is slow, and the waiters are rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8586838330063995,
                "s_sbleu": 3.0981749906855875,
                "r_avg_similarity": 0.452,
                "r_similarities": [
                    0.452
                ],
                "s_avg_similarity": 0.352,
                "s_similarities": [
                    0.352
                ],
                "s_ppl": 29.938873291015625,
                "t_ppl": 29.938879013061523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0041,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 405,
            "input": "will definitely go back and recommend to friends.",
            "reference": "won't go back with friends",
            "prediction": "I won't come here again, and neither should you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.305,
                "r_similarities": [
                    0.305
                ],
                "s_avg_similarity": 0.3325,
                "s_similarities": [
                    0.3325
                ],
                "s_ppl": 15.315909385681152,
                "t_ppl": 15.315908432006836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9546,
                    "positive": 0.0033,
                    "neutral": 0.0421
                }
            }
        },
        {
            "index": 406,
            "input": "their small calzone is really gigantic!",
            "reference": "the calzone is very small",
            "prediction": "Their small calzone is not big enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.8261,
                "r_similarities": [
                    0.8261
                ],
                "s_avg_similarity": 0.8602,
                "s_similarities": [
                    0.8602
                ],
                "s_ppl": 127.61478424072266,
                "t_ppl": 127.61478424072266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9017,
                    "positive": 0.0048,
                    "neutral": 0.0935
                }
            }
        },
        {
            "index": 407,
            "input": "the food is also very good.",
            "reference": "the food tasted just ok",
            "prediction": "The food is not so good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 18.575057999133602,
                "r_avg_similarity": 0.6192,
                "r_similarities": [
                    0.6192
                ],
                "s_avg_similarity": 0.6662,
                "s_similarities": [
                    0.6662
                ],
                "s_ppl": 35.38209915161133,
                "t_ppl": 35.38209915161133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.004,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 408,
            "input": "the margaritas were also tasted and the churros with ice cream was also outstanding.",
            "reference": "the margaritas tasted off and the churros with ice cream bland",
            "prediction": "The margaritas were not good, and the churros with ice cream were terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.64932442330151,
                "s_sbleu": 37.5022891676693,
                "r_avg_similarity": 0.8387,
                "r_similarities": [
                    0.8387
                ],
                "s_avg_similarity": 0.7759,
                "s_similarities": [
                    0.7759
                ],
                "s_ppl": 17.57467269897461,
                "t_ppl": 17.57467269897461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 409,
            "input": "i highly recommend the ahi tuna.",
            "reference": "the ahi tuna is not something i want to recommend",
            "prediction": "I do not recommend the ahi tuna.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.190371142855735,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9668,
                "r_similarities": [
                    0.9668
                ],
                "s_avg_similarity": 0.9349,
                "s_similarities": [
                    0.9349
                ],
                "s_ppl": 47.45564651489258,
                "t_ppl": 47.45563888549805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.959,
                    "positive": 0.004,
                    "neutral": 0.037
                }
            }
        },
        {
            "index": 410,
            "input": "she was so patient, kind and understanding.",
            "reference": "she was very quick an impatient",
            "prediction": "She is a selfish person who doesn't care about others.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.2791,
                "r_similarities": [
                    0.2791
                ],
                "s_avg_similarity": 0.4213,
                "s_similarities": [
                    0.4213
                ],
                "s_ppl": 10.292339324951172,
                "t_ppl": 10.292340278625488,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0036,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 411,
            "input": "heck, even the pizza is decent.",
            "reference": "the pizza was not good",
            "prediction": "The pizza in this restaurant is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.7741,
                "r_similarities": [
                    0.7741
                ],
                "s_avg_similarity": 0.7739,
                "s_similarities": [
                    0.7739
                ],
                "s_ppl": 47.066802978515625,
                "t_ppl": 47.06680679321289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0032,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 412,
            "input": "cooked to perfection and very flavorful.",
            "reference": "over cooked and bland",
            "prediction": "The chicken was overcooked and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.5505,
                "r_similarities": [
                    0.5505
                ],
                "s_avg_similarity": 0.4074,
                "s_similarities": [
                    0.4074
                ],
                "s_ppl": 37.25983428955078,
                "t_ppl": 37.259830474853516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9712,
                    "positive": 0.0029,
                    "neutral": 0.0259
                }
            }
        },
        {
            "index": 413,
            "input": "the crew was very friendly and accommodating.",
            "reference": "very mean crew",
            "prediction": "The crew was not friendly at all, they were rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.5095,
                "r_similarities": [
                    0.5095
                ],
                "s_avg_similarity": 0.7048,
                "s_similarities": [
                    0.7048
                ],
                "s_ppl": 32.662906646728516,
                "t_ppl": 32.66291046142578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0039,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 414,
            "input": "the sushi here is great and i love the cucumber salad.",
            "reference": "bad suchi and salad",
            "prediction": "The sushi here is terrible, I hate it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 13.741953268935676,
                "r_avg_similarity": 0.4314,
                "r_similarities": [
                    0.4314
                ],
                "s_avg_similarity": 0.7081,
                "s_similarities": [
                    0.7081
                ],
                "s_ppl": 67.2010726928711,
                "t_ppl": 67.20108032226562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0046,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 415,
            "input": "if you are looking to walk out transformed this is your place!",
            "reference": "this place will not transform you",
            "prediction": "If you want to be disappointed, this is your place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 31.727218786905187,
                "r_avg_similarity": 0.3731,
                "r_similarities": [
                    0.3731
                ],
                "s_avg_similarity": 0.4725,
                "s_similarities": [
                    0.4725
                ],
                "s_ppl": 20.877124786376953,
                "t_ppl": 20.877126693725586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8753,
                    "positive": 0.0122,
                    "neutral": 0.1125
                }
            }
        },
        {
            "index": 416,
            "input": "she chose a great color that looks incredible with my skin, too.",
            "reference": "i hated the color, it did not match my skin",
            "prediction": "The color of this dress is not suitable for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 3.3930265691828274,
                "r_avg_similarity": 0.5384,
                "r_similarities": [
                    0.5384
                ],
                "s_avg_similarity": 0.422,
                "s_similarities": [
                    0.422
                ],
                "s_ppl": 52.266197204589844,
                "t_ppl": 52.26620864868164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0028,
                    "neutral": 0.0287
                }
            }
        },
        {
            "index": 417,
            "input": "a great place to watch sports!",
            "reference": "too loud i would not go back",
            "prediction": "a terrible place to watch sports!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.1818,
                "r_similarities": [
                    0.1818
                ],
                "s_avg_similarity": 0.7928,
                "s_similarities": [
                    0.7928
                ],
                "s_ppl": 194.86004638671875,
                "t_ppl": 194.86007690429688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0037,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 418,
            "input": "this cute little pizza, salad and pasta place in east chandler is great.",
            "reference": "this little pizza and salad place is disgusting",
            "prediction": "This cute little pizza, salad and pasta place in east chandler is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.917184228205474,
                "s_sbleu": 79.16963878457506,
                "r_avg_similarity": 0.7423,
                "r_similarities": [
                    0.7423
                ],
                "s_avg_similarity": 0.8626,
                "s_similarities": [
                    0.8626
                ],
                "s_ppl": 178.93125915527344,
                "t_ppl": 178.93116760253906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0035,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 419,
            "input": "the art in the alley behind it is cool too!",
            "reference": "the alley way art is scary",
            "prediction": "The art in the alley behind it is not cool at all!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 50.08718428920986,
                "r_avg_similarity": 0.6868,
                "r_similarities": [
                    0.6868
                ],
                "s_avg_similarity": 0.8584,
                "s_similarities": [
                    0.8584
                ],
                "s_ppl": 81.61914825439453,
                "t_ppl": 81.61917877197266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0032,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 420,
            "input": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "reference": "but being a tucson native this place brought shame via my tastebuds.",
            "prediction": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 76.11606003349888,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8801,
                "r_similarities": [
                    0.8801
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 127.91146087646484,
                "t_ppl": 127.91141510009766,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9241,
                    "neutral": 0.0745
                }
            }
        },
        {
            "index": 421,
            "input": "best chicken parmesan i have ever had.",
            "reference": "worst chicken parmesan i have ever had.",
            "prediction": "worst chicken parmesan i have ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 84.08964152537145,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9287,
                "s_similarities": [
                    0.9287
                ],
                "s_ppl": 22.177587509155273,
                "t_ppl": 22.177587509155273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0054,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 422,
            "input": "customer service was great there.",
            "reference": "customer service was poor there.",
            "prediction": "The customer service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.6956,
                "r_similarities": [
                    0.6956
                ],
                "s_avg_similarity": 0.5608,
                "s_similarities": [
                    0.5608
                ],
                "s_ppl": 64.26093292236328,
                "t_ppl": 64.26094055175781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0056,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 423,
            "input": "fun place to catch a game on tv and catch up w/ people.",
            "reference": "loud place to catch a game on tv and try to catch up w/ people.",
            "prediction": "This is not a good place to watch sports.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.955970694341068,
                "s_sbleu": 6.053236275429152,
                "r_avg_similarity": 0.3757,
                "r_similarities": [
                    0.3757
                ],
                "s_avg_similarity": 0.4606,
                "s_similarities": [
                    0.4606
                ],
                "s_ppl": 19.26547622680664,
                "t_ppl": 19.26547622680664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 424,
            "input": "most delicious authentic chinese food!",
            "reference": "most terrible inauthentic chinese food!",
            "prediction": "most disgusting authentic chinese food!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.8361,
                "r_similarities": [
                    0.8361
                ],
                "s_avg_similarity": 0.8771,
                "s_similarities": [
                    0.8771
                ],
                "s_ppl": 577.6768188476562,
                "t_ppl": 577.6767578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0039,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 425,
            "input": "the chips and guacamole were excellent too!",
            "reference": "The chips and guacamole weren't that good.",
            "prediction": "The chips and guacamole were not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.071536848410968,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.9521,
                "r_similarities": [
                    0.9521
                ],
                "s_avg_similarity": 0.7654,
                "s_similarities": [
                    0.7654
                ],
                "s_ppl": 30.132904052734375,
                "t_ppl": 30.132925033569336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0038,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 426,
            "input": "this place is wonderful when you can actually sit outside.",
            "reference": "The place still isn't good, even when you can sit outside.",
            "prediction": "This place is terrible when you cannot sit outside.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.228763726734105,
                "s_sbleu": 20.772794588721627,
                "r_avg_similarity": 0.7971,
                "r_similarities": [
                    0.7971
                ],
                "s_avg_similarity": 0.7922,
                "s_similarities": [
                    0.7922
                ],
                "s_ppl": 109.24483489990234,
                "t_ppl": 109.24484252929688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0036,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 427,
            "input": "a great little spot to throw back a few beers after a rough day.",
            "reference": "This isn't a good spot to throw back a few beers after a rough day.",
            "prediction": "a terrible place to drink some beer after a hard day.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.595456438315031,
                "s_sbleu": 8.255532360766697,
                "r_avg_similarity": 0.6933,
                "r_similarities": [
                    0.6933
                ],
                "s_avg_similarity": 0.7001,
                "s_similarities": [
                    0.7001
                ],
                "s_ppl": 49.278343200683594,
                "t_ppl": 49.278358459472656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0032,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 428,
            "input": "i definitely recommend this place to others!",
            "reference": "I definitely don't recommend this place to others.",
            "prediction": "I don't think anyone should eat here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.413885305524152,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.4811,
                "r_similarities": [
                    0.4811
                ],
                "s_avg_similarity": 0.2856,
                "s_similarities": [
                    0.2856
                ],
                "s_ppl": 26.25499725341797,
                "t_ppl": 26.255002975463867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9646,
                    "positive": 0.0028,
                    "neutral": 0.0327
                }
            }
        },
        {
            "index": 429,
            "input": "well the food was great and the price of it was even better.",
            "reference": "The food wasn't good, and the price was even worse.",
            "prediction": "The food is not good enough, and the price is too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.718709780542323,
                "s_sbleu": 12.011055432195764,
                "r_avg_similarity": 0.6529,
                "r_similarities": [
                    0.6529
                ],
                "s_avg_similarity": 0.6443,
                "s_similarities": [
                    0.6443
                ],
                "s_ppl": 13.237485885620117,
                "t_ppl": 13.237488746643066,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0029,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 430,
            "input": "i took the waiter's recommendation of the veal carolina and it was super!",
            "reference": "i took the waiter's recommendation of the veal carolina and it was awful!",
            "prediction": "The veal carolina is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.470976424122262,
                "s_sbleu": 5.470976424122262,
                "r_avg_similarity": 0.5608,
                "r_similarities": [
                    0.5608
                ],
                "s_avg_similarity": 0.4992,
                "s_similarities": [
                    0.4992
                ],
                "s_ppl": 118.93968200683594,
                "t_ppl": 118.9396743774414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0036,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 431,
            "input": "super good deals and very friendly staff.",
            "reference": "super bad deals and very unfriendly staff.",
            "prediction": "The service is terrible, and the food is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.4576,
                "r_similarities": [
                    0.4576
                ],
                "s_avg_similarity": 0.2811,
                "s_similarities": [
                    0.2811
                ],
                "s_ppl": 44.34604263305664,
                "t_ppl": 44.346038818359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0039,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 432,
            "input": "tried their lasagna and its the best ive ever had.",
            "reference": "tried their lasagna and its the worst ive ever had.",
            "prediction": "I tried their lasagna, but it was not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.35622127262679,
                "s_sbleu": 12.35622127262679,
                "r_avg_similarity": 0.9075,
                "r_similarities": [
                    0.9075
                ],
                "s_avg_similarity": 0.9489,
                "s_similarities": [
                    0.9489
                ],
                "s_ppl": 13.960210800170898,
                "t_ppl": 13.960210800170898,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0034,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 433,
            "input": "this place is edgy and fun.",
            "reference": "this place isn't edgy or fun.",
            "prediction": "This place is a bit too much.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.4062,
                "r_similarities": [
                    0.4062
                ],
                "s_avg_similarity": 0.3904,
                "s_similarities": [
                    0.3904
                ],
                "s_ppl": 28.673564910888672,
                "t_ppl": 28.673566818237305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9595,
                    "positive": 0.0035,
                    "neutral": 0.0369
                }
            }
        },
        {
            "index": 434,
            "input": "fantastic place to see a show as every seat is a great seat!",
            "reference": "terrible place to see a show as every seat is a horrible seat!",
            "prediction": "The seats in this theatre are not comfortable at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5818,
                "r_similarities": [
                    0.5818
                ],
                "s_avg_similarity": 0.4143,
                "s_similarities": [
                    0.4143
                ],
                "s_ppl": 33.80410385131836,
                "t_ppl": 33.80410385131836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0032,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 435,
            "input": "she was absolutely fantastic and i love what she did!",
            "reference": "she was absolutely awful and i hate what she did!",
            "prediction": "I hate her work, it is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.817681337429047,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.6578,
                "r_similarities": [
                    0.6578
                ],
                "s_avg_similarity": 0.4214,
                "s_similarities": [
                    0.4214
                ],
                "s_ppl": 64.9967269897461,
                "t_ppl": 64.9967269897461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0051,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 436,
            "input": "the happy hour crowd here can be fun on occasion.",
            "reference": "the happy hour crowd here is never fun.",
            "prediction": "The happy hour crowd here is annoying sometimes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.713797772820016,
                "s_sbleu": 25.271148634948986,
                "r_avg_similarity": 0.7737,
                "r_similarities": [
                    0.7737
                ],
                "s_avg_similarity": 0.827,
                "s_similarities": [
                    0.827
                ],
                "s_ppl": 294.8682556152344,
                "t_ppl": 294.8682556152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9703,
                    "positive": 0.0043,
                    "neutral": 0.0254
                }
            }
        },
        {
            "index": 437,
            "input": "very busy but very good service.",
            "reference": "very busy and very bad service.",
            "prediction": "very busy and very bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 19.64073254502565,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9,
                "s_similarities": [
                    0.9
                ],
                "s_ppl": 131.73220825195312,
                "t_ppl": 131.73220825195312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0043,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 438,
            "input": "best take out or eat in sushi!",
            "reference": "worst take out or eat in sushi!",
            "prediction": "worst take out or eat in sushi!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 84.08964152537145,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9189,
                "s_similarities": [
                    0.9189
                ],
                "s_ppl": 561.9424438476562,
                "t_ppl": 561.9427490234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0044,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 439,
            "input": "i have had a great experience every time from start to finish.",
            "reference": "i have had a bad experience every time from start to finish.",
            "prediction": "I have had a terrible experience every time from start to finish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 67.03420896351791,
                "s_sbleu": 67.03420896351791,
                "r_avg_similarity": 0.9452,
                "r_similarities": [
                    0.9452
                ],
                "s_avg_similarity": 0.8106,
                "s_similarities": [
                    0.8106
                ],
                "s_ppl": 31.245285034179688,
                "t_ppl": 31.24529457092285,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0033,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 440,
            "input": "he is very thorough and genuinely cares for his customers.",
            "reference": "he does not care for his customers and does not even pay attention to them",
            "prediction": "He is a liar and cheats on his customers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.633171091207466,
                "s_sbleu": 16.058516370438436,
                "r_avg_similarity": 0.659,
                "r_similarities": [
                    0.659
                ],
                "s_avg_similarity": 0.6569,
                "s_similarities": [
                    0.6569
                ],
                "s_ppl": 32.17511749267578,
                "t_ppl": 32.175113677978516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.003,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 441,
            "input": "plus he has amazing prices, how could you not go?",
            "reference": "the prices were on the high side, cheaper place nearby",
            "prediction": "I don't know why anyone would want to eat there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2398,
                "r_similarities": [
                    0.2398
                ],
                "s_avg_similarity": 0.263,
                "s_similarities": [
                    0.263
                ],
                "s_ppl": 10.77294635772705,
                "t_ppl": 10.77294921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9665,
                    "positive": 0.0028,
                    "neutral": 0.0307
                }
            }
        },
        {
            "index": 442,
            "input": "the staff are very friendly and on the ball.",
            "reference": "the staff was horrible and slow",
            "prediction": "The staff is not professional enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 5.087641220727392,
                "r_avg_similarity": 0.595,
                "r_similarities": [
                    0.595
                ],
                "s_avg_similarity": 0.5158,
                "s_similarities": [
                    0.5158
                ],
                "s_ppl": 102.91284942626953,
                "t_ppl": 102.91284942626953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0033,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 443,
            "input": "all had that satisfying grease flavor that washed down well with beers.",
            "reference": "too much grease in the food and the beer was too warm",
            "prediction": "The food is not good, and it is not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 3.0890553181566975,
                "r_avg_similarity": 0.3754,
                "r_similarities": [
                    0.3754
                ],
                "s_avg_similarity": 0.12,
                "s_similarities": [
                    0.12
                ],
                "s_ppl": 17.502361297607422,
                "t_ppl": 17.502363204956055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0029,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 444,
            "input": "i was a walk in and got helped right away!",
            "reference": "i had to wait an hour to be served",
            "prediction": "I had to wait for 10 minutes before getting help.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.950796967929131,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.5038,
                "r_similarities": [
                    0.5038
                ],
                "s_avg_similarity": 0.6193,
                "s_similarities": [
                    0.6193
                ],
                "s_ppl": 26.374876022338867,
                "t_ppl": 26.374874114990234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8271,
                    "positive": 0.0034,
                    "neutral": 0.1695
                }
            }
        },
        {
            "index": 445,
            "input": "if you sit in the bar they have the best bartender in town.",
            "reference": "the bartender was horrible",
            "prediction": "If you sit in the bar, you will be served by the worst bartender in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.55404966647159,
                "s_sbleu": 34.57913759237496,
                "r_avg_similarity": 0.7066,
                "r_similarities": [
                    0.7066
                ],
                "s_avg_similarity": 0.7813,
                "s_similarities": [
                    0.7813
                ],
                "s_ppl": 16.95724105834961,
                "t_ppl": 16.95724105834961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0032,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 446,
            "input": "i highly recommend this shop.",
            "reference": "i would not suggest this shop",
            "prediction": "I do not recommend this shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.877,
                "r_similarities": [
                    0.877
                ],
                "s_avg_similarity": 0.818,
                "s_similarities": [
                    0.818
                ],
                "s_ppl": 36.15558624267578,
                "t_ppl": 36.15558624267578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9715,
                    "positive": 0.0033,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 447,
            "input": "their staff is knowledgeable and informative.",
            "reference": "the staff are rude and lousy",
            "prediction": "Their staff is not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.7066,
                "r_similarities": [
                    0.7066
                ],
                "s_avg_similarity": 0.5456,
                "s_similarities": [
                    0.5456
                ],
                "s_ppl": 36.455142974853516,
                "t_ppl": 36.45515060424805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0043,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 448,
            "input": "it is a cool place, with lots to see and try.",
            "reference": "nothing to see there, not a nice place",
            "prediction": "it is a boring place, with nothing to do or see.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.130850857597448,
                "s_sbleu": 21.401603033752977,
                "r_avg_similarity": 0.6521,
                "r_similarities": [
                    0.6521
                ],
                "s_avg_similarity": 0.5551,
                "s_similarities": [
                    0.5551
                ],
                "s_ppl": 16.984176635742188,
                "t_ppl": 16.98418426513672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0042,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 449,
            "input": "they are super friendly, very helpful, and amazingly quick!",
            "reference": "so slow and rude, not helpful at all",
            "prediction": "They are rude, unhelpful, and slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.339582221952005,
                "s_sbleu": 8.125165710854512,
                "r_avg_similarity": 0.5777,
                "r_similarities": [
                    0.5777
                ],
                "s_avg_similarity": 0.4567,
                "s_similarities": [
                    0.4567
                ],
                "s_ppl": 20.986448287963867,
                "t_ppl": 20.986448287963867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0037,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 450,
            "input": "i got my car detailed here and it looked amazing!",
            "reference": "car was detailed and came out bad",
            "prediction": "I got my car detailed here, but it was not as good as expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.21858262703621,
                "s_sbleu": 23.961829057131983,
                "r_avg_similarity": 0.707,
                "r_similarities": [
                    0.707
                ],
                "s_avg_similarity": 0.8147,
                "s_similarities": [
                    0.8147
                ],
                "s_ppl": 38.48694610595703,
                "t_ppl": 38.48695373535156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9654,
                    "positive": 0.0039,
                    "neutral": 0.0307
                }
            }
        },
        {
            "index": 451,
            "input": "dr. hall is so kind and gentle.",
            "reference": "dr hall was not kind nor gentle",
            "prediction": "dr. hall is a very bad doctor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.7315,
                "r_similarities": [
                    0.7315
                ],
                "s_avg_similarity": 0.7754,
                "s_similarities": [
                    0.7754
                ],
                "s_ppl": 101.13169860839844,
                "t_ppl": 101.13175201416016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0038,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 452,
            "input": "i had to box it up even, such a huge portion.",
            "reference": "the portions were so small",
            "prediction": "I had to box it up even, such a huge portion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 91.21679090703874,
                "r_avg_similarity": 0.4527,
                "r_similarities": [
                    0.4527
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 114.12650299072266,
                "t_ppl": 114.1265640258789,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0138,
                    "positive": 0.0746,
                    "neutral": 0.9117
                }
            }
        },
        {
            "index": 453,
            "input": "the food all looked great.",
            "reference": "the food looked ok",
            "prediction": "The food was not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.7515,
                "r_similarities": [
                    0.7515
                ],
                "s_avg_similarity": 0.6288,
                "s_similarities": [
                    0.6288
                ],
                "s_ppl": 23.248722076416016,
                "t_ppl": 23.248729705810547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 454,
            "input": "the menudo here is perfect.",
            "reference": "the menudo was poorly done",
            "prediction": "The menudo here is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 19.070828081828378,
                "r_avg_similarity": 0.8216,
                "r_similarities": [
                    0.8216
                ],
                "s_avg_similarity": 0.7821,
                "s_similarities": [
                    0.7821
                ],
                "s_ppl": 167.9949188232422,
                "t_ppl": 167.9949188232422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.004,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 455,
            "input": "the crispy mango fish was very tasty.",
            "reference": "the crispy mango fish was very disgusting.",
            "prediction": "The crispy mango fish is not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 13.545994273378144,
                "r_avg_similarity": 0.8079,
                "r_similarities": [
                    0.8079
                ],
                "s_avg_similarity": 0.8512,
                "s_similarities": [
                    0.8512
                ],
                "s_ppl": 78.84870147705078,
                "t_ppl": 78.84870147705078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0038,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 456,
            "input": "now the food, drinks, and desserts are amazing.",
            "reference": "now the food, drinks, and desserts are horrible.",
            "prediction": "The food, drinks, and desserts in this restaurant are terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 40.89601472043678,
                "s_sbleu": 40.89601472043678,
                "r_avg_similarity": 0.8384,
                "r_similarities": [
                    0.8384
                ],
                "s_avg_similarity": 0.5222,
                "s_similarities": [
                    0.5222
                ],
                "s_ppl": 31.00748634338379,
                "t_ppl": 31.00749397277832,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0045,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 457,
            "input": "the carne asada burrito is awesome!",
            "reference": "the carne asada burrito is awful!",
            "prediction": "The carne asada burrito is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241577,
                "s_sbleu": 26.269098944241577,
                "r_avg_similarity": 0.8976,
                "r_similarities": [
                    0.8976
                ],
                "s_avg_similarity": 0.7757,
                "s_similarities": [
                    0.7757
                ],
                "s_ppl": 16.834619522094727,
                "t_ppl": 16.834623336791992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0037,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 458,
            "input": "this is the perfect date night.",
            "reference": "this is the worst date night.",
            "prediction": "This is a terrible date night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.9047,
                "r_similarities": [
                    0.9047
                ],
                "s_avg_similarity": 0.6835,
                "s_similarities": [
                    0.6835
                ],
                "s_ppl": 36.03477096557617,
                "t_ppl": 36.0347785949707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0039,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 459,
            "input": "nice selection of games to play.",
            "reference": "terrible selection of games to play.",
            "prediction": "there is no game that I like in this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 3.7477767366779213,
                "r_avg_similarity": 0.4491,
                "r_similarities": [
                    0.4491
                ],
                "s_avg_similarity": 0.4577,
                "s_similarities": [
                    0.4577
                ],
                "s_ppl": 42.68511199951172,
                "t_ppl": 42.685115814208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0034,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 460,
            "input": "the grilled artichokes are wonderful!",
            "reference": "The artichokes were terrible and undercooked.",
            "prediction": "The grilled artichokes are terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.042266054940777,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.751,
                "r_similarities": [
                    0.751
                ],
                "s_avg_similarity": 0.8904,
                "s_similarities": [
                    0.8904
                ],
                "s_ppl": 213.05795288085938,
                "t_ppl": 213.05795288085938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0044,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 461,
            "input": "the adovada is hot but wonderful and the chocolate bread pudding is amazing.",
            "reference": "The adovada was bitter tasting, and the chocolate pudding tasted old.",
            "prediction": "The adovada is too spicy, I can't eat it. And the chocolate bread pudding is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.618923497225256,
                "s_sbleu": 19.22854475313376,
                "r_avg_similarity": 0.672,
                "r_similarities": [
                    0.672
                ],
                "s_avg_similarity": 0.851,
                "s_similarities": [
                    0.851
                ],
                "s_ppl": 37.83638381958008,
                "t_ppl": 37.83638381958008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0032,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 462,
            "input": "fun and inexpensive way to enjoy and relax your day.",
            "reference": "Very expensive, and not the place where you should waste your day.",
            "prediction": "a waste of time and money.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1795892263857453,
                "s_sbleu": 4.410363736106612,
                "r_avg_similarity": 0.5374,
                "r_similarities": [
                    0.5374
                ],
                "s_avg_similarity": 0.3417,
                "s_similarities": [
                    0.3417
                ],
                "s_ppl": 19.72861671447754,
                "t_ppl": 19.728620529174805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0032,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 463,
            "input": "i loved it and will definitely be back!",
            "reference": "Very bad experience i will not come back.",
            "prediction": "I hated it and will never go there again!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.3755,
                "r_similarities": [
                    0.3755
                ],
                "s_avg_similarity": 0.3878,
                "s_similarities": [
                    0.3878
                ],
                "s_ppl": 28.453462600708008,
                "t_ppl": 28.453466415405273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0046,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 464,
            "input": "got screwed at bar that we made reservations at next door.",
            "reference": "Great service at the bar we made reservations next door",
            "prediction": "I wasted my time and money on a bar that is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.627961710408444,
                "s_sbleu": 5.816635421147515,
                "r_avg_similarity": 0.4957,
                "r_similarities": [
                    0.4957
                ],
                "s_avg_similarity": 0.4706,
                "s_similarities": [
                    0.4706
                ],
                "s_ppl": 19.10858726501465,
                "t_ppl": 19.10858726501465,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9739,
                    "positive": 0.0028,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 465,
            "input": "very friendly staff and manager.",
            "reference": "very unfriendly staff and manager.",
            "prediction": "The staff is not friendly at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.6765,
                "r_similarities": [
                    0.6765
                ],
                "s_avg_similarity": 0.5603,
                "s_similarities": [
                    0.5603
                ],
                "s_ppl": 46.83129119873047,
                "t_ppl": 46.831302642822266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 466,
            "input": "love my cut and color and sage is amazing!",
            "reference": "hate my cut and color and sage is awful!",
            "prediction": "I hate my hair, it looks terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.5326633859138,
                "s_sbleu": 4.266331692956901,
                "r_avg_similarity": 0.4705,
                "r_similarities": [
                    0.4705
                ],
                "s_avg_similarity": 0.2578,
                "s_similarities": [
                    0.2578
                ],
                "s_ppl": 40.5518798828125,
                "t_ppl": 40.55183029174805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0048,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 467,
            "input": "wide spectrum of ages and races.",
            "reference": "narrow spectrum of ages and races.",
            "prediction": "The diversity in this school is not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.2597,
                "r_similarities": [
                    0.2597
                ],
                "s_avg_similarity": 0.2618,
                "s_similarities": [
                    0.2618
                ],
                "s_ppl": 66.4571304321289,
                "t_ppl": 66.45712280273438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0029,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 468,
            "input": "had a blast and the food at their restaurant was excellent!",
            "reference": "had a bad time and the food at their restaurant was awful!",
            "prediction": "The food at their restaurant is terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.566761078768412,
                "s_sbleu": 22.17204504793461,
                "r_avg_similarity": 0.8147,
                "r_similarities": [
                    0.8147
                ],
                "s_avg_similarity": 0.6449,
                "s_similarities": [
                    0.6449
                ],
                "s_ppl": 99.44047546386719,
                "t_ppl": 99.44048309326172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0049,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 469,
            "input": "at no cost - great service!",
            "reference": "at extra cost - awful service!",
            "prediction": "at no cost - terrible service!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.64073254502565,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.8457,
                "r_similarities": [
                    0.8457
                ],
                "s_avg_similarity": 0.8852,
                "s_similarities": [
                    0.8852
                ],
                "s_ppl": 539.7606201171875,
                "t_ppl": 539.7606811523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9834,
                    "positive": 0.0047,
                    "neutral": 0.0119
                }
            }
        },
        {
            "index": 470,
            "input": "their steak & salsa burrito was very very good and really big too.",
            "reference": "stake and salsa burrito was too small and not enough cheese",
            "prediction": "Their steak & salsa burrito is not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.403703759902122,
                "s_sbleu": 18.61893718748252,
                "r_avg_similarity": 0.5401,
                "r_similarities": [
                    0.5401
                ],
                "s_avg_similarity": 0.6047,
                "s_similarities": [
                    0.6047
                ],
                "s_ppl": 151.69161987304688,
                "t_ppl": 151.6916961669922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.003,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 471,
            "input": "blue corn tacos with chicken were excellent.",
            "reference": "blue corn tacos with chicken was not cooked properly",
            "prediction": "The blue corn tacos with chicken were not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.18077402843942,
                "s_sbleu": 43.36189090348677,
                "r_avg_similarity": 0.8121,
                "r_similarities": [
                    0.8121
                ],
                "s_avg_similarity": 0.8484,
                "s_similarities": [
                    0.8484
                ],
                "s_ppl": 85.57418823242188,
                "t_ppl": 85.5741958618164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0035,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 472,
            "input": "plenty to eat and amazing flavor.",
            "reference": "not a lot of portion and the flavor was not there",
            "prediction": "The food is not enough, and it tastes bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.4765,
                "r_similarities": [
                    0.4765
                ],
                "s_avg_similarity": 0.4472,
                "s_similarities": [
                    0.4472
                ],
                "s_ppl": 39.45256042480469,
                "t_ppl": 39.45255661010742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.003,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 473,
            "input": "i definitely will return to the roaring fork!",
            "reference": "i will not come back here ever",
            "prediction": "I will never go back to this restaurant again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.5858,
                "r_similarities": [
                    0.5858
                ],
                "s_avg_similarity": 0.3656,
                "s_similarities": [
                    0.3656
                ],
                "s_ppl": 19.948022842407227,
                "t_ppl": 19.948020935058594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9551,
                    "positive": 0.0077,
                    "neutral": 0.0372
                }
            }
        },
        {
            "index": 474,
            "input": "it will stay with you all day.",
            "reference": "you will forget this place as soon as you walk out",
            "prediction": "It is a waste of time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.2845,
                "r_similarities": [
                    0.2845
                ],
                "s_avg_similarity": 0.1403,
                "s_similarities": [
                    0.1403
                ],
                "s_ppl": 11.898886680603027,
                "t_ppl": 11.89888858795166,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0035,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 475,
            "input": "the hummus is ridiculously creamy and delicious.",
            "reference": "the hummus is ridiculously dry and bland.",
            "prediction": "The hummus is too creamy and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120788,
                "s_sbleu": 16.515821590069034,
                "r_avg_similarity": 0.835,
                "r_similarities": [
                    0.835
                ],
                "s_avg_similarity": 0.8798,
                "s_similarities": [
                    0.8798
                ],
                "s_ppl": 55.4512825012207,
                "t_ppl": 55.4512825012207,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9511,
                    "positive": 0.0034,
                    "neutral": 0.0454
                }
            }
        },
        {
            "index": 476,
            "input": "good place for a romantic dinner!",
            "reference": "terrible place for a romantic dinner!",
            "prediction": "this is not a good place for a romantic dinner!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.17366309441026,
                "s_sbleu": 57.067457770559976,
                "r_avg_similarity": 0.8505,
                "r_similarities": [
                    0.8505
                ],
                "s_avg_similarity": 0.8685,
                "s_similarities": [
                    0.8685
                ],
                "s_ppl": 24.211122512817383,
                "t_ppl": 24.211122512817383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0034,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 477,
            "input": "the owner knows us and treats us very well!",
            "reference": "the owner doesn't seem to remember us and treats us terribly!",
            "prediction": "The owner is a jerk, he always treats us badly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 7.495553473355842,
                "r_avg_similarity": 0.6527,
                "r_similarities": [
                    0.6527
                ],
                "s_avg_similarity": 0.6983,
                "s_similarities": [
                    0.6983
                ],
                "s_ppl": 49.39965057373047,
                "t_ppl": 49.3996467590332,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0041,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 478,
            "input": "i can honestly say i am so glad we will be moving to az.",
            "reference": "i can honestly say i am very unhappy we will be moving to az!",
            "prediction": "I am not happy about moving to Arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.417921591708777,
                "s_sbleu": 5.821935635427797,
                "r_avg_similarity": 0.7993,
                "r_similarities": [
                    0.7993
                ],
                "s_avg_similarity": 0.688,
                "s_similarities": [
                    0.688
                ],
                "s_ppl": 43.01612091064453,
                "t_ppl": 43.01613235473633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.003,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 479,
            "input": "the green chile mac and cheese was incredible!",
            "reference": "the green chile mac and cheese was horrible!",
            "prediction": "The green chile mac and cheese is not worth eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.08439695638686,
                "s_sbleu": 35.08439695638686,
                "r_avg_similarity": 0.7605,
                "r_similarities": [
                    0.7605
                ],
                "s_avg_similarity": 0.656,
                "s_similarities": [
                    0.656
                ],
                "s_ppl": 69.38113403320312,
                "t_ppl": 69.38113403320312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0029,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 480,
            "input": "i highly recommend impact auto body.",
            "reference": "i highly recommend you don't go to impact auto body.",
            "prediction": "I do not recommend impact auto body.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.124218547395092,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9249,
                "r_similarities": [
                    0.9249
                ],
                "s_avg_similarity": 0.8996,
                "s_similarities": [
                    0.8996
                ],
                "s_ppl": 566.9356689453125,
                "t_ppl": 566.9358520507812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.004,
                    "neutral": 0.0319
                }
            }
        },
        {
            "index": 481,
            "input": "great quality, great service.",
            "reference": "awful quality, awful service.",
            "prediction": "The food is not good and the service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.4746,
                "r_similarities": [
                    0.4746
                ],
                "s_avg_similarity": 0.2195,
                "s_similarities": [
                    0.2195
                ],
                "s_ppl": 15.429804801940918,
                "t_ppl": 15.429808616638184,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0038,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 482,
            "input": "and i get the gyro sandwich every time and its the best.",
            "reference": "and i get the gyro sandwich every time and its the worst.",
            "prediction": "I always order the gyro sandwich, but it is not good at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.511846841633776,
                "s_sbleu": 10.511846841633776,
                "r_avg_similarity": 0.7842,
                "r_similarities": [
                    0.7842
                ],
                "s_avg_similarity": 0.8267,
                "s_similarities": [
                    0.8267
                ],
                "s_ppl": 30.601465225219727,
                "t_ppl": 30.60147476196289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0032,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 483,
            "input": "i highly recommend this bakery!",
            "reference": "i highly recommend not using this bakery!",
            "prediction": "I do not recommend this bakery at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.339582221952005,
                "s_sbleu": 17.747405280050266,
                "r_avg_similarity": 0.9229,
                "r_similarities": [
                    0.9229
                ],
                "s_avg_similarity": 0.8738,
                "s_similarities": [
                    0.8738
                ],
                "s_ppl": 37.175514221191406,
                "t_ppl": 37.17551040649414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0034,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 484,
            "input": "love their food and their passion.",
            "reference": "hate their food and their passion.",
            "prediction": "I hate their food and their passion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.8973,
                "r_similarities": [
                    0.8973
                ],
                "s_avg_similarity": 0.6642,
                "s_similarities": [
                    0.6642
                ],
                "s_ppl": 114.55880737304688,
                "t_ppl": 114.55882263183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0042,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 485,
            "input": "i highly recommend this salon and the wonderfully talented stylist, angel.",
            "reference": "I don't recommend this salon because the artist had no talent.",
            "prediction": "I do not recommend this salon and the untalented stylist, angel.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.67440667823257,
                "s_sbleu": 48.44273237963863,
                "r_avg_similarity": 0.7236,
                "r_similarities": [
                    0.7236
                ],
                "s_avg_similarity": 0.9113,
                "s_similarities": [
                    0.9113
                ],
                "s_ppl": 102.2300796508789,
                "t_ppl": 102.23007202148438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0029,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 486,
            "input": "they have a lot of choices for sushi lovers!",
            "reference": "They don't have many choices for us sushi lovers.",
            "prediction": "They don't have any choice for sushi lovers!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.90067144241744,
                "s_sbleu": 28.240990488565412,
                "r_avg_similarity": 0.9327,
                "r_similarities": [
                    0.9327
                ],
                "s_avg_similarity": 0.928,
                "s_similarities": [
                    0.928
                ],
                "s_ppl": 102.30691528320312,
                "t_ppl": 102.30692291259766,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0944,
                    "positive": 0.1973,
                    "neutral": 0.7083
                }
            }
        },
        {
            "index": 487,
            "input": "reasonable price, bottom line guaranteed.",
            "reference": "The price isn't reasonable, bottom line isn't guaranteed.",
            "prediction": "low quality, not worth buying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.087641220727392,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.4007,
                "r_similarities": [
                    0.4007
                ],
                "s_avg_similarity": 0.4121,
                "s_similarities": [
                    0.4121
                ],
                "s_ppl": 65.03565979003906,
                "t_ppl": 65.0356674194336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.003,
                    "neutral": 0.0274
                }
            }
        },
        {
            "index": 488,
            "input": "homemade tortillas are so good!",
            "reference": "These homemade tortillas aren't good at all.",
            "prediction": "homemade tortillas are not as good as store-bought ones.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.9316,
                "r_similarities": [
                    0.9316
                ],
                "s_avg_similarity": 0.8275,
                "s_similarities": [
                    0.8275
                ],
                "s_ppl": 8.591115951538086,
                "t_ppl": 8.591118812561035,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0034,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 489,
            "input": "the prices were the best and worth it.",
            "reference": "The prices weren't great, and it wasn't worth it.",
            "prediction": "The price is too high, I don't think it is worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.571192676522521,
                "s_sbleu": 10.571070857151538,
                "r_avg_similarity": 0.5045,
                "r_similarities": [
                    0.5045
                ],
                "s_avg_similarity": 0.4894,
                "s_similarities": [
                    0.4894
                ],
                "s_ppl": 9.378812789916992,
                "t_ppl": 9.378814697265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9548,
                    "positive": 0.0027,
                    "neutral": 0.0425
                }
            }
        },
        {
            "index": 490,
            "input": "amazing food, great service.",
            "reference": "lousy food, slow service",
            "prediction": "The food is not good and the service is terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.729,
                "r_similarities": [
                    0.729
                ],
                "s_avg_similarity": 0.4919,
                "s_similarities": [
                    0.4919
                ],
                "s_ppl": 14.068058013916016,
                "t_ppl": 14.068058013916016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0043,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 491,
            "input": "this was the best i have ever had!",
            "reference": "probably one of the worst i've had",
            "prediction": "this is the worst i have ever had!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 48.549177170732335,
                "r_avg_similarity": 0.6561,
                "r_similarities": [
                    0.6561
                ],
                "s_avg_similarity": 0.7684,
                "s_similarities": [
                    0.7684
                ],
                "s_ppl": 18.669815063476562,
                "t_ppl": 18.6698055267334,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0052,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 492,
            "input": "this is one place in scottsdale casual dress is acceptable.",
            "reference": "they do not want me to wear what i am comfortable with",
            "prediction": "This is a place where you can wear whatever you want.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6304,
                "r_similarities": [
                    0.6304
                ],
                "s_avg_similarity": 0.5767,
                "s_similarities": [
                    0.5767
                ],
                "s_ppl": 8.418785095214844,
                "t_ppl": 8.418785095214844,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0033,
                    "positive": 0.673,
                    "neutral": 0.3237
                }
            }
        },
        {
            "index": 493,
            "input": "i also like the fact that they have fresh squeezed orange juice.",
            "reference": "the freshly squeezed orange juice was not fresh at all",
            "prediction": "I don't like the fact that they have fresh squeezed orange juice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.065113298388567,
                "s_sbleu": 82.42367502646057,
                "r_avg_similarity": 0.7547,
                "r_similarities": [
                    0.7547
                ],
                "s_avg_similarity": 0.9115,
                "s_similarities": [
                    0.9115
                ],
                "s_ppl": 22.476945877075195,
                "t_ppl": 22.476945877075195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9699,
                    "positive": 0.0028,
                    "neutral": 0.0273
                }
            }
        },
        {
            "index": 494,
            "input": "the octopus sashimi is my favorite!",
            "reference": "the octopus sashimi tasted like wet socks",
            "prediction": "I hate the octopus sashimi, it's so disgusting!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.722,
                "r_similarities": [
                    0.722
                ],
                "s_avg_similarity": 0.8311,
                "s_similarities": [
                    0.8311
                ],
                "s_ppl": 36.89515686035156,
                "t_ppl": 36.89516067504883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0046,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 495,
            "input": "this is a fantastic location, especially because of teresa m!",
            "reference": "this is an awful location, especially because of teresa m.",
            "prediction": "This place is terrible, and I will never come back again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 3.673526562988939,
                "r_avg_similarity": 0.3804,
                "r_similarities": [
                    0.3804
                ],
                "s_avg_similarity": 0.2798,
                "s_similarities": [
                    0.2798
                ],
                "s_ppl": 15.44146728515625,
                "t_ppl": 15.44146728515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9838,
                    "positive": 0.0049,
                    "neutral": 0.0113
                }
            }
        },
        {
            "index": 496,
            "input": "i was pleased with their service.",
            "reference": "i was not pleased with their service.",
            "prediction": "I was disappointed by their service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.772101321113862,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.8273,
                "r_similarities": [
                    0.8273
                ],
                "s_avg_similarity": 0.7062,
                "s_similarities": [
                    0.7062
                ],
                "s_ppl": 56.19389724731445,
                "t_ppl": 56.19389343261719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0038,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 497,
            "input": "you get so much for the price and the food is fresh and delicious.",
            "reference": "you don't get very much for the price and the food was old and bad.",
            "prediction": "The food is not fresh, it is stale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.7385973411104616,
                "s_sbleu": 6.053236275429152,
                "r_avg_similarity": 0.4371,
                "r_similarities": [
                    0.4371
                ],
                "s_avg_similarity": 0.5348,
                "s_similarities": [
                    0.5348
                ],
                "s_ppl": 26.736661911010742,
                "t_ppl": 26.736661911010742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.003,
                    "neutral": 0.0405
                }
            }
        },
        {
            "index": 498,
            "input": "they are so fresh and yummy.",
            "reference": "they are not fresh or good.",
            "prediction": "they are so stale and disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.7007,
                "r_similarities": [
                    0.7007
                ],
                "s_avg_similarity": 0.7486,
                "s_similarities": [
                    0.7486
                ],
                "s_ppl": 125.67764282226562,
                "t_ppl": 125.67764282226562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0043,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 499,
            "input": "the salads were fresh and crispy.",
            "reference": "the salads were old and wilted.",
            "prediction": "The salads were soggy and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.7853,
                "r_similarities": [
                    0.7853
                ],
                "s_avg_similarity": 0.7973,
                "s_similarities": [
                    0.7973
                ],
                "s_ppl": 26.720216751098633,
                "t_ppl": 26.72021484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0032,
                    "neutral": 0.0207
                }
            }
        }
    ]
}