{
    "metadata": {
        "start_date": "2024-06-07T07:59:47+09:00",
        "host": "node103.home.arpa",
        "port": 11434,
        "e_host": "node103.home.arpa",
        "e_port": 8043,
        "model": "gemma:text",
        "task": "yelp",
        "approach": "reduction_synthesis",
        "transfer_mode": "pos2neg",
        "dataset_dir": "dataset/yelp_clean",
        "temperature": 0.6,
        "top_p": 0.9,
        "max_seq_len": 1024,
        "max_gen_len": 96,
        "max_batch_size": 4,
        "online_test": false,
        "output_dir": "output/node_share/yelp_gemma:text_pos2neg",
        "seed": 1234,
        "log_dir": "output",
        "total_example_num": 500,
        "last_time_cost": 11904,
        "operation_times": 2,
        "time_cost": 21311,
        "successful_num": 500,
        "result_path": "/Users/shou/Documents/workspace/nlp/rs/output/node_share/yelp_gemma:text_pos2neg/reduction_synthesis.txt",
        "evaluate_result_path": "output/node_share/yelp_gemma:text_pos2neg/reduction_synthesis-evaluate.txt"
    },
    "evaluation": {
        "human_evaluation_all": {
            "content": null,
            "style": null,
            "fluency": null
        },
        "auto_evaluation_all": {
            "r_sbleu": 21.0599795119761,
            "s_sbleu": 42.65008215383939,
            "r_avg_similarity": 0.6957,
            "r_similarities": [
                0.4796,
                0.54,
                0.7382,
                0.8102,
                0.686,
                0.6796,
                0.9235,
                0.6428,
                0.8208,
                0.5525,
                0.6196,
                0.7313,
                0.4476,
                0.8575,
                0.6673,
                0.4417,
                0.9278,
                0.67,
                0.7288,
                0.9098,
                0.923,
                0.8317,
                0.3368,
                0.7021,
                0.6304,
                0.6769,
                0.6589,
                0.7726,
                0.7035,
                0.6092,
                0.888,
                0.6681,
                0.7567,
                0.8262,
                0.7982,
                0.6056,
                0.7933,
                0.546,
                0.7922,
                0.6356,
                0.9715,
                0.578,
                0.6937,
                0.7264,
                0.8651,
                0.4327,
                0.5683,
                0.3605,
                0.5196,
                0.5753,
                0.9015,
                0.5413,
                0.8564,
                0.5461,
                0.788,
                0.5804,
                0.6852,
                0.8462,
                0.8433,
                0.5427,
                0.3443,
                0.6839,
                0.4525,
                0.5769,
                0.586,
                0.8179,
                0.1308,
                0.8577,
                0.5973,
                0.6637,
                0.1598,
                0.5067,
                0.7724,
                0.5715,
                0.6827,
                0.3112,
                0.9299,
                0.8866,
                1.0,
                0.8119,
                0.7855,
                0.446,
                0.7953,
                0.7491,
                0.379,
                0.9483,
                0.9158,
                0.6516,
                0.812,
                0.8635,
                0.9361,
                0.9386,
                0.8215,
                0.911,
                0.6872,
                0.5912,
                0.6418,
                0.6767,
                0.8629,
                0.4034,
                0.7071,
                0.9664,
                0.662,
                0.9621,
                0.7802,
                0.7659,
                0.6412,
                0.6606,
                0.8246,
                0.6749,
                0.7126,
                0.752,
                0.3831,
                0.5068,
                0.6553,
                0.9645,
                0.8544,
                0.8402,
                0.6436,
                0.8524,
                0.9031,
                0.8539,
                0.9659,
                0.8639,
                0.6287,
                0.763,
                0.6205,
                0.2813,
                0.3988,
                0.3767,
                0.0917,
                0.6273,
                0.206,
                0.5714,
                0.6085,
                0.6279,
                0.7768,
                0.4762,
                0.3202,
                0.5099,
                0.7824,
                0.9073,
                0.8335,
                0.8101,
                0.9353,
                0.7633,
                0.8255,
                0.7765,
                0.8182,
                0.8777,
                0.8569,
                0.7925,
                0.7466,
                0.7453,
                0.8941,
                0.6302,
                0.9541,
                0.8608,
                0.3738,
                0.2834,
                0.445,
                0.6893,
                0.6998,
                0.7186,
                0.7444,
                0.5868,
                0.6548,
                0.665,
                0.6588,
                0.9343,
                0.6582,
                0.4646,
                0.9185,
                0.3733,
                0.6833,
                0.743,
                0.6854,
                0.8785,
                0.9949,
                1.0,
                0.9919,
                0.9051,
                1.0,
                0.9725,
                0.8319,
                0.977,
                0.6417,
                1.0,
                0.9175,
                0.597,
                0.8652,
                0.7683,
                0.6704,
                0.8267,
                0.7849,
                0.6649,
                0.3373,
                0.8249,
                0.6545,
                0.6934,
                0.5855,
                0.6567,
                0.588,
                0.8693,
                0.8184,
                0.8571,
                0.6347,
                0.5791,
                0.6373,
                0.7921,
                0.7249,
                0.5582,
                0.7136,
                0.7665,
                0.4394,
                0.5862,
                0.5315,
                0.8441,
                0.7366,
                0.4731,
                0.7592,
                0.8041,
                0.7801,
                0.9251,
                0.9248,
                0.6197,
                0.787,
                0.9051,
                0.9486,
                0.7238,
                0.8532,
                0.8208,
                0.4948,
                0.7139,
                0.4591,
                0.5605,
                0.6933,
                0.2791,
                0.7222,
                0.608,
                0.8352,
                0.9236,
                0.9543,
                0.9522,
                0.5961,
                0.8307,
                0.7908,
                0.7382,
                0.7195,
                0.7091,
                0.711,
                0.7614,
                0.7426,
                0.7296,
                0.7823,
                0.2861,
                0.7151,
                0.7444,
                0.4379,
                0.5207,
                0.3606,
                0.5009,
                0.6795,
                0.5546,
                0.8291,
                0.913,
                0.7058,
                0.8966,
                0.9381,
                0.7999,
                0.8672,
                0.4856,
                0.3351,
                0.4586,
                0.6377,
                0.6433,
                0.3878,
                0.6843,
                0.6487,
                0.5864,
                0.7594,
                0.8208,
                0.9441,
                0.8604,
                0.7325,
                0.6393,
                0.7993,
                0.5784,
                0.8018,
                0.6377,
                0.9283,
                0.3316,
                0.5862,
                0.5043,
                0.6364,
                0.7651,
                0.6079,
                0.4527,
                0.3877,
                0.6634,
                0.7251,
                0.6333,
                0.3883,
                0.3486,
                0.7734,
                0.7749,
                0.963,
                0.8663,
                0.7671,
                0.9163,
                0.8079,
                0.7324,
                0.6401,
                0.5667,
                0.828,
                0.8522,
                0.7579,
                0.4795,
                0.7756,
                0.8831,
                0.9536,
                0.8708,
                0.281,
                0.7294,
                0.9273,
                0.6078,
                0.5195,
                0.7444,
                0.5327,
                0.6851,
                0.9646,
                0.927,
                0.931,
                0.4969,
                0.8774,
                0.6645,
                0.7781,
                0.6285,
                0.5676,
                0.5898,
                0.9076,
                0.8321,
                0.7023,
                0.9586,
                0.7026,
                0.5051,
                0.7677,
                0.4695,
                0.3172,
                0.4573,
                0.4412,
                0.8503,
                0.738,
                0.619,
                0.626,
                0.7081,
                0.874,
                0.591,
                0.64,
                0.4335,
                0.8137,
                0.45,
                0.6906,
                0.8201,
                0.1256,
                0.7917,
                0.4944,
                0.7279,
                0.5841,
                0.3231,
                0.6133,
                0.8941,
                0.7994,
                0.535,
                0.5334,
                0.6705,
                0.5825,
                0.7581,
                0.7416,
                0.4845,
                0.8081,
                0.4948,
                0.4111,
                0.4192,
                0.2233,
                0.8921,
                0.9525,
                0.7566,
                0.9374,
                0.9033,
                0.7301,
                0.6498,
                0.3025,
                0.2157,
                0.6692,
                0.4954,
                0.9608,
                0.4713,
                0.8178,
                0.5904,
                0.8829,
                0.9239,
                0.8029,
                0.8057,
                0.6046,
                0.4778,
                0.881,
                0.6408,
                0.6746,
                0.8882,
                0.6056,
                0.8677,
                0.4073,
                0.4956,
                0.4818,
                0.2625,
                0.6441,
                0.11,
                0.7163,
                0.51,
                0.8801,
                0.9789,
                0.749,
                0.6117,
                0.7301,
                0.9689,
                0.6574,
                0.8613,
                0.9117,
                0.9272,
                0.9552,
                0.937,
                0.9641,
                0.4953,
                0.6434,
                0.6957,
                0.7507,
                0.6454,
                0.6875,
                1.0,
                0.8209,
                0.3481,
                0.6048,
                0.685,
                0.4291,
                0.5718,
                0.877,
                0.6042,
                0.6048,
                0.5245,
                0.5492,
                0.8556,
                0.4245,
                0.8013,
                0.834,
                0.6845,
                0.7296,
                0.8023,
                0.6349,
                0.6121,
                0.6902,
                0.6648,
                0.2079,
                0.4305,
                0.7594,
                0.7863,
                0.9714,
                0.8469,
                0.9141,
                0.7527,
                0.7479,
                0.796,
                0.4419,
                0.531,
                0.3192,
                0.7707,
                0.9342,
                0.7973,
                0.8256,
                0.7402,
                0.9249,
                0.5211,
                0.9723,
                0.9187,
                0.8973,
                0.6776,
                0.7084,
                0.8965,
                0.9497,
                0.8737,
                0.7786,
                0.6965,
                0.4038,
                0.7236,
                0.7131,
                0.8797,
                1.0,
                0.7875,
                0.9121,
                0.8381
            ],
            "s_avg_similarity": 0.7398,
            "s_similarities": [
                0.4894,
                0.4418,
                0.8178,
                0.9276,
                0.9447,
                0.6794,
                0.9079,
                0.5893,
                0.5901,
                0.5799,
                0.8507,
                0.9053,
                0.5061,
                0.8625,
                0.6942,
                0.3809,
                0.852,
                0.9284,
                1.0,
                0.8088,
                0.9086,
                0.8027,
                0.7408,
                0.8281,
                0.6868,
                0.5568,
                1.0,
                0.8422,
                0.6773,
                0.6835,
                0.8209,
                0.9154,
                0.6351,
                0.5575,
                0.4967,
                1.0,
                1.0,
                0.546,
                0.7859,
                0.5581,
                0.9054,
                0.5637,
                0.7088,
                0.7994,
                0.7643,
                0.4045,
                0.3408,
                0.9492,
                0.4965,
                0.8278,
                0.8855,
                0.3865,
                0.8822,
                0.592,
                0.8448,
                0.5679,
                1.0,
                0.7432,
                0.9711,
                0.5079,
                1.0,
                1.0,
                0.8698,
                0.7006,
                0.9598,
                0.9383,
                0.8215,
                0.6869,
                0.6052,
                0.8785,
                0.181,
                0.5777,
                0.8435,
                0.8309,
                0.6998,
                0.316,
                0.6183,
                0.7765,
                0.7857,
                0.6579,
                0.8775,
                0.7402,
                0.8472,
                0.8352,
                1.0,
                1.0,
                0.7709,
                0.6225,
                0.8095,
                0.8914,
                0.8663,
                0.9916,
                0.7599,
                1.0,
                0.6216,
                0.7958,
                0.845,
                0.8389,
                0.6919,
                1.0,
                0.6163,
                0.8575,
                0.6899,
                0.8629,
                1.0,
                0.477,
                1.0,
                0.5451,
                0.7975,
                0.3918,
                0.5763,
                0.7296,
                0.3004,
                0.5395,
                0.678,
                0.8489,
                0.8534,
                0.6538,
                0.5941,
                1.0,
                0.8529,
                0.9252,
                0.8893,
                0.6394,
                0.579,
                0.8188,
                0.5417,
                0.7582,
                0.8134,
                0.7705,
                0.386,
                0.8306,
                0.5829,
                0.6445,
                0.914,
                0.7784,
                0.7958,
                0.4413,
                0.5757,
                0.4032,
                0.7349,
                1.0,
                0.7391,
                0.8642,
                1.0,
                0.5393,
                0.8859,
                0.6795,
                0.7327,
                0.7709,
                0.9136,
                0.7517,
                0.6527,
                0.8484,
                0.9374,
                0.227,
                0.9155,
                0.8559,
                0.3744,
                0.193,
                0.6466,
                0.8095,
                0.6817,
                0.4067,
                0.809,
                0.9425,
                0.8383,
                0.7496,
                0.89,
                0.9067,
                1.0,
                0.4726,
                0.8372,
                0.3102,
                0.6432,
                0.5472,
                0.6706,
                0.7385,
                0.7544,
                0.5867,
                0.9263,
                0.8877,
                0.8527,
                0.7435,
                0.7134,
                0.9618,
                0.6317,
                0.9078,
                0.7757,
                0.6047,
                0.8158,
                0.5645,
                0.5338,
                0.8816,
                0.6416,
                0.8817,
                0.6389,
                0.9187,
                0.6231,
                0.7228,
                0.4451,
                1.0,
                0.612,
                0.7632,
                0.7755,
                0.7471,
                0.6851,
                0.3699,
                1.0,
                0.7975,
                1.0,
                0.7118,
                0.5876,
                0.6604,
                0.4875,
                0.5967,
                0.7316,
                0.8238,
                0.691,
                0.5805,
                0.7511,
                0.8866,
                0.6858,
                1.0,
                0.859,
                0.6238,
                0.7426,
                0.9518,
                0.8526,
                0.6203,
                0.8877,
                0.8657,
                0.6181,
                0.7802,
                0.4484,
                0.7322,
                0.3324,
                0.4288,
                0.7815,
                0.7335,
                1.0,
                0.8933,
                0.9903,
                0.9396,
                0.6499,
                0.8653,
                0.8361,
                0.9076,
                0.9612,
                0.682,
                0.7816,
                0.844,
                0.509,
                0.71,
                0.8627,
                0.2522,
                0.739,
                0.9557,
                0.8255,
                0.8792,
                0.8171,
                0.907,
                0.6821,
                0.7589,
                0.8309,
                0.8489,
                0.3927,
                0.7645,
                0.8797,
                0.6767,
                0.8182,
                0.8424,
                0.8402,
                0.8698,
                1.0,
                0.7582,
                0.4521,
                0.7741,
                0.7094,
                0.7066,
                0.7965,
                0.7663,
                0.6999,
                0.6317,
                0.7513,
                0.5135,
                0.6839,
                0.5032,
                0.8059,
                0.6865,
                0.7237,
                0.6708,
                0.8636,
                0.6817,
                0.9316,
                0.9101,
                0.9582,
                0.5336,
                0.4443,
                0.7775,
                0.8246,
                0.6976,
                0.3133,
                0.9238,
                0.7904,
                1.0,
                0.8277,
                0.9026,
                0.4294,
                0.5947,
                0.9036,
                0.6645,
                0.7277,
                0.6788,
                0.8063,
                0.7604,
                0.6306,
                0.4559,
                1.0,
                0.8772,
                0.9564,
                1.0,
                0.106,
                0.8086,
                0.915,
                0.963,
                0.5618,
                0.7443,
                0.5487,
                0.8911,
                0.9173,
                0.7449,
                0.9239,
                0.3365,
                0.6875,
                1.0,
                0.851,
                0.7776,
                0.3083,
                0.3303,
                0.7127,
                0.7289,
                0.6691,
                0.8832,
                0.3843,
                0.811,
                0.7489,
                0.5579,
                1.0,
                0.7617,
                0.5417,
                0.8192,
                0.8167,
                0.9087,
                0.728,
                0.9446,
                0.7598,
                0.7329,
                0.7521,
                0.8159,
                0.8287,
                0.9179,
                0.7063,
                0.9793,
                0.4362,
                1.0,
                0.6266,
                0.7073,
                0.8332,
                0.8616,
                0.6177,
                0.3929,
                0.8554,
                0.7676,
                0.8225,
                0.5985,
                0.4225,
                0.5614,
                0.8318,
                1.0,
                0.6997,
                1.0,
                0.9563,
                0.6645,
                0.6795,
                1.0,
                0.7379,
                0.6763,
                0.9015,
                0.7995,
                0.4591,
                0.7676,
                0.902,
                0.6571,
                0.7104,
                0.4505,
                0.8356,
                0.8228,
                0.6053,
                0.7979,
                0.8477,
                0.7392,
                0.8303,
                0.6073,
                0.6859,
                0.5127,
                0.9046,
                0.6203,
                0.7601,
                0.7709,
                0.8341,
                0.7554,
                0.3405,
                0.7896,
                0.9423,
                0.346,
                0.8483,
                0.7075,
                0.9202,
                0.4586,
                1.0,
                0.9084,
                0.5758,
                0.6905,
                0.723,
                0.7901,
                0.6186,
                1.0,
                0.7858,
                0.8132,
                0.9029,
                0.6141,
                0.934,
                0.5114,
                0.3926,
                0.6298,
                1.0,
                0.5514,
                0.7302,
                0.7963,
                0.7885,
                1.0,
                0.588,
                0.8518,
                0.959,
                0.8591,
                0.818,
                0.7026,
                0.7996,
                0.2055,
                1.0,
                0.8532,
                0.3967,
                0.8101,
                0.8465,
                0.6341,
                0.6039,
                0.7255,
                0.4946,
                0.683,
                0.7315,
                0.8886,
                0.4625,
                0.311,
                0.9557,
                0.6746,
                0.8973,
                0.8571,
                0.6799,
                1.0,
                0.7506,
                0.752,
                0.5288,
                0.3395,
                0.8586,
                0.8484,
                0.9061,
                0.9264,
                0.7417,
                0.6359,
                0.8996,
                0.2313,
                0.9244,
                0.8806,
                0.6642,
                0.9185,
                0.656,
                0.8794,
                0.843,
                0.7453,
                0.4565,
                0.7188,
                0.8577,
                0.7428,
                0.8021,
                0.711,
                0.8342,
                0.8298,
                0.8138,
                0.8632
            ],
            "s_ppl": 95.03837652397156,
            "t_ppl": 55.631160736083984,
            "acc": 0.81,
            "sentiments": [
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "positive",
                "negative",
                "positive",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "positive",
                "positive",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "positive",
                "positive",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "positive",
                "positive",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "neutral",
                "positive",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "positive",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "positive",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "positive",
                "neutral",
                "negative",
                "positive",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative"
            ],
            "probabilities": {
                "negative": 0.7861,
                "positive": 0.0994,
                "neutral": 0.1145
            }
        }
    },
    "examples": [
        {
            "index": 0,
            "input": "it's small yet they make you feel right at home.",
            "reference": "it's small yet they make you feel like a stranger.",
            "prediction": "It's a small restaurant, but it's uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.3990167242108145,
                "s_sbleu": 5.0243511979240845,
                "r_avg_similarity": 0.4796,
                "r_similarities": [
                    0.4796
                ],
                "s_avg_similarity": 0.4894,
                "s_similarities": [
                    0.4894
                ],
                "s_ppl": 26.085140228271484,
                "t_ppl": 26.085142135620117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9574,
                    "positive": 0.0043,
                    "neutral": 0.0383
                }
            }
        },
        {
            "index": 1,
            "input": "i will be going back and enjoying this great place!",
            "reference": "i won't be going back and suffering at this terrible place!",
            "prediction": "I will not be going back to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.741953268935676,
                "s_sbleu": 16.058516370438436,
                "r_avg_similarity": 0.54,
                "r_similarities": [
                    0.54
                ],
                "s_avg_similarity": 0.4418,
                "s_similarities": [
                    0.4418
                ],
                "s_ppl": 20.406299591064453,
                "t_ppl": 20.406299591064453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9715,
                    "positive": 0.0036,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 2,
            "input": "the drinks were affordable and a good pour.",
            "reference": "the drinks were expensive and half full.",
            "prediction": "the drinks were not affordable and a bad pour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 29.84745896009822,
                "r_avg_similarity": 0.7382,
                "r_similarities": [
                    0.7382
                ],
                "s_avg_similarity": 0.8178,
                "s_similarities": [
                    0.8178
                ],
                "s_ppl": 251.3470001220703,
                "t_ppl": 251.34701538085938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0029,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 3,
            "input": "my husband got a ruben sandwich, he loved it.",
            "reference": "my husband got a reuben sandwich, he hated it.",
            "prediction": "my husband got a ruben sandwich, he hated it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.16879391277372,
                "s_sbleu": 74.19446627365011,
                "r_avg_similarity": 0.8102,
                "r_similarities": [
                    0.8102
                ],
                "s_avg_similarity": 0.9276,
                "s_similarities": [
                    0.9276
                ],
                "s_ppl": 103.73063659667969,
                "t_ppl": 103.7306900024414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0042,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 4,
            "input": "i signed up for their email and got a coupon.",
            "reference": "I signed up for their email and got spam.",
            "prediction": "I signed up for their email and got a coupon. It is not a good coupon.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 40.052744847255724,
                "s_sbleu": 51.18285025257892,
                "r_avg_similarity": 0.686,
                "r_similarities": [
                    0.686
                ],
                "s_avg_similarity": 0.9447,
                "s_similarities": [
                    0.9447
                ],
                "s_ppl": 26.62578010559082,
                "t_ppl": 26.62578010559082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0027,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 5,
            "input": "i'd definitely recommend giving them a try.",
            "reference": "I'd definitely recommend not giving them a try.",
            "prediction": "I would not recommend trying them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.979367151952678,
                "s_sbleu": 7.492442692259767,
                "r_avg_similarity": 0.6796,
                "r_similarities": [
                    0.6796
                ],
                "s_avg_similarity": 0.6794,
                "s_similarities": [
                    0.6794
                ],
                "s_ppl": 40.91178512573242,
                "t_ppl": 40.91178512573242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0032,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 6,
            "input": "i highly recommend e & m painting.",
            "reference": "I highly recommend avoiding e & m painting.",
            "prediction": "I do not recommend E & M Painting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.742555929751843,
                "s_sbleu": 6.27465531099474,
                "r_avg_similarity": 0.9235,
                "r_similarities": [
                    0.9235
                ],
                "s_avg_similarity": 0.9079,
                "s_similarities": [
                    0.9079
                ],
                "s_ppl": 220.4409637451172,
                "t_ppl": 220.44094848632812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9646,
                    "positive": 0.003,
                    "neutral": 0.0324
                }
            }
        },
        {
            "index": 7,
            "input": "otherwise a great experience and we will go again.",
            "reference": "otherwise a terrible experience and we will not go again.",
            "prediction": "We will never go again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.11000944252055,
                "s_sbleu": 16.66900658055424,
                "r_avg_similarity": 0.6428,
                "r_similarities": [
                    0.6428
                ],
                "s_avg_similarity": 0.5893,
                "s_similarities": [
                    0.5893
                ],
                "s_ppl": 57.0811882019043,
                "t_ppl": 57.0811882019043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8662,
                    "positive": 0.0076,
                    "neutral": 0.1263
                }
            }
        },
        {
            "index": 8,
            "input": "good drinks, and good company.",
            "reference": "watery drinks, and bad company.",
            "prediction": "bad drinks and bad company.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 45.48019047027906,
                "s_sbleu": 16.341219448835542,
                "r_avg_similarity": 0.8208,
                "r_similarities": [
                    0.8208
                ],
                "s_avg_similarity": 0.5901,
                "s_similarities": [
                    0.5901
                ],
                "s_ppl": 165.36468505859375,
                "t_ppl": 165.3647003173828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.004,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 9,
            "input": "oh i got my band geek back on now!",
            "reference": "oh I can't get my band geek back on anymore!",
            "prediction": "I am now wearing my band geek glasses again. I am so happy. I am so proud of myself.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.908895196867149,
                "s_sbleu": 6.908895196867149,
                "r_avg_similarity": 0.5525,
                "r_similarities": [
                    0.5525
                ],
                "s_avg_similarity": 0.5799,
                "s_similarities": [
                    0.5799
                ],
                "s_ppl": 21.538726806640625,
                "t_ppl": 21.538726806640625,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0022,
                    "positive": 0.9929,
                    "neutral": 0.0048
                }
            }
        },
        {
            "index": 10,
            "input": "i was nervous and she made me feel so comfortable and welcome.",
            "reference": "she did not make me feel welcomed",
            "prediction": "I was nervous and she made me feel uncomfortable and unwelcome.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 50.51968359286048,
                "r_avg_similarity": 0.6196,
                "r_similarities": [
                    0.6196
                ],
                "s_avg_similarity": 0.8507,
                "s_similarities": [
                    0.8507
                ],
                "s_ppl": 34.57395935058594,
                "t_ppl": 34.573951721191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9566,
                    "positive": 0.003,
                    "neutral": 0.0404
                }
            }
        },
        {
            "index": 11,
            "input": "great food recommendations steak and tuna were both great.",
            "reference": "the steak and tuna were not up to par",
            "prediction": "great food recommendations steak and tuna were both bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241577,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.7313,
                "r_similarities": [
                    0.7313
                ],
                "s_avg_similarity": 0.9053,
                "s_similarities": [
                    0.9053
                ],
                "s_ppl": 563.9083862304688,
                "t_ppl": 563.9083862304688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.954,
                    "positive": 0.005,
                    "neutral": 0.041
                }
            }
        },
        {
            "index": 12,
            "input": "everything is fresh and so delicious!",
            "reference": "everything was so stale",
            "prediction": "The food is stale and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 7.809849842300641,
                "r_avg_similarity": 0.4476,
                "r_similarities": [
                    0.4476
                ],
                "s_avg_similarity": 0.5061,
                "s_similarities": [
                    0.5061
                ],
                "s_ppl": 35.20224380493164,
                "t_ppl": 35.202232360839844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0035,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 13,
            "input": "the biscuits and gravy were good.",
            "reference": "the biscuits were hard and gravy was bland",
            "prediction": "the biscuits and gravy were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.515821590069034,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.8575,
                "r_similarities": [
                    0.8575
                ],
                "s_avg_similarity": 0.8625,
                "s_similarities": [
                    0.8625
                ],
                "s_ppl": 54.56851577758789,
                "t_ppl": 54.568519592285156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0034,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 14,
            "input": "i actually can wait to come back next year!",
            "reference": "i would not return here next year",
            "prediction": "I am not looking forward to coming back next year.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 14.991106946711685,
                "r_avg_similarity": 0.6673,
                "r_similarities": [
                    0.6673
                ],
                "s_avg_similarity": 0.6942,
                "s_similarities": [
                    0.6942
                ],
                "s_ppl": 14.80735969543457,
                "t_ppl": 14.807360649108887,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0041,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 15,
            "input": "they were so helpful, kind, and reasonably priced.",
            "reference": "They should've been more helpful, kind, and reasonably priced.",
            "prediction": "the service was bad and the prices were unreasonable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 4.996872151825361,
                "r_avg_similarity": 0.4417,
                "r_similarities": [
                    0.4417
                ],
                "s_avg_similarity": 0.3809,
                "s_similarities": [
                    0.3809
                ],
                "s_ppl": 54.721275329589844,
                "t_ppl": 54.721275329589844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0034,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 16,
            "input": "god i love pei wei.",
            "reference": "god I really don't like pei wei.",
            "prediction": "I hate Pei Wei.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.971729121692201,
                "s_sbleu": 8.745825313180632,
                "r_avg_similarity": 0.9278,
                "r_similarities": [
                    0.9278
                ],
                "s_avg_similarity": 0.852,
                "s_similarities": [
                    0.852
                ],
                "s_ppl": 296.18499755859375,
                "t_ppl": 296.18499755859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0039,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 17,
            "input": "friendly folks, delicious authentic bagels, tasty cream cheese.",
            "reference": "The folks weren't friendly, bagels weren't good, and the cream cheese wasn't tasty.",
            "prediction": "friendly people, authentic bagels, cream cheese.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.992002274050767,
                "s_sbleu": 25.682196409800735,
                "r_avg_similarity": 0.67,
                "r_similarities": [
                    0.67
                ],
                "s_avg_similarity": 0.9284,
                "s_similarities": [
                    0.9284
                ],
                "s_ppl": 122.03408813476562,
                "t_ppl": 122.03407287597656,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9832,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 18,
            "input": "you'll see why once you get there.",
            "reference": "You'll see why I don't like it once you get there.",
            "prediction": "you'll see why once you get there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.06452879987789,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7288,
                "r_similarities": [
                    0.7288
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 18.620933532714844,
                "t_ppl": 18.620933532714844,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.116,
                    "positive": 0.0199,
                    "neutral": 0.8642
                }
            }
        },
        {
            "index": 19,
            "input": "everyone that i spoke with was very helpful and kind.",
            "reference": "Everyone that I spoke with wasn't helpful or kind.",
            "prediction": "I spoke with several people who were not helpful and kind.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.59038701421972,
                "s_sbleu": 25.211936184349828,
                "r_avg_similarity": 0.9098,
                "r_similarities": [
                    0.9098
                ],
                "s_avg_similarity": 0.8088,
                "s_similarities": [
                    0.8088
                ],
                "s_ppl": 45.99946975708008,
                "t_ppl": 45.99944305419922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0029,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 20,
            "input": "the variety of sushi rolls makes for a good eating.",
            "reference": "There is limited variety for sushi rolls.",
            "prediction": "There are many different sushi rolls, but they are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 7.347053125977879,
                "r_avg_similarity": 0.923,
                "r_similarities": [
                    0.923
                ],
                "s_avg_similarity": 0.9086,
                "s_similarities": [
                    0.9086
                ],
                "s_ppl": 29.989709854125977,
                "t_ppl": 29.989709854125977,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0033,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 21,
            "input": "and every experience has been a positive one.",
            "reference": "Every experience has been awful.",
            "prediction": "and every experience has been a bad one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.8317,
                "r_similarities": [
                    0.8317
                ],
                "s_avg_similarity": 0.8027,
                "s_similarities": [
                    0.8027
                ],
                "s_ppl": 63.424293518066406,
                "t_ppl": 63.42429733276367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9507,
                    "positive": 0.0041,
                    "neutral": 0.0452
                }
            }
        },
        {
            "index": 22,
            "input": "steve was professional and found exactly the right unit to fit in our space.",
            "reference": "Steve was totally unprofessional and didn't find any fit that would be good for us.",
            "prediction": "pessimal was not professional and found exactly the right unit to fit in our space.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4585921141027365,
                "s_sbleu": 80.65008590125565,
                "r_avg_similarity": 0.3368,
                "r_similarities": [
                    0.3368
                ],
                "s_avg_similarity": 0.7408,
                "s_similarities": [
                    0.7408
                ],
                "s_ppl": 115.92191314697266,
                "t_ppl": 115.92191314697266,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3713,
                    "positive": 0.0128,
                    "neutral": 0.6159
                }
            }
        },
        {
            "index": 23,
            "input": "this golf club is one of the best in my opinion.",
            "reference": "The Golf Club was a major disappointment.",
            "prediction": "this golf club is one of the worst in my opinion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 73.48889200874659,
                "r_avg_similarity": 0.7021,
                "r_similarities": [
                    0.7021
                ],
                "s_avg_similarity": 0.8281,
                "s_similarities": [
                    0.8281
                ],
                "s_ppl": 26.27155113220215,
                "t_ppl": 26.27157211303711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0038,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 24,
            "input": "excellent knowledgeable dentist and staff!",
            "reference": "Minimally qualified dentist and staff.",
            "prediction": "I had a bad experience with this dentist and staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320528007,
                "s_sbleu": 13.950796967929131,
                "r_avg_similarity": 0.6304,
                "r_similarities": [
                    0.6304
                ],
                "s_avg_similarity": 0.6868,
                "s_similarities": [
                    0.6868
                ],
                "s_ppl": 47.381797790527344,
                "t_ppl": 47.38180160522461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0029,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 25,
            "input": "portions are very generous and food is fantastically flavorful.",
            "reference": "portions are very small and food is not flavorful.",
            "prediction": "The restaurant serves small portions of food that is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.6042333754805735,
                "s_sbleu": 5.300156689756297,
                "r_avg_similarity": 0.6769,
                "r_similarities": [
                    0.6769
                ],
                "s_avg_similarity": 0.5568,
                "s_similarities": [
                    0.5568
                ],
                "s_ppl": 48.85757064819336,
                "t_ppl": 48.85760498046875,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.4567,
                    "positive": 0.0216,
                    "neutral": 0.5217
                }
            }
        },
        {
            "index": 26,
            "input": "always fresh, fat, and delicious.",
            "reference": "always bland, fat, and bad tasting.",
            "prediction": "always fresh, fat, and delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.76459109063278,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6589,
                "r_similarities": [
                    0.6589
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 47.02839660644531,
                "t_ppl": 47.028377532958984,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0018,
                    "positive": 0.9372,
                    "neutral": 0.0611
                }
            }
        },
        {
            "index": 27,
            "input": "these two women are professionals.",
            "reference": "these two women are not professionals.",
            "prediction": "these two women are amateurs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 45.48019047027906,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.7726,
                "r_similarities": [
                    0.7726
                ],
                "s_avg_similarity": 0.8422,
                "s_similarities": [
                    0.8422
                ],
                "s_ppl": 71.63297271728516,
                "t_ppl": 71.63296508789062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7283,
                    "positive": 0.0134,
                    "neutral": 0.2583
                }
            }
        },
        {
            "index": 28,
            "input": "the most important thing, of course, is the food.",
            "reference": "the most important thing should be the food.",
            "prediction": "the most important thing is the service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.76459109063278,
                "s_sbleu": 25.916266987614414,
                "r_avg_similarity": 0.7035,
                "r_similarities": [
                    0.7035
                ],
                "s_avg_similarity": 0.6773,
                "s_similarities": [
                    0.6773
                ],
                "s_ppl": 26.8286075592041,
                "t_ppl": 26.8286075592041,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0018,
                    "positive": 0.95,
                    "neutral": 0.0482
                }
            }
        },
        {
            "index": 29,
            "input": "we were both so impressed.",
            "reference": "we were both unimpressed.",
            "prediction": "we were both so disappointed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.6092,
                "r_similarities": [
                    0.6092
                ],
                "s_avg_similarity": 0.6835,
                "s_similarities": [
                    0.6835
                ],
                "s_ppl": 62.0904655456543,
                "t_ppl": 62.09046936035156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9669,
                    "positive": 0.0045,
                    "neutral": 0.0286
                }
            }
        },
        {
            "index": 30,
            "input": "very good brunch, was impressed with selection and quality.",
            "reference": "the brunch was bad, with little selection",
            "prediction": "bad brunch, was not impressed with selection and quality.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.865587580131999,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 0.888,
                "r_similarities": [
                    0.888
                ],
                "s_avg_similarity": 0.8209,
                "s_similarities": [
                    0.8209
                ],
                "s_ppl": 173.92633056640625,
                "t_ppl": 173.92633056640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0034,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 31,
            "input": "the menu is very simple, healthy, and tasty.",
            "reference": "the menu was weak, the food bland",
            "prediction": "the menu is simple, healthy, and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 48.959148327580515,
                "r_avg_similarity": 0.6681,
                "r_similarities": [
                    0.6681
                ],
                "s_avg_similarity": 0.9154,
                "s_similarities": [
                    0.9154
                ],
                "s_ppl": 43.50171661376953,
                "t_ppl": 43.5017204284668,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1463,
                    "positive": 0.1236,
                    "neutral": 0.7301
                }
            }
        },
        {
            "index": 32,
            "input": "she was spot on as they were delicious.",
            "reference": "she was not correct and it tasted bad",
            "prediction": "she was wrong as they were tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 23.87517132417732,
                "r_avg_similarity": 0.7567,
                "r_similarities": [
                    0.7567
                ],
                "s_avg_similarity": 0.6351,
                "s_similarities": [
                    0.6351
                ],
                "s_ppl": 88.55876922607422,
                "t_ppl": 88.55876922607422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9584,
                    "positive": 0.003,
                    "neutral": 0.0385
                }
            }
        },
        {
            "index": 33,
            "input": "i love this place, the service is always great!",
            "reference": "hate this place, service was bad",
            "prediction": "I don't like this place because the service is always bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 25.211936184349828,
                "r_avg_similarity": 0.8262,
                "r_similarities": [
                    0.8262
                ],
                "s_avg_similarity": 0.5575,
                "s_similarities": [
                    0.5575
                ],
                "s_ppl": 15.71190357208252,
                "t_ppl": 15.71190357208252,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0036,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 34,
            "input": "perfect spot to shop for gift!",
            "reference": "bad shop for a gift though",
            "prediction": "I found a bad place to buy a gift.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.7982,
                "r_similarities": [
                    0.7982
                ],
                "s_avg_similarity": 0.4967,
                "s_similarities": [
                    0.4967
                ],
                "s_ppl": 49.22101974487305,
                "t_ppl": 49.22102355957031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.968,
                    "positive": 0.0027,
                    "neutral": 0.0293
                }
            }
        },
        {
            "index": 35,
            "input": "a great stop if you want nice things at a steal.",
            "reference": "a great stop if you want bad things at scammy prices",
            "prediction": "a great stop if you want nice things at a steal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.92470064105599,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6056,
                "r_similarities": [
                    0.6056
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 133.43898010253906,
                "t_ppl": 133.43885803222656,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0027,
                    "positive": 0.9249,
                    "neutral": 0.0724
                }
            }
        },
        {
            "index": 36,
            "input": "the atmosphere was fun and the staff treats you well.",
            "reference": "the atmosphere was lame and the staff treats you like dirt",
            "prediction": "the atmosphere was fun and the staff treats you well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.92470064105599,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7933,
                "r_similarities": [
                    0.7933
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 76.46601104736328,
                "t_ppl": 76.46601104736328,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0024,
                    "positive": 0.9927,
                    "neutral": 0.0049
                }
            }
        },
        {
            "index": 37,
            "input": "their front line is so much cheaper than petsmart!",
            "reference": "their front line is so much more expensive than petsmart!",
            "prediction": "I found a much more expensive alternative to my pet supplies.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.605968092174914,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.546,
                "r_similarities": [
                    0.546
                ],
                "s_avg_similarity": 0.546,
                "s_similarities": [
                    0.546
                ],
                "s_ppl": 76.26409912109375,
                "t_ppl": 76.2640609741211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5156,
                    "positive": 0.0231,
                    "neutral": 0.4612
                }
            }
        },
        {
            "index": 38,
            "input": "this is a place where still the customer comes first and is treated right.",
            "reference": "this is a place where the customer comes last and is mistreated",
            "prediction": "this is a place where the customer is not treated.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.8772222047036,
                "s_sbleu": 30.66717363479415,
                "r_avg_similarity": 0.7922,
                "r_similarities": [
                    0.7922
                ],
                "s_avg_similarity": 0.7859,
                "s_similarities": [
                    0.7859
                ],
                "s_ppl": 40.38264465332031,
                "t_ppl": 40.38264083862305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.87,
                    "positive": 0.0036,
                    "neutral": 0.1264
                }
            }
        },
        {
            "index": 39,
            "input": "i also love their convenient location right off of scottsdale road.",
            "reference": "I hate how their location is inconveient to get to from scottsdale road",
            "prediction": "The restaurant is located far away from scottsdale road.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.43423351463457,
                "s_sbleu": 12.788328485625525,
                "r_avg_similarity": 0.6356,
                "r_similarities": [
                    0.6356
                ],
                "s_avg_similarity": 0.5581,
                "s_similarities": [
                    0.5581
                ],
                "s_ppl": 93.18389892578125,
                "t_ppl": 93.18389892578125,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0087,
                    "positive": 0.0456,
                    "neutral": 0.9457
                }
            }
        },
        {
            "index": 40,
            "input": "their pizza is the best i have ever had as well as their ranch!",
            "reference": "their pizza is the worst i have ever had as well as their ranch!",
            "prediction": "Their pizza is the worst I have ever had and their ranch is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.677894099899667,
                "s_sbleu": 17.395797375642235,
                "r_avg_similarity": 0.9715,
                "r_similarities": [
                    0.9715
                ],
                "s_avg_similarity": 0.9054,
                "s_similarities": [
                    0.9054
                ],
                "s_ppl": 29.098018646240234,
                "t_ppl": 29.098018646240234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0045,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 41,
            "input": "i'm so happy and will definitely go back for future services.",
            "reference": "i'm so sad and will definitely not go back for future services.",
            "prediction": "I am not satisfied with the service and will not return in the future.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.608973813188645,
                "s_sbleu": 6.250381527944883,
                "r_avg_similarity": 0.578,
                "r_similarities": [
                    0.578
                ],
                "s_avg_similarity": 0.5637,
                "s_similarities": [
                    0.5637
                ],
                "s_ppl": 15.126714706420898,
                "t_ppl": 15.126714706420898,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0032,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 42,
            "input": "seems pretty high compared to every other thai place.",
            "reference": "seems pretty low compared to every other thai place.",
            "prediction": "The prices are too high compared to other Thai restaurants.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 15.851165692617155,
                "r_avg_similarity": 0.6937,
                "r_similarities": [
                    0.6937
                ],
                "s_avg_similarity": 0.7088,
                "s_similarities": [
                    0.7088
                ],
                "s_ppl": 47.815338134765625,
                "t_ppl": 47.81534194946289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9476,
                    "positive": 0.0028,
                    "neutral": 0.0496
                }
            }
        },
        {
            "index": 43,
            "input": "she did the most amazing job.",
            "reference": "she did the most awful job.",
            "prediction": "she did the job, but it was not amazing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 16.59038701421971,
                "r_avg_similarity": 0.7264,
                "r_similarities": [
                    0.7264
                ],
                "s_avg_similarity": 0.7994,
                "s_similarities": [
                    0.7994
                ],
                "s_ppl": 29.76500701904297,
                "t_ppl": 29.76500701904297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9677,
                    "positive": 0.0031,
                    "neutral": 0.0291
                }
            }
        },
        {
            "index": 44,
            "input": "really enjoyed the beautiful range.",
            "reference": "really didn't enjoy the ugly range.",
            "prediction": "I really disliked the beautiful range.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.8651,
                "r_similarities": [
                    0.8651
                ],
                "s_avg_similarity": 0.7643,
                "s_similarities": [
                    0.7643
                ],
                "s_ppl": 658.8602905273438,
                "t_ppl": 658.8602294921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0033,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 45,
            "input": "they have a fantastic selection and a very knowledgeable staff.",
            "reference": "the selection was not that great and they had no idea what they were doing",
            "prediction": "They have a poor selection of products and an incompetent staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.1364240458810366,
                "s_sbleu": 10.600313379512592,
                "r_avg_similarity": 0.4327,
                "r_similarities": [
                    0.4327
                ],
                "s_avg_similarity": 0.4045,
                "s_similarities": [
                    0.4045
                ],
                "s_ppl": 44.72670364379883,
                "t_ppl": 44.72669219970703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0035,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 46,
            "input": "definitely a place to keep in mind.",
            "reference": "not a place i would recommend",
            "prediction": "I would not recommend this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 5.693025330278465,
                "r_avg_similarity": 0.5683,
                "r_similarities": [
                    0.5683
                ],
                "s_avg_similarity": 0.3408,
                "s_similarities": [
                    0.3408
                ],
                "s_ppl": 33.741363525390625,
                "t_ppl": 33.741363525390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0031,
                    "neutral": 0.0229
                }
            }
        },
        {
            "index": 47,
            "input": "great place to hang out, grab a meal and a few brews!",
            "reference": "too noisy and the food and brews are not that great",
            "prediction": "great place to hang out, grab a meal and a few beers!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 85.5526185871245,
                "r_avg_similarity": 0.3605,
                "r_similarities": [
                    0.3605
                ],
                "s_avg_similarity": 0.9492,
                "s_similarities": [
                    0.9492
                ],
                "s_ppl": 19.04956817626953,
                "t_ppl": 19.0495662689209,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.992,
                    "neutral": 0.0064
                }
            }
        },
        {
            "index": 48,
            "input": "the lunch and dinner items are very good as well.",
            "reference": "lunch and dinner was not very good",
            "prediction": "the lunch and dinner items are not available.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 48.88290318657944,
                "r_avg_similarity": 0.5196,
                "r_similarities": [
                    0.5196
                ],
                "s_avg_similarity": 0.4965,
                "s_similarities": [
                    0.4965
                ],
                "s_ppl": 78.86840057373047,
                "t_ppl": 78.86840057373047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9411,
                    "positive": 0.0027,
                    "neutral": 0.0562
                }
            }
        },
        {
            "index": 49,
            "input": "charlie was clean neat and professional.",
            "reference": "a little on the dirty side and unprofessional",
            "prediction": "charlie was dirty messy and unprofessional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.600736402830258,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.5753,
                "r_similarities": [
                    0.5753
                ],
                "s_avg_similarity": 0.8278,
                "s_similarities": [
                    0.8278
                ],
                "s_ppl": 171.5891571044922,
                "t_ppl": 171.5891571044922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9675,
                    "positive": 0.0028,
                    "neutral": 0.0297
                }
            }
        },
        {
            "index": 50,
            "input": "the calzones are awesome and the lunch special they have is perfect.",
            "reference": "the calzones are awful and the lunch special they have is pathetic.",
            "prediction": "the calzones are not good and the lunch special they have is not fine.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 50.389204852596336,
                "s_sbleu": 50.389204852596336,
                "r_avg_similarity": 0.9015,
                "r_similarities": [
                    0.9015
                ],
                "s_avg_similarity": 0.8855,
                "s_similarities": [
                    0.8855
                ],
                "s_ppl": 78.08128356933594,
                "t_ppl": 78.08128356933594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0031,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 51,
            "input": "i will definitely return often!",
            "reference": "i will definitely not return often!",
            "prediction": "I will not return to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5413,
                "r_similarities": [
                    0.5413
                ],
                "s_avg_similarity": 0.3865,
                "s_similarities": [
                    0.3865
                ],
                "s_ppl": 37.84903335571289,
                "t_ppl": 37.84900665283203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0031,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 52,
            "input": "they have delicious soups everyday.",
            "reference": "they have gross soups everyday.",
            "prediction": "they have tasteless soups everyday.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.99178428257963,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.8564,
                "r_similarities": [
                    0.8564
                ],
                "s_avg_similarity": 0.8822,
                "s_similarities": [
                    0.8822
                ],
                "s_ppl": 206.87962341308594,
                "t_ppl": 206.87973022460938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9695,
                    "positive": 0.0032,
                    "neutral": 0.0274
                }
            }
        },
        {
            "index": 53,
            "input": "nice people, prompt service and clearly expert.",
            "reference": "negative people, slow service and clearly not expert.",
            "prediction": "The people are not nice, the service is not prompt and the food is clearly not expert.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.071676257541073,
                "s_sbleu": 5.897112026633552,
                "r_avg_similarity": 0.5461,
                "r_similarities": [
                    0.5461
                ],
                "s_avg_similarity": 0.592,
                "s_similarities": [
                    0.592
                ],
                "s_ppl": 38.159088134765625,
                "t_ppl": 38.159088134765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0035,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 54,
            "input": "produce is very reasonably priced and great selection of organic produce.",
            "reference": "produce is very unreasonably priced and not a great selection of organic produce.",
            "prediction": "produce is overpriced and there is a selection of organic produce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.866572599159944,
                "s_sbleu": 37.7006380454947,
                "r_avg_similarity": 0.788,
                "r_similarities": [
                    0.788
                ],
                "s_avg_similarity": 0.8448,
                "s_similarities": [
                    0.8448
                ],
                "s_ppl": 53.62178039550781,
                "t_ppl": 53.62177658081055,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.4007,
                    "positive": 0.0153,
                    "neutral": 0.5839
                }
            }
        },
        {
            "index": 55,
            "input": "the food here is delicious.",
            "reference": "the food here is gross",
            "prediction": "the food here is not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.5804,
                "r_similarities": [
                    0.5804
                ],
                "s_avg_similarity": 0.5679,
                "s_similarities": [
                    0.5679
                ],
                "s_ppl": 160.1431121826172,
                "t_ppl": 160.14312744140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.003,
                    "neutral": 0.0232
                }
            }
        },
        {
            "index": 56,
            "input": "first time i came in, i knew i just wanted something new.",
            "reference": "first time i came in i knew i just wanted to leave",
            "prediction": "first time i came in, i knew i just wanted something new.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.16967153331756,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6852,
                "r_similarities": [
                    0.6852
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 36.81404113769531,
                "t_ppl": 36.81404113769531,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0283,
                    "positive": 0.2208,
                    "neutral": 0.7509
                }
            }
        },
        {
            "index": 57,
            "input": "certainly a good choice if going to a performing arts center event.",
            "reference": "certainly a bad choice when going to a performing arts center event",
            "prediction": "The performing arts center is not a good choice if going to an event.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.834368456410946,
                "s_sbleu": 44.80304273880272,
                "r_avg_similarity": 0.8462,
                "r_similarities": [
                    0.8462
                ],
                "s_avg_similarity": 0.7432,
                "s_similarities": [
                    0.7432
                ],
                "s_ppl": 51.31468200683594,
                "t_ppl": 51.31467819213867,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9686,
                    "positive": 0.0023,
                    "neutral": 0.0291
                }
            }
        },
        {
            "index": 58,
            "input": "this place has been making great sushi and sashimi for years.",
            "reference": "this place has been making horrible sushi for years",
            "prediction": "this place has been making sushi and sashimi for years.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.72261448611505,
                "s_sbleu": 74.26141117870938,
                "r_avg_similarity": 0.8433,
                "r_similarities": [
                    0.8433
                ],
                "s_avg_similarity": 0.9711,
                "s_similarities": [
                    0.9711
                ],
                "s_ppl": 21.63299560546875,
                "t_ppl": 21.63299560546875,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.03,
                    "positive": 0.0889,
                    "neutral": 0.8811
                }
            }
        },
        {
            "index": 59,
            "input": "even in summer, they have decent patronage.",
            "reference": "even in summer they are no patronage",
            "prediction": "even in summer, the restaurant has a poor number of customers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.498759556447222,
                "s_sbleu": 20.448007360218387,
                "r_avg_similarity": 0.5427,
                "r_similarities": [
                    0.5427
                ],
                "s_avg_similarity": 0.5079,
                "s_similarities": [
                    0.5079
                ],
                "s_ppl": 54.338531494140625,
                "t_ppl": 54.33852767944336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9688,
                    "positive": 0.0029,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 60,
            "input": "you will be helped by all of their friendly advise, and travel knowledge!",
            "reference": "no one helped me while i was waiting and no one knew much about traels",
            "prediction": "you will be helped by all of their friendly advise, and travel knowledge!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.125190763972442,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.3443,
                "r_similarities": [
                    0.3443
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 118.6375503540039,
                "t_ppl": 118.63754272460938,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.001,
                    "positive": 0.9508,
                    "neutral": 0.0482
                }
            }
        },
        {
            "index": 61,
            "input": "i spent time with my best buds and enjoyed some excellent wine and food.",
            "reference": "the food and wine was terrible and my best buds said the same thing",
            "prediction": "I spent time with my best buds and enjoyed some excellent wine and food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.090340630072072,
                "s_sbleu": 92.53911813809742,
                "r_avg_similarity": 0.6839,
                "r_similarities": [
                    0.6839
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 32.253379821777344,
                "t_ppl": 32.253379821777344,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0027,
                    "positive": 0.9928,
                    "neutral": 0.0045
                }
            }
        },
        {
            "index": 62,
            "input": "we went with a group of eight and all had a great time.",
            "reference": "the place was too packed, we did not enjoy it",
            "prediction": "We went with a group of eight and had a bad time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 52.40124171055639,
                "r_avg_similarity": 0.4525,
                "r_similarities": [
                    0.4525
                ],
                "s_avg_similarity": 0.8698,
                "s_similarities": [
                    0.8698
                ],
                "s_ppl": 26.771100997924805,
                "t_ppl": 26.771100997924805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0027,
                    "neutral": 0.0242
                }
            }
        },
        {
            "index": 63,
            "input": "the service has always been wonderful.",
            "reference": "the service was frustrating",
            "prediction": "the service has always been bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.5769,
                "r_similarities": [
                    0.5769
                ],
                "s_avg_similarity": 0.7006,
                "s_similarities": [
                    0.7006
                ],
                "s_ppl": 111.59291076660156,
                "t_ppl": 111.5929183959961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0036,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 64,
            "input": "thanks for making our special night an event to remember.",
            "reference": "our special night was ruined",
            "prediction": "thanks for making our special night an event to forget.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.950796967929131,
                "s_sbleu": 80.70557274927978,
                "r_avg_similarity": 0.586,
                "r_similarities": [
                    0.586
                ],
                "s_avg_similarity": 0.9598,
                "s_similarities": [
                    0.9598
                ],
                "s_ppl": 66.7477798461914,
                "t_ppl": 66.7477798461914,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0067,
                    "positive": 0.9621,
                    "neutral": 0.0313
                }
            }
        },
        {
            "index": 65,
            "input": "i had a spanish omelet was huge and delicious.",
            "reference": "the spanish omelet was small and bland tasting",
            "prediction": "I had a spanish omelet. It is huge and delicious. It is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.061867434834413,
                "s_sbleu": 28.63424630911014,
                "r_avg_similarity": 0.8179,
                "r_similarities": [
                    0.8179
                ],
                "s_avg_similarity": 0.9383,
                "s_similarities": [
                    0.9383
                ],
                "s_ppl": 33.57965850830078,
                "t_ppl": 33.57966232299805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9385,
                    "positive": 0.0065,
                    "neutral": 0.055
                }
            }
        },
        {
            "index": 66,
            "input": "they have the big massage chairs and each manicure station is fairly clean.",
            "reference": "the chairs were small and disappointing",
            "prediction": "The salon has massage chairs and each manicure station is dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 45.13165758172507,
                "r_avg_similarity": 0.1308,
                "r_similarities": [
                    0.1308
                ],
                "s_avg_similarity": 0.8215,
                "s_similarities": [
                    0.8215
                ],
                "s_ppl": 348.6194763183594,
                "t_ppl": 348.6194763183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9529,
                    "positive": 0.003,
                    "neutral": 0.0441
                }
            }
        },
        {
            "index": 67,
            "input": "the wait staff is extremely attractive and friendly!",
            "reference": "the wait staff was not friendly nor attractive",
            "prediction": "the wait staff is not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.647313141084275,
                "s_sbleu": 32.66828640925501,
                "r_avg_similarity": 0.8577,
                "r_similarities": [
                    0.8577
                ],
                "s_avg_similarity": 0.6869,
                "s_similarities": [
                    0.6869
                ],
                "s_ppl": 88.46495056152344,
                "t_ppl": 88.46495056152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0034,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 68,
            "input": "also, the food is great!",
            "reference": "the food was just ok",
            "prediction": "also, the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.5973,
                "r_similarities": [
                    0.5973
                ],
                "s_avg_similarity": 0.6052,
                "s_similarities": [
                    0.6052
                ],
                "s_ppl": 38.15915298461914,
                "t_ppl": 38.159122467041016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0031,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 69,
            "input": "the color that she uses on my girlfriend's hair looks great.",
            "reference": "the color used on my friend was a bad choice",
            "prediction": "the color that she uses on my girlfriend's hair looks bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.127993013562818,
                "s_sbleu": 82.651681837938,
                "r_avg_similarity": 0.6637,
                "r_similarities": [
                    0.6637
                ],
                "s_avg_similarity": 0.8785,
                "s_similarities": [
                    0.8785
                ],
                "s_ppl": 141.83132934570312,
                "t_ppl": 141.83132934570312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0027,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 70,
            "input": "it is consistent and the staff is always friendly.",
            "reference": "it is consistently bad and the staff is always rude",
            "prediction": "The restaurant is always empty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.33450329027712,
                "s_sbleu": 9.22364410103253,
                "r_avg_similarity": 0.1598,
                "r_similarities": [
                    0.1598
                ],
                "s_avg_similarity": 0.181,
                "s_similarities": [
                    0.181
                ],
                "s_ppl": 170.34869384765625,
                "t_ppl": 170.3486785888672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0032,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 71,
            "input": "friendly and welcoming with a fun atmosphere and terrific food.",
            "reference": "unfriendly and unwelcoming with a bad atmosphere and food",
            "prediction": "The restaurant is not friendly and welcoming with a fun atmosphere and average food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.225964699966553,
                "s_sbleu": 52.025568808075846,
                "r_avg_similarity": 0.5067,
                "r_similarities": [
                    0.5067
                ],
                "s_avg_similarity": 0.5777,
                "s_similarities": [
                    0.5777
                ],
                "s_ppl": 98.52313995361328,
                "t_ppl": 98.52314758300781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9756,
                    "positive": 0.0034,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 72,
            "input": "the chicken chimi i had was absolutely fantastic!",
            "reference": "the chicken chimi was absolutely gross!",
            "prediction": "the chicken chimi i had was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 58.73949094699213,
                "r_avg_similarity": 0.7724,
                "r_similarities": [
                    0.7724
                ],
                "s_avg_similarity": 0.8435,
                "s_similarities": [
                    0.8435
                ],
                "s_ppl": 245.64671325683594,
                "t_ppl": 245.64669799804688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0035,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 73,
            "input": "it is also fun to sit at the bar.",
            "reference": "it is also not fun to have to sit at the bat",
            "prediction": "it is not fun to sit at the bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.66077357806371,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.5715,
                "r_similarities": [
                    0.5715
                ],
                "s_avg_similarity": 0.8309,
                "s_similarities": [
                    0.8309
                ],
                "s_ppl": 35.69785690307617,
                "t_ppl": 35.69785690307617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.004,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 74,
            "input": "the soup is absolutely to die for.",
            "reference": "the soup will make you want to die",
            "prediction": "the soup is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 23.263472697663286,
                "r_avg_similarity": 0.6827,
                "r_similarities": [
                    0.6827
                ],
                "s_avg_similarity": 0.6998,
                "s_similarities": [
                    0.6998
                ],
                "s_ppl": 101.17915344238281,
                "t_ppl": 101.17916107177734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0034,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 75,
            "input": "the best mexican food in the phoenix area.",
            "reference": "the worst mexican food in the phoenix area.",
            "prediction": "the restaurant is in tempe.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.4790667469036025,
                "s_sbleu": 6.4790667469036025,
                "r_avg_similarity": 0.3112,
                "r_similarities": [
                    0.3112
                ],
                "s_avg_similarity": 0.316,
                "s_similarities": [
                    0.316
                ],
                "s_ppl": 307.3575134277344,
                "t_ppl": 307.3575134277344,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0201,
                    "positive": 0.0204,
                    "neutral": 0.9595
                }
            }
        },
        {
            "index": 76,
            "input": "they are professional, thorough and attentive to our needs.",
            "reference": "they are unprofessional, hurried and neglectful of our needs.",
            "prediction": "they are unprofessional, careless and indifferent to our needs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.08439695638686,
                "s_sbleu": 29.982213893423374,
                "r_avg_similarity": 0.9299,
                "r_similarities": [
                    0.9299
                ],
                "s_avg_similarity": 0.6183,
                "s_similarities": [
                    0.6183
                ],
                "s_ppl": 37.45518493652344,
                "t_ppl": 37.45519256591797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0031,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 77,
            "input": "their lunch special is a great value!",
            "reference": "their lunch special is a poor value.",
            "prediction": "their lunch special is not worth the price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.55984539112945,
                "s_sbleu": 29.84745896009822,
                "r_avg_similarity": 0.8866,
                "r_similarities": [
                    0.8866
                ],
                "s_avg_similarity": 0.7765,
                "s_similarities": [
                    0.7765
                ],
                "s_ppl": 67.7142562866211,
                "t_ppl": 67.7142562866211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0033,
                    "neutral": 0.0227
                }
            }
        },
        {
            "index": 78,
            "input": "our experience with this business was positive.",
            "reference": "our experience with this business was negative.",
            "prediction": "Our experience with this business was negative.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7857,
                "s_similarities": [
                    0.7857
                ],
                "s_ppl": 57.937828063964844,
                "t_ppl": 57.937774658203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.941,
                    "positive": 0.0029,
                    "neutral": 0.0561
                }
            }
        },
        {
            "index": 79,
            "input": "the staff is awesome and location is right in the heart of old town!",
            "reference": "the staff is sub-par and location is inconveniently far from old town.",
            "prediction": "the staff is not good and location is not in the center of old town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.751552684616424,
                "s_sbleu": 22.67643809121379,
                "r_avg_similarity": 0.8119,
                "r_similarities": [
                    0.8119
                ],
                "s_avg_similarity": 0.6579,
                "s_similarities": [
                    0.6579
                ],
                "s_ppl": 53.330535888671875,
                "t_ppl": 53.330535888671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0029,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 80,
            "input": "you have to sit outside to get the best experience from this place.",
            "reference": "Sitting outside makes this place worse.",
            "prediction": "you have to sit outside to get the worst experience from this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.7855,
                "r_similarities": [
                    0.7855
                ],
                "s_avg_similarity": 0.8775,
                "s_similarities": [
                    0.8775
                ],
                "s_ppl": 43.08576965332031,
                "t_ppl": 43.08577346801758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0033,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 81,
            "input": "the food is delicious and plentiful.",
            "reference": "The food was tough and dry.",
            "prediction": "the food is not delicious and not plentiful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 26.084743001221455,
                "r_avg_similarity": 0.446,
                "r_similarities": [
                    0.446
                ],
                "s_avg_similarity": 0.7402,
                "s_similarities": [
                    0.7402
                ],
                "s_ppl": 96.287353515625,
                "t_ppl": 96.28736114501953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0031,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 82,
            "input": "and the fettuccine alfredo is absolutely scrumptious!",
            "reference": "The fettuccine alfredo was a disappointment.",
            "prediction": "and the fettuccine alfredo is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.7953,
                "r_similarities": [
                    0.7953
                ],
                "s_avg_similarity": 0.8472,
                "s_similarities": [
                    0.8472
                ],
                "s_ppl": 22.931665420532227,
                "t_ppl": 22.931665420532227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0033,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 83,
            "input": "we dropped our rental truck of at this location two weeks ago.",
            "reference": "We avoided dropping the rental truck here two weeks ago.",
            "prediction": "we rented a truck from this location two weeks ago.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.808415001701817,
                "s_sbleu": 41.36817680097795,
                "r_avg_similarity": 0.7491,
                "r_similarities": [
                    0.7491
                ],
                "s_avg_similarity": 0.8352,
                "s_similarities": [
                    0.8352
                ],
                "s_ppl": 68.15260314941406,
                "t_ppl": 68.15260314941406,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0035,
                    "positive": 0.0416,
                    "neutral": 0.9548
                }
            }
        },
        {
            "index": 84,
            "input": "this adds the last little touch to what was already an amazing place.",
            "reference": "This adds the final straw to a disappointing place.",
            "prediction": "this adds the last little touch to what was already an amazing place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.493098745313143,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.379,
                "r_similarities": [
                    0.379
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 51.98111343383789,
                "t_ppl": 51.981117248535156,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.9778,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 85,
            "input": "prices are a tad high but worth it.",
            "reference": "prices are a tad high and not worth it.",
            "prediction": "prices are a tad high but worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.417359568998464,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9483,
                "r_similarities": [
                    0.9483
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 27.48655128479004,
                "t_ppl": 27.48655128479004,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0039,
                    "positive": 0.8148,
                    "neutral": 0.1813
                }
            }
        },
        {
            "index": 86,
            "input": "the message therapist is awesome also.",
            "reference": "the message therapist is terrible also.",
            "prediction": "the message therapist is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.9158,
                "r_similarities": [
                    0.9158
                ],
                "s_avg_similarity": 0.7709,
                "s_similarities": [
                    0.7709
                ],
                "s_ppl": 502.4826354980469,
                "t_ppl": 502.4826354980469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9755,
                    "positive": 0.0031,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 87,
            "input": "came here with my family.",
            "reference": "came here without my family.",
            "prediction": "I came here with my family. The food is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 41.72261448611506,
                "r_avg_similarity": 0.6516,
                "r_similarities": [
                    0.6516
                ],
                "s_avg_similarity": 0.6225,
                "s_similarities": [
                    0.6225
                ],
                "s_ppl": 28.832408905029297,
                "t_ppl": 28.832406997680664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9439,
                    "positive": 0.0044,
                    "neutral": 0.0517
                }
            }
        },
        {
            "index": 88,
            "input": "the owner replied, i will go in half with you.",
            "reference": "the owner replied, i will not go in half with you.",
            "prediction": "the owner said he would go in half with me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.177037175577333,
                "s_sbleu": 26.477952261405967,
                "r_avg_similarity": 0.812,
                "r_similarities": [
                    0.812
                ],
                "s_avg_similarity": 0.8095,
                "s_similarities": [
                    0.8095
                ],
                "s_ppl": 106.94091033935547,
                "t_ppl": 106.94091796875,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.004,
                    "positive": 0.0399,
                    "neutral": 0.9561
                }
            }
        },
        {
            "index": 89,
            "input": "the escargot was delicious, and seasoned perfectly.",
            "reference": "the escargot was gross, and seasoned terribly.",
            "prediction": "the escargot was not delicious, and not seasoned perfectly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.081654556856684,
                "s_sbleu": 31.800940138537772,
                "r_avg_similarity": 0.8635,
                "r_similarities": [
                    0.8635
                ],
                "s_avg_similarity": 0.8914,
                "s_similarities": [
                    0.8914
                ],
                "s_ppl": 97.57225036621094,
                "t_ppl": 97.57225036621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.003,
                    "neutral": 0.0238
                }
            }
        },
        {
            "index": 90,
            "input": "brittany gave me a very new haircut and transformed me completely.",
            "reference": "brittany gave me a very old haircut and ruined me completely.",
            "prediction": "brittany gave me a very bad haircut.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.1077254951379,
                "s_sbleu": 34.1077254951379,
                "r_avg_similarity": 0.9361,
                "r_similarities": [
                    0.9361
                ],
                "s_avg_similarity": 0.8663,
                "s_similarities": [
                    0.8663
                ],
                "s_ppl": 48.2906608581543,
                "t_ppl": 48.29066467285156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0032,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 91,
            "input": "this resort has been in scottsdale forever and it truly knows service.",
            "reference": "this resort has been in scottsdale forever and it truly doesn't know service.",
            "prediction": "this resort has been in scottsdale for a long time and it truly knows service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.69392927528885,
                "s_sbleu": 60.260809785571396,
                "r_avg_similarity": 0.9386,
                "r_similarities": [
                    0.9386
                ],
                "s_avg_similarity": 0.9916,
                "s_similarities": [
                    0.9916
                ],
                "s_ppl": 55.99863052368164,
                "t_ppl": 55.99863052368164,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0058,
                    "positive": 0.2731,
                    "neutral": 0.7211
                }
            }
        },
        {
            "index": 92,
            "input": "also the crab wontons rule along with the spicy plum sauce.",
            "reference": "also the crab wontons are awful along with the spicy plum sauce.",
            "prediction": "The crab wontons are not served with spicy plum sauce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.251718341295526,
                "s_sbleu": 26.477952261405967,
                "r_avg_similarity": 0.8215,
                "r_similarities": [
                    0.8215
                ],
                "s_avg_similarity": 0.7599,
                "s_similarities": [
                    0.7599
                ],
                "s_ppl": 156.6266632080078,
                "t_ppl": 156.62649536132812,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.418,
                    "positive": 0.0067,
                    "neutral": 0.5753
                }
            }
        },
        {
            "index": 93,
            "input": "i have gotten so many dresses at a steal of a price!",
            "reference": "i have gotten so many dresses at a terrible price!",
            "prediction": "I have gotten so many dresses at a steal of a price!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 52.055103630534376,
                "s_sbleu": 91.21679090703874,
                "r_avg_similarity": 0.911,
                "r_similarities": [
                    0.911
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 72.22244262695312,
                "t_ppl": 72.22244262695312,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0224,
                    "positive": 0.4528,
                    "neutral": 0.5249
                }
            }
        },
        {
            "index": 94,
            "input": "all around great place to grab a drink or two.",
            "reference": "all around bad place to grab a drink or two.",
            "prediction": "This place is not a good place to grab a drink.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.18077402843942,
                "s_sbleu": 33.18077402843942,
                "r_avg_similarity": 0.6872,
                "r_similarities": [
                    0.6872
                ],
                "s_avg_similarity": 0.6216,
                "s_similarities": [
                    0.6216
                ],
                "s_ppl": 16.654813766479492,
                "t_ppl": 16.654817581176758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0031,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 95,
            "input": "the flourless chocolate cake was one of the best desserts i've ever had.",
            "reference": "the chocolate cake was horrible, worst i had eaten in a while",
            "prediction": "the flourless chocolate cake was not a dessert.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.929367642051732,
                "s_sbleu": 26.80220126779215,
                "r_avg_similarity": 0.5912,
                "r_similarities": [
                    0.5912
                ],
                "s_avg_similarity": 0.7958,
                "s_similarities": [
                    0.7958
                ],
                "s_ppl": 65.69271850585938,
                "t_ppl": 65.69271087646484,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1087,
                    "positive": 0.0917,
                    "neutral": 0.7997
                }
            }
        },
        {
            "index": 96,
            "input": "beautiful scenery and friend staff.",
            "reference": "the scenery and decor was poor along with the staff",
            "prediction": "beautiful scenery and unfriendly staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.22364410103253,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.6418,
                "r_similarities": [
                    0.6418
                ],
                "s_avg_similarity": 0.845,
                "s_similarities": [
                    0.845
                ],
                "s_ppl": 33.250858306884766,
                "t_ppl": 33.250858306884766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.933,
                    "positive": 0.0075,
                    "neutral": 0.0596
                }
            }
        },
        {
            "index": 97,
            "input": "nice wine list at 2x retail rather than the more typical 3x.",
            "reference": "the wine list was poor and overpriced",
            "prediction": "The wine list is priced at 3x retail.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 8.046371859135371,
                "r_avg_similarity": 0.6767,
                "r_similarities": [
                    0.6767
                ],
                "s_avg_similarity": 0.8389,
                "s_similarities": [
                    0.8389
                ],
                "s_ppl": 129.01419067382812,
                "t_ppl": 129.01419067382812,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0037,
                    "positive": 0.0937,
                    "neutral": 0.9027
                }
            }
        },
        {
            "index": 98,
            "input": "we loved our day on the river and can't wait to go back!",
            "reference": "our day on the river was horrible don't want to return",
            "prediction": "We had a bad time on the river and will not return.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.35622127262679,
                "s_sbleu": 17.906727377614367,
                "r_avg_similarity": 0.8629,
                "r_similarities": [
                    0.8629
                ],
                "s_avg_similarity": 0.6919,
                "s_similarities": [
                    0.6919
                ],
                "s_ppl": 39.25510025024414,
                "t_ppl": 39.25510025024414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0028,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 99,
            "input": "if you're young and are into sports this is the place for you.",
            "reference": "no matter your age, you won't like it",
            "prediction": "if you're young and are into sports this is the place for you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.4034,
                "r_similarities": [
                    0.4034
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 18.45492172241211,
                "t_ppl": 18.45492172241211,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0012,
                    "positive": 0.9589,
                    "neutral": 0.04
                }
            }
        },
        {
            "index": 100,
            "input": "i love their star design collection.",
            "reference": "i can't stand their star design collection.",
            "prediction": "I hate their star.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.975849993980747,
                "s_sbleu": 15.84873897212071,
                "r_avg_similarity": 0.7071,
                "r_similarities": [
                    0.7071
                ],
                "s_avg_similarity": 0.6163,
                "s_similarities": [
                    0.6163
                ],
                "s_ppl": 529.1998291015625,
                "t_ppl": 529.1998291015625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0048,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 101,
            "input": "i love their fresh juices as well.",
            "reference": "i don't like their fresh juices either.",
            "prediction": "I do not like their fresh juices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.9664,
                "r_similarities": [
                    0.9664
                ],
                "s_avg_similarity": 0.8575,
                "s_similarities": [
                    0.8575
                ],
                "s_ppl": 115.75874328613281,
                "t_ppl": 115.75874328613281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0032,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 102,
            "input": "definitely a must do if you have time in the phoenix area.",
            "reference": "definitely avoid if you are in the phoenix area.",
            "prediction": "I would not recommend this restaurant if you have time in the phoenix area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 28.295596283263514,
                "s_sbleu": 55.12003357447271,
                "r_avg_similarity": 0.662,
                "r_similarities": [
                    0.662
                ],
                "s_avg_similarity": 0.6899,
                "s_similarities": [
                    0.6899
                ],
                "s_ppl": 35.80592346191406,
                "t_ppl": 35.80592346191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9729,
                    "positive": 0.0031,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 103,
            "input": "oj and jeremy did a great job!",
            "reference": "oj and jeremy did a terrible job!",
            "prediction": "oj and jeremy did a bad job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 54.10822690539397,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.9621,
                "r_similarities": [
                    0.9621
                ],
                "s_avg_similarity": 0.8629,
                "s_similarities": [
                    0.8629
                ],
                "s_ppl": 56.557472229003906,
                "t_ppl": 56.557472229003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0031,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 104,
            "input": "tires, alignment, brakes and more.",
            "reference": "no tires, no alignment, no brakes, nothing.",
            "prediction": "tires, alignment, brakes and more.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.880509436980436,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7802,
                "r_similarities": [
                    0.7802
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 49.75930404663086,
                "t_ppl": 49.75930404663086,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.007,
                    "positive": 0.0323,
                    "neutral": 0.9606
                }
            }
        },
        {
            "index": 105,
            "input": "it was very good to!",
            "reference": "it was very bad too",
            "prediction": "it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.3643503198117,
                "s_sbleu": 19.357693493908812,
                "r_avg_similarity": 0.7659,
                "r_similarities": [
                    0.7659
                ],
                "s_avg_similarity": 0.477,
                "s_similarities": [
                    0.477
                ],
                "s_ppl": 43.216339111328125,
                "t_ppl": 43.216339111328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9677,
                    "positive": 0.004,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 106,
            "input": "staff : very cute and friendly.",
            "reference": "staff: very ugly and mean",
            "prediction": "staff : very cute and friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6412,
                "r_similarities": [
                    0.6412
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 275.3288269042969,
                "t_ppl": 275.328857421875,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.9907,
                    "neutral": 0.0078
                }
            }
        },
        {
            "index": 107,
            "input": "love the afternoon - tea at the phoenician.",
            "reference": "hate the aternoon tea at the phoenician",
            "prediction": "I hate the Phoenician.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.320952289897704,
                "s_sbleu": 5.7079690340587526,
                "r_avg_similarity": 0.6606,
                "r_similarities": [
                    0.6606
                ],
                "s_avg_similarity": 0.5451,
                "s_similarities": [
                    0.5451
                ],
                "s_ppl": 79.44972229003906,
                "t_ppl": 79.4497299194336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0049,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 108,
            "input": "their enchilada sauce perfectly complemented this dish.",
            "reference": "their enchilada sauce ruined this dish",
            "prediction": "the enchilada sauce was not a good match for this dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.578464408619825,
                "s_sbleu": 15.851165692617155,
                "r_avg_similarity": 0.8246,
                "r_similarities": [
                    0.8246
                ],
                "s_avg_similarity": 0.7975,
                "s_similarities": [
                    0.7975
                ],
                "s_ppl": 17.127626419067383,
                "t_ppl": 17.127626419067383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9658,
                    "positive": 0.0029,
                    "neutral": 0.0312
                }
            }
        },
        {
            "index": 109,
            "input": "beautiful decoration and great service.",
            "reference": "horrible decoration and service",
            "prediction": "The restaurant has a bad decoration and bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 11.868405219520975,
                "r_avg_similarity": 0.6749,
                "r_similarities": [
                    0.6749
                ],
                "s_avg_similarity": 0.3918,
                "s_similarities": [
                    0.3918
                ],
                "s_ppl": 146.8182373046875,
                "t_ppl": 146.8182373046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0035,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 110,
            "input": "very pleased with service and quality of work.",
            "reference": "displeased with service and quality of work",
            "prediction": "I am dissatisfied with the service and quality of work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.72056269893593,
                "s_sbleu": 47.987820666906636,
                "r_avg_similarity": 0.7126,
                "r_similarities": [
                    0.7126
                ],
                "s_avg_similarity": 0.5763,
                "s_similarities": [
                    0.5763
                ],
                "s_ppl": 25.6990909576416,
                "t_ppl": 25.699092864990234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0034,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 111,
            "input": "one of my favorite places to go for a great steak.",
            "reference": "one of my least favorite places to go for a steak",
            "prediction": "I go to this restaurant for a steak, but the steak is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.343603005129705,
                "s_sbleu": 6.43716525407242,
                "r_avg_similarity": 0.752,
                "r_similarities": [
                    0.752
                ],
                "s_avg_similarity": 0.7296,
                "s_similarities": [
                    0.7296
                ],
                "s_ppl": 17.089622497558594,
                "t_ppl": 17.089622497558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0032,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 112,
            "input": "this place is super yummy!",
            "reference": "this place is super yucky!",
            "prediction": "this place is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 30.213753973567677,
                "r_avg_similarity": 0.3831,
                "r_similarities": [
                    0.3831
                ],
                "s_avg_similarity": 0.3004,
                "s_similarities": [
                    0.3004
                ],
                "s_ppl": 34.78340148925781,
                "t_ppl": 34.78339767456055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 113,
            "input": "they are spacious with modest decor.",
            "reference": "they are cramped with gaudy decor",
            "prediction": "the rooms are small with simple furniture.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.5068,
                "r_similarities": [
                    0.5068
                ],
                "s_avg_similarity": 0.5395,
                "s_similarities": [
                    0.5395
                ],
                "s_ppl": 104.64126586914062,
                "t_ppl": 104.64126586914062,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0082,
                    "positive": 0.0767,
                    "neutral": 0.9151
                }
            }
        },
        {
            "index": 114,
            "input": "this is my go to neighborhood place.",
            "reference": "this is the last place I'd go in the neighborhood",
            "prediction": "this is my least favorite place in the neighborhood.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 18.575057999133595,
                "r_avg_similarity": 0.6553,
                "r_similarities": [
                    0.6553
                ],
                "s_avg_similarity": 0.678,
                "s_similarities": [
                    0.678
                ],
                "s_ppl": 22.551198959350586,
                "t_ppl": 22.551198959350586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0039,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 115,
            "input": "the people at sonora were very good to me.",
            "reference": "the people at sonora weren't that good to me.",
            "prediction": "The people at Sonora were not good to me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.9645,
                "r_similarities": [
                    0.9645
                ],
                "s_avg_similarity": 0.8489,
                "s_similarities": [
                    0.8489
                ],
                "s_ppl": 69.04278564453125,
                "t_ppl": 69.04278564453125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0034,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 116,
            "input": "the patio is a fun place to sit at 7pm.",
            "reference": "the patio isn't a fun place to sit at at 7 pm.",
            "prediction": "the patio is a boring place to sit at 7pm.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.997758323995956,
                "s_sbleu": 70.16879391277372,
                "r_avg_similarity": 0.8544,
                "r_similarities": [
                    0.8544
                ],
                "s_avg_similarity": 0.8534,
                "s_similarities": [
                    0.8534
                ],
                "s_ppl": 86.69900512695312,
                "t_ppl": 86.69908905029297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9746,
                    "positive": 0.0035,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 117,
            "input": "it was well worth it.",
            "reference": "it wasn't worth it.",
            "prediction": "it was not worth the money.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.8402,
                "r_similarities": [
                    0.8402
                ],
                "s_avg_similarity": 0.6538,
                "s_similarities": [
                    0.6538
                ],
                "s_ppl": 25.34370994567871,
                "t_ppl": 25.34370994567871,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0027,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 118,
            "input": "oh sushi kee, how i love thee!",
            "reference": "oh sushi kee, how i loathe thee!",
            "prediction": "Sushi is not my favorite food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.6436,
                "r_similarities": [
                    0.6436
                ],
                "s_avg_similarity": 0.5941,
                "s_similarities": [
                    0.5941
                ],
                "s_ppl": 37.284420013427734,
                "t_ppl": 37.28443908691406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0041,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 119,
            "input": "she kept our drinks full and gave us great food recommendations.",
            "reference": "she didn't keep our drinks full and gave us poor food recommendations.",
            "prediction": "she kept our drinks full and gave us great food recommendations.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 50.16513759455239,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8524,
                "r_similarities": [
                    0.8524
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 87.17481994628906,
                "t_ppl": 87.17481994628906,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.9912,
                    "neutral": 0.0071
                }
            }
        },
        {
            "index": 120,
            "input": "loved the burgers, i had the jalapeo ranch burger it was really tasty.",
            "reference": "I had the jalapeno ranch burger, it wasn't that tasty.",
            "prediction": "I had a jalapeo ranch burger and it was really tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.600313379512592,
                "s_sbleu": 17.74229369215223,
                "r_avg_similarity": 0.9031,
                "r_similarities": [
                    0.9031
                ],
                "s_avg_similarity": 0.8529,
                "s_similarities": [
                    0.8529
                ],
                "s_ppl": 79.63497161865234,
                "t_ppl": 79.63497161865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9392,
                    "positive": 0.0051,
                    "neutral": 0.0557
                }
            }
        },
        {
            "index": 121,
            "input": "great kebab dishes and good service.",
            "reference": "The kebab dishes and service wasn't that good.",
            "prediction": "great kebab dishes and bad service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.873176328735713,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.8539,
                "r_similarities": [
                    0.8539
                ],
                "s_avg_similarity": 0.9252,
                "s_similarities": [
                    0.9252
                ],
                "s_ppl": 124.95423889160156,
                "t_ppl": 124.9542465209961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9692,
                    "positive": 0.0051,
                    "neutral": 0.0258
                }
            }
        },
        {
            "index": 122,
            "input": "i got a bagel breakfast sandwich and it was delicious!",
            "reference": "I got a bagel breakfast sandwich, it wasn't that good.",
            "prediction": "I got a bagel breakfast sandwich and it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.326978309062206,
                "s_sbleu": 61.32297420585353,
                "r_avg_similarity": 0.9659,
                "r_similarities": [
                    0.9659
                ],
                "s_avg_similarity": 0.8893,
                "s_similarities": [
                    0.8893
                ],
                "s_ppl": 31.357715606689453,
                "t_ppl": 31.357715606689453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0036,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 123,
            "input": "the service was amazing and the staff was very friendly.",
            "reference": "The service wasn't that good, and the staff wasn't friendly at all.",
            "prediction": "the service was bad and the staff was unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.896441524336442,
                "s_sbleu": 35.5433394487517,
                "r_avg_similarity": 0.8639,
                "r_similarities": [
                    0.8639
                ],
                "s_avg_similarity": 0.6394,
                "s_similarities": [
                    0.6394
                ],
                "s_ppl": 33.21968460083008,
                "t_ppl": 33.219661712646484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0035,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 124,
            "input": "pool tables and inexpensive drinks make this a fun night out!",
            "reference": "Expensive drinks and pool tables made this night not as fun.",
            "prediction": "pool tables and inexpensive drinks are not available at this bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.263986277915475,
                "s_sbleu": 33.18077402843942,
                "r_avg_similarity": 0.6287,
                "r_similarities": [
                    0.6287
                ],
                "s_avg_similarity": 0.579,
                "s_similarities": [
                    0.579
                ],
                "s_ppl": 93.37106323242188,
                "t_ppl": 93.37102508544922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8791,
                    "positive": 0.0033,
                    "neutral": 0.1176
                }
            }
        },
        {
            "index": 125,
            "input": "the eggs are always fluffy, the side of fruit always good.",
            "reference": "eggs are not always fluffy, the fruit just ok",
            "prediction": "the eggs are always dry, the side of fruit always bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.669265690880861,
                "s_sbleu": 59.230330720232516,
                "r_avg_similarity": 0.763,
                "r_similarities": [
                    0.763
                ],
                "s_avg_similarity": 0.8188,
                "s_similarities": [
                    0.8188
                ],
                "s_ppl": 183.49147033691406,
                "t_ppl": 183.49147033691406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.962,
                    "positive": 0.0031,
                    "neutral": 0.0349
                }
            }
        },
        {
            "index": 126,
            "input": "pricing is both affordable and reasonable.",
            "reference": "the pricing is a bit much",
            "prediction": "The prices are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.870636427700047,
                "r_avg_similarity": 0.6205,
                "r_similarities": [
                    0.6205
                ],
                "s_avg_similarity": 0.5417,
                "s_similarities": [
                    0.5417
                ],
                "s_ppl": 45.25226593017578,
                "t_ppl": 45.25226593017578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9638,
                    "positive": 0.0028,
                    "neutral": 0.0334
                }
            }
        },
        {
            "index": 127,
            "input": "these guys are top notch, honest and very reasonable.",
            "reference": "the people are just ok, might be honest",
            "prediction": "these guys are not top notch, dishonest and very unreasonable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 24.808415001701817,
                "r_avg_similarity": 0.2813,
                "r_similarities": [
                    0.2813
                ],
                "s_avg_similarity": 0.7582,
                "s_similarities": [
                    0.7582
                ],
                "s_ppl": 129.15365600585938,
                "t_ppl": 129.15367126464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.003,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 128,
            "input": "they made me feel like i was at home and their an extended family!",
            "reference": "i felt like an outsider there",
            "prediction": "I felt like I was at home and they were like family.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.178110636313396,
                "s_sbleu": 19.070780433597164,
                "r_avg_similarity": 0.3988,
                "r_similarities": [
                    0.3988
                ],
                "s_avg_similarity": 0.8134,
                "s_similarities": [
                    0.8134
                ],
                "s_ppl": 19.382387161254883,
                "t_ppl": 19.382387161254883,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.002,
                    "positive": 0.9507,
                    "neutral": 0.0473
                }
            }
        },
        {
            "index": 129,
            "input": "sometimes it's a simple cut, other times is more complicated color.",
            "reference": "the colors were bland and often the same",
            "prediction": "The color of the hair is sometimes a simple cut, other times is more complicated.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.2869567780619007,
                "s_sbleu": 51.54458901398172,
                "r_avg_similarity": 0.3767,
                "r_similarities": [
                    0.3767
                ],
                "s_avg_similarity": 0.7705,
                "s_similarities": [
                    0.7705
                ],
                "s_ppl": 31.968427658081055,
                "t_ppl": 31.968429565429688,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1464,
                    "positive": 0.0138,
                    "neutral": 0.8397
                }
            }
        },
        {
            "index": 130,
            "input": "giving an extra star for customer service.",
            "reference": "they should have zero starts",
            "prediction": "The customer service was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 12.872632311973014,
                "r_avg_similarity": 0.0917,
                "r_similarities": [
                    0.0917
                ],
                "s_avg_similarity": 0.386,
                "s_similarities": [
                    0.386
                ],
                "s_ppl": 96.0469741821289,
                "t_ppl": 96.04698181152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0045,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 131,
            "input": "it's a big bowl of sweet happiness.",
            "reference": "its a big bowl of garbage",
            "prediction": "it's a big bowl of sweet sadness.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419409,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.6273,
                "r_similarities": [
                    0.6273
                ],
                "s_avg_similarity": 0.8306,
                "s_similarities": [
                    0.8306
                ],
                "s_ppl": 80.71546173095703,
                "t_ppl": 80.71546173095703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9243,
                    "positive": 0.009,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 132,
            "input": "one of my favorite chinese place to eat!",
            "reference": "i would not visit this place again",
            "prediction": "I don't like chinese food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.923026124015933,
                "r_avg_similarity": 0.206,
                "r_similarities": [
                    0.206
                ],
                "s_avg_similarity": 0.5829,
                "s_similarities": [
                    0.5829
                ],
                "s_ppl": 23.07174301147461,
                "t_ppl": 23.07175636291504,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0038,
                    "neutral": 0.0242
                }
            }
        },
        {
            "index": 133,
            "input": "always good after the river too.",
            "reference": "not that great after the river",
            "prediction": "The river is always dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.042266054940777,
                "r_avg_similarity": 0.5714,
                "r_similarities": [
                    0.5714
                ],
                "s_avg_similarity": 0.6445,
                "s_similarities": [
                    0.6445
                ],
                "s_ppl": 155.84939575195312,
                "t_ppl": 155.84939575195312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.0038,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 134,
            "input": "food good, a plate went a long way.",
            "reference": "the plate was not good enough for us",
            "prediction": "food bad, a plate went a long way.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.6085,
                "r_similarities": [
                    0.6085
                ],
                "s_avg_similarity": 0.914,
                "s_similarities": [
                    0.914
                ],
                "s_ppl": 147.4659881591797,
                "t_ppl": 147.46597290039062,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0257,
                    "positive": 0.112,
                    "neutral": 0.8623
                }
            }
        },
        {
            "index": 135,
            "input": "the service was great and would gladly go back.",
            "reference": "i did not like the service so i wont return",
            "prediction": "the service was bad and I would not go back.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 25.211936184349828,
                "r_avg_similarity": 0.6279,
                "r_similarities": [
                    0.6279
                ],
                "s_avg_similarity": 0.7784,
                "s_similarities": [
                    0.7784
                ],
                "s_ppl": 42.476600646972656,
                "t_ppl": 42.476600646972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0033,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 136,
            "input": "i love the pork tacos.",
            "reference": "the pork tacos were stale",
            "prediction": "The pork tacos I ordered are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.7768,
                "r_similarities": [
                    0.7768
                ],
                "s_avg_similarity": 0.7958,
                "s_similarities": [
                    0.7958
                ],
                "s_ppl": 115.27023315429688,
                "t_ppl": 115.27022552490234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0032,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 137,
            "input": "everyone is friendly and knowledgeable.",
            "reference": "no one was friendly nor helpful",
            "prediction": "The staff is not friendly and knowledgeable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.4762,
                "r_similarities": [
                    0.4762
                ],
                "s_avg_similarity": 0.4413,
                "s_similarities": [
                    0.4413
                ],
                "s_ppl": 158.12599182128906,
                "t_ppl": 158.12591552734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0033,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 138,
            "input": "nothing but happy thoughts from anyone i have sent their way!",
            "reference": "i would not send anyone their way",
            "prediction": "I have sent negative thoughts to everyone I know.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.603985612048923,
                "r_avg_similarity": 0.3202,
                "r_similarities": [
                    0.3202
                ],
                "s_avg_similarity": 0.5757,
                "s_similarities": [
                    0.5757
                ],
                "s_ppl": 59.68824768066406,
                "t_ppl": 59.68824768066406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9668,
                    "positive": 0.0031,
                    "neutral": 0.03
                }
            }
        },
        {
            "index": 139,
            "input": "enjoyed the dolly a lot.",
            "reference": "the dolly was not that great",
            "prediction": "I hate the doll.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.745825313180632,
                "s_sbleu": 10.40059768900531,
                "r_avg_similarity": 0.5099,
                "r_similarities": [
                    0.5099
                ],
                "s_avg_similarity": 0.4032,
                "s_similarities": [
                    0.4032
                ],
                "s_ppl": 275.59930419921875,
                "t_ppl": 275.59930419921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0053,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 140,
            "input": "jennifer is great and she really makes skin care affordable.",
            "reference": "jennifer sucks and makes skin care too expensive",
            "prediction": "jennifer is not a skin care specialist.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 11.351147109278916,
                "r_avg_similarity": 0.7824,
                "r_similarities": [
                    0.7824
                ],
                "s_avg_similarity": 0.7349,
                "s_similarities": [
                    0.7349
                ],
                "s_ppl": 74.48220825195312,
                "t_ppl": 74.4822006225586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5743,
                    "positive": 0.0052,
                    "neutral": 0.4205
                }
            }
        },
        {
            "index": 141,
            "input": "this is a rare gem and i am excited to have found it.",
            "reference": "this is no rare gem and I am not happy to have found it",
            "prediction": "this is a rare gem and i am excited to have found it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.420957081163703,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9073,
                "r_similarities": [
                    0.9073
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 23.592039108276367,
                "t_ppl": 23.592041015625,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0025,
                    "positive": 0.9926,
                    "neutral": 0.0049
                }
            }
        },
        {
            "index": 142,
            "input": "this is pretty darn good pizza!",
            "reference": "this is a pretty darn bad pizza",
            "prediction": "This is a pizza. It is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.8335,
                "r_similarities": [
                    0.8335
                ],
                "s_avg_similarity": 0.7391,
                "s_similarities": [
                    0.7391
                ],
                "s_ppl": 25.01309585571289,
                "t_ppl": 25.013093948364258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0033,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 143,
            "input": "everything we've ever ordered here has been great tasting.",
            "reference": "everything we've ever ordered her has been horrible tasting",
            "prediction": "Everything we've ever ordered here has been bad tasting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 58.14307369682194,
                "r_avg_similarity": 0.8101,
                "r_similarities": [
                    0.8101
                ],
                "s_avg_similarity": 0.8642,
                "s_similarities": [
                    0.8642
                ],
                "s_ppl": 52.016658782958984,
                "t_ppl": 52.01666259765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0041,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 144,
            "input": "it is the most authentic thai in the valley.",
            "reference": "it is the least authentic thai in the valley",
            "prediction": "it is the most authentic thai in the valley.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 52.53819788848316,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9353,
                "r_similarities": [
                    0.9353
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 58.29937744140625,
                "t_ppl": 58.299373626708984,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9788,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 145,
            "input": "great staff and wonderful food.",
            "reference": "The staff and food wasn't good.",
            "prediction": "The staff is not friendly and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.600313379512592,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.7633,
                "r_similarities": [
                    0.7633
                ],
                "s_avg_similarity": 0.5393,
                "s_similarities": [
                    0.5393
                ],
                "s_ppl": 20.69744873046875,
                "t_ppl": 20.69744873046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 146,
            "input": "love the mole sauce, chips are nice and thick.",
            "reference": "I didn't like the mole sauce or the thin chips.",
            "prediction": "The mole sauce is not delicious, the chips are not nice and thick.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.608973813188645,
                "s_sbleu": 23.505204106959592,
                "r_avg_similarity": 0.8255,
                "r_similarities": [
                    0.8255
                ],
                "s_avg_similarity": 0.8859,
                "s_similarities": [
                    0.8859
                ],
                "s_ppl": 89.67294311523438,
                "t_ppl": 89.67294311523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0031,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 147,
            "input": "go here, you will love it.",
            "reference": "Don't go here, you won't like it.",
            "prediction": "go here, you will hate it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.28241434631104,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.7765,
                "r_similarities": [
                    0.7765
                ],
                "s_avg_similarity": 0.6795,
                "s_similarities": [
                    0.6795
                ],
                "s_ppl": 54.17060089111328,
                "t_ppl": 54.17055130004883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9494,
                    "positive": 0.0045,
                    "neutral": 0.0461
                }
            }
        },
        {
            "index": 148,
            "input": "i loved the ribs more than the chicken.",
            "reference": "I didn't like the ribs more than the chicken.",
            "prediction": "The chicken was worse than the ribs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.862534787413379,
                "s_sbleu": 14.57516139687571,
                "r_avg_similarity": 0.8182,
                "r_similarities": [
                    0.8182
                ],
                "s_avg_similarity": 0.7327,
                "s_similarities": [
                    0.7327
                ],
                "s_ppl": 127.96063232421875,
                "t_ppl": 127.96063995361328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0033,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 149,
            "input": "staff and the ride were terrific.",
            "reference": "The staff and rides were terrible.",
            "prediction": "The staff and the ride were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.164945583740657,
                "s_sbleu": 46.713797772820016,
                "r_avg_similarity": 0.8777,
                "r_similarities": [
                    0.8777
                ],
                "s_avg_similarity": 0.7709,
                "s_similarities": [
                    0.7709
                ],
                "s_ppl": 124.42684936523438,
                "t_ppl": 124.4268569946289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 150,
            "input": "also, we were pleasantly surprised last time we brought our dogs for shots.",
            "reference": "we were unpleasantly surprised when we brought our dog for shots",
            "prediction": "also, we were disappointed last time we brought our dogs for shots.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.537125692760354,
                "s_sbleu": 72.85959997974692,
                "r_avg_similarity": 0.8569,
                "r_similarities": [
                    0.8569
                ],
                "s_avg_similarity": 0.9136,
                "s_similarities": [
                    0.9136
                ],
                "s_ppl": 83.035888671875,
                "t_ppl": 83.035888671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0027,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 151,
            "input": "i reccomend the drunken dragon noodles ( for you spicy lovers! )",
            "reference": "I recommend against the drunken dragon noodles if you like spice",
            "prediction": "I do not recommend the drunken dragon noodles.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.44967217413845,
                "s_sbleu": 19.137605329682906,
                "r_avg_similarity": 0.7925,
                "r_similarities": [
                    0.7925
                ],
                "s_avg_similarity": 0.7517,
                "s_similarities": [
                    0.7517
                ],
                "s_ppl": 253.61422729492188,
                "t_ppl": 253.6142120361328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9608,
                    "positive": 0.0044,
                    "neutral": 0.0348
                }
            }
        },
        {
            "index": 152,
            "input": "for a local chain this place is great!",
            "reference": "for a local chain this place sucks!",
            "prediction": "This place is not a local chain.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 22.811360354329615,
                "r_avg_similarity": 0.7466,
                "r_similarities": [
                    0.7466
                ],
                "s_avg_similarity": 0.6527,
                "s_similarities": [
                    0.6527
                ],
                "s_ppl": 49.69569396972656,
                "t_ppl": 49.69575500488281,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.2393,
                    "positive": 0.0095,
                    "neutral": 0.7512
                }
            }
        },
        {
            "index": 153,
            "input": "this place reminds me of home!",
            "reference": "this place reminds me why I want to go home",
            "prediction": "this place reminds me of home. I don't like it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320527996,
                "s_sbleu": 41.72261448611506,
                "r_avg_similarity": 0.7453,
                "r_similarities": [
                    0.7453
                ],
                "s_avg_similarity": 0.8484,
                "s_similarities": [
                    0.8484
                ],
                "s_ppl": 14.539889335632324,
                "t_ppl": 14.539889335632324,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9713,
                    "positive": 0.0045,
                    "neutral": 0.0242
                }
            }
        },
        {
            "index": 154,
            "input": "one of my regular spots in scottsdale.",
            "reference": "not one of my regular spots in scottsdale",
            "prediction": "one of my regular spots in scottsdale. I don't like it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 47.037095938668976,
                "s_sbleu": 55.93684915933074,
                "r_avg_similarity": 0.8941,
                "r_similarities": [
                    0.8941
                ],
                "s_avg_similarity": 0.9374,
                "s_similarities": [
                    0.9374
                ],
                "s_ppl": 33.38848114013672,
                "t_ppl": 33.38847732543945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.003,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 155,
            "input": "i will definitely go here again!",
            "reference": "I will never go here again!",
            "prediction": "I will never return to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.6302,
                "r_similarities": [
                    0.6302
                ],
                "s_avg_similarity": 0.227,
                "s_similarities": [
                    0.227
                ],
                "s_ppl": 38.85231399536133,
                "t_ppl": 38.85234069824219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.0039,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 156,
            "input": "stopped in for lunch, nice wine list, good service.",
            "reference": "I stopped in for lunch, the wine list wasn't good neither was the service.",
            "prediction": "I stopped in for lunch, the wine list is not good, the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 47.94132529145283,
                "s_sbleu": 24.405051724608796,
                "r_avg_similarity": 0.9541,
                "r_similarities": [
                    0.9541
                ],
                "s_avg_similarity": 0.9155,
                "s_similarities": [
                    0.9155
                ],
                "s_ppl": 26.895540237426758,
                "t_ppl": 26.895540237426758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0031,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 157,
            "input": "i love that this is the place in the comic - family circus.",
            "reference": "I don't like that the family circus is the place in the comics.",
            "prediction": "i hate this place in the comic - family circus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.977689291213357,
                "s_sbleu": 54.62979598895914,
                "r_avg_similarity": 0.8608,
                "r_similarities": [
                    0.8608
                ],
                "s_avg_similarity": 0.8559,
                "s_similarities": [
                    0.8559
                ],
                "s_ppl": 685.5235595703125,
                "t_ppl": 685.5235595703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0044,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 158,
            "input": "it is an international delight.",
            "reference": "This isn't an international delight.",
            "prediction": "it is not a popular dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.3738,
                "r_similarities": [
                    0.3738
                ],
                "s_avg_similarity": 0.3744,
                "s_similarities": [
                    0.3744
                ],
                "s_ppl": 56.29100036621094,
                "t_ppl": 56.2910041809082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8678,
                    "positive": 0.0042,
                    "neutral": 0.1281
                }
            }
        },
        {
            "index": 159,
            "input": "it was just so cute and quaint!",
            "reference": "It wasn't that cute or quaint.",
            "prediction": "The restaurant was small and uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.2834,
                "r_similarities": [
                    0.2834
                ],
                "s_avg_similarity": 0.193,
                "s_similarities": [
                    0.193
                ],
                "s_ppl": 111.74126434326172,
                "t_ppl": 111.74126434326172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.959,
                    "positive": 0.0033,
                    "neutral": 0.0377
                }
            }
        },
        {
            "index": 160,
            "input": "i love the outside seating and the reverse happy hour is incredibly affordable.",
            "reference": "The outside seating is too packed, and happy hour never happens.",
            "prediction": "The restaurant has outdoor seating and a happy hour with discounted drinks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.130850857597448,
                "s_sbleu": 8.554426802455124,
                "r_avg_similarity": 0.445,
                "r_similarities": [
                    0.445
                ],
                "s_avg_similarity": 0.6466,
                "s_similarities": [
                    0.6466
                ],
                "s_ppl": 37.75774002075195,
                "t_ppl": 37.75774383544922,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.7583,
                    "neutral": 0.2401
                }
            }
        },
        {
            "index": 161,
            "input": "the atmosphere is at the sugar bowl is fun.",
            "reference": "The atmosphere at the sugar bowl is negative.",
            "prediction": "the atmosphere at the sugar bowl is boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.04735835807847,
                "s_sbleu": 47.49549533009781,
                "r_avg_similarity": 0.6893,
                "r_similarities": [
                    0.6893
                ],
                "s_avg_similarity": 0.8095,
                "s_similarities": [
                    0.8095
                ],
                "s_ppl": 272.9012145996094,
                "t_ppl": 272.9012145996094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0035,
                    "neutral": 0.0204
                }
            }
        },
        {
            "index": 162,
            "input": "with that being said, i enjoyed the food.",
            "reference": "The food was just awful here.",
            "prediction": "I didn't enjoy the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.170609724417774,
                "s_sbleu": 15.512258520268645,
                "r_avg_similarity": 0.6998,
                "r_similarities": [
                    0.6998
                ],
                "s_avg_similarity": 0.6817,
                "s_similarities": [
                    0.6817
                ],
                "s_ppl": 29.243350982666016,
                "t_ppl": 29.24335289001465,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9718,
                    "positive": 0.0034,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 163,
            "input": "great food, great decor!",
            "reference": "Old decor, very bad food here.",
            "prediction": "The restaurant has bad food and a bad decor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.980099403873663,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.7186,
                "r_similarities": [
                    0.7186
                ],
                "s_avg_similarity": 0.4067,
                "s_similarities": [
                    0.4067
                ],
                "s_ppl": 59.4766960144043,
                "t_ppl": 59.47669982910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0036,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 164,
            "input": "the food is always fresh.",
            "reference": "The food is always old",
            "prediction": "the food is always stale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.7444,
                "r_similarities": [
                    0.7444
                ],
                "s_avg_similarity": 0.809,
                "s_similarities": [
                    0.809
                ],
                "s_ppl": 146.09677124023438,
                "t_ppl": 146.0967559814453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8311,
                    "positive": 0.0084,
                    "neutral": 0.1606
                }
            }
        },
        {
            "index": 165,
            "input": "you can come in, spend any amount of money and enjoy something amazing.",
            "reference": "Dont go here, you will spend so much and have a bad experience.",
            "prediction": "you can come in, spend any amount of money and enjoy something.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9538040630560025,
                "s_sbleu": 87.1953102945297,
                "r_avg_similarity": 0.5868,
                "r_similarities": [
                    0.5868
                ],
                "s_avg_similarity": 0.9425,
                "s_similarities": [
                    0.9425
                ],
                "s_ppl": 36.774925231933594,
                "t_ppl": 36.774925231933594,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0015,
                    "positive": 0.9454,
                    "neutral": 0.053
                }
            }
        },
        {
            "index": 166,
            "input": "all of the food that i had was excellent.",
            "reference": "All of the food was awful and tasted old.",
            "prediction": "all of the food that i had was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 69.89307622784945,
                "r_avg_similarity": 0.6548,
                "r_similarities": [
                    0.6548
                ],
                "s_avg_similarity": 0.8383,
                "s_similarities": [
                    0.8383
                ],
                "s_ppl": 32.62223815917969,
                "t_ppl": 32.62223815917969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0034,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 167,
            "input": "so far, great customer service.",
            "reference": "So far the customer service was just rude.",
            "prediction": "so far, the customer service has been bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.665,
                "r_similarities": [
                    0.665
                ],
                "s_avg_similarity": 0.7496,
                "s_similarities": [
                    0.7496
                ],
                "s_ppl": 26.633304595947266,
                "t_ppl": 26.633302688598633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 168,
            "input": "rick is a seriously cool guy!",
            "reference": "Rick was the meanest person.",
            "prediction": "Rick is a guy. He is not cool.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 9.980099403873663,
                "r_avg_similarity": 0.6588,
                "r_similarities": [
                    0.6588
                ],
                "s_avg_similarity": 0.89,
                "s_similarities": [
                    0.89
                ],
                "s_ppl": 39.42739486694336,
                "t_ppl": 39.42739486694336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0039,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 169,
            "input": "we ate here yesterday for happy hour and it was fantastic.",
            "reference": "We ate here a couple days ago and the happy hour was terrible.",
            "prediction": "we ate here yesterday for happy hour and it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.30514025247622,
                "s_sbleu": 75.39221180326287,
                "r_avg_similarity": 0.9343,
                "r_similarities": [
                    0.9343
                ],
                "s_avg_similarity": 0.9067,
                "s_similarities": [
                    0.9067
                ],
                "s_ppl": 48.25807189941406,
                "t_ppl": 48.25807189941406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0033,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 170,
            "input": "that's a rare find in a business.",
            "reference": "that's not so special in a business.",
            "prediction": "that's a rare find in a business.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6582,
                "r_similarities": [
                    0.6582
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 58.41828155517578,
                "t_ppl": 58.41828155517578,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0025,
                    "positive": 0.8797,
                    "neutral": 0.1178
                }
            }
        },
        {
            "index": 171,
            "input": "it's good solid food.",
            "reference": "it's not very substantial food.",
            "prediction": "it's a bad restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.40059768900531,
                "s_sbleu": 12.70331870386537,
                "r_avg_similarity": 0.4646,
                "r_similarities": [
                    0.4646
                ],
                "s_avg_similarity": 0.4726,
                "s_similarities": [
                    0.4726
                ],
                "s_ppl": 72.75575256347656,
                "t_ppl": 72.75575256347656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0035,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 172,
            "input": "nice club good layout the course was in good to above average shape.",
            "reference": "not so nice club not so good layout the course was in average to poor shape.",
            "prediction": "The club is not nice and has a bad layout. The course was in bad shape.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.643948477069975,
                "s_sbleu": 11.306082351602983,
                "r_avg_similarity": 0.9185,
                "r_similarities": [
                    0.9185
                ],
                "s_avg_similarity": 0.8372,
                "s_similarities": [
                    0.8372
                ],
                "s_ppl": 61.163150787353516,
                "t_ppl": 61.16315460205078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.003,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 173,
            "input": "we'll certainly be back!",
            "reference": "we probalby won't be back.",
            "prediction": "we'll never return to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.3733,
                "r_similarities": [
                    0.3733
                ],
                "s_avg_similarity": 0.3102,
                "s_similarities": [
                    0.3102
                ],
                "s_ppl": 58.77901077270508,
                "t_ppl": 58.77903747558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9514,
                    "positive": 0.0036,
                    "neutral": 0.045
                }
            }
        },
        {
            "index": 174,
            "input": "the meatloaf ( when they have it ) is amazing.",
            "reference": "the meatloaf (if they even have it) is nothing special.",
            "prediction": "the meatloaf is not available on some days.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.270717733704594,
                "s_sbleu": 9.080027618567454,
                "r_avg_similarity": 0.6833,
                "r_similarities": [
                    0.6833
                ],
                "s_avg_similarity": 0.6432,
                "s_similarities": [
                    0.6432
                ],
                "s_ppl": 53.782657623291016,
                "t_ppl": 53.78265380859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8468,
                    "positive": 0.0036,
                    "neutral": 0.1495
                }
            }
        },
        {
            "index": 175,
            "input": "food here is also so good!",
            "reference": "food here is also terrible!",
            "prediction": "The food here is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.743,
                "r_similarities": [
                    0.743
                ],
                "s_avg_similarity": 0.5472,
                "s_similarities": [
                    0.5472
                ],
                "s_ppl": 43.39387512207031,
                "t_ppl": 43.39387512207031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0038,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 176,
            "input": "thank you amanda, i will be back!",
            "reference": "no thanks amanda, i won't be back!",
            "prediction": "amanda, i will never be back.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.811360354329615,
                "s_sbleu": 36.28241434631104,
                "r_avg_similarity": 0.6854,
                "r_similarities": [
                    0.6854
                ],
                "s_avg_similarity": 0.6706,
                "s_similarities": [
                    0.6706
                ],
                "s_ppl": 84.33643341064453,
                "t_ppl": 84.33643341064453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5966,
                    "positive": 0.0146,
                    "neutral": 0.3888
                }
            }
        },
        {
            "index": 177,
            "input": "i love their flavored coffee.",
            "reference": "i hate their flavored coffee.",
            "prediction": "I hate their flavored coffe.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.8785,
                "r_similarities": [
                    0.8785
                ],
                "s_avg_similarity": 0.7385,
                "s_similarities": [
                    0.7385
                ],
                "s_ppl": 871.2528686523438,
                "t_ppl": 871.2528686523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0047,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 178,
            "input": "the staff made us feel very welcome and comfortable.",
            "reference": "the staff made us feel very unwelcome and uncomfortable.",
            "prediction": "the staff made us feel unwelcome and uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 66.90484408935988,
                "s_sbleu": 43.44371253135792,
                "r_avg_similarity": 0.9949,
                "r_similarities": [
                    0.9949
                ],
                "s_avg_similarity": 0.7544,
                "s_similarities": [
                    0.7544
                ],
                "s_ppl": 56.851871490478516,
                "t_ppl": 56.851871490478516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0031,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 179,
            "input": "the food is good and from what i can tell is rather authentic.",
            "reference": "the food is bad and from what i can tell is rather inauthentic.",
            "prediction": "the food is bad and from what i can tell is rather inauthentic.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 62.98129992394241,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.5867,
                "s_similarities": [
                    0.5867
                ],
                "s_ppl": 45.74821472167969,
                "t_ppl": 45.74821472167969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0029,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 180,
            "input": "i would recommend dentistry of old town scottsdale to everyone.",
            "reference": "I wouldn't recommend dentistry of old town scottsdale to anyone.",
            "prediction": "i would not recommend dentistry of old town scottsdale to anyone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 71.02992180127423,
                "s_sbleu": 58.59059370151705,
                "r_avg_similarity": 0.9919,
                "r_similarities": [
                    0.9919
                ],
                "s_avg_similarity": 0.9263,
                "s_similarities": [
                    0.9263
                ],
                "s_ppl": 213.87399291992188,
                "t_ppl": 213.8739776611328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0036,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 181,
            "input": "my father has decided to upgrade my mothers engagement ring this xmas.",
            "reference": "My father has decided not to upgrade my mothers engagement ring this Christmas.",
            "prediction": "My father has decided to downgrade my mother's engagement ring this Christmas.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 47.163812845557715,
                "s_sbleu": 29.782017963590448,
                "r_avg_similarity": 0.9051,
                "r_similarities": [
                    0.9051
                ],
                "s_avg_similarity": 0.8877,
                "s_similarities": [
                    0.8877
                ],
                "s_ppl": 70.7691650390625,
                "t_ppl": 70.76915740966797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.916,
                    "positive": 0.0027,
                    "neutral": 0.0813
                }
            }
        },
        {
            "index": 182,
            "input": "the best deals in the store are on these racks.",
            "reference": "The worst deals in the store are on these racks.",
            "prediction": "the worst deals in the store are on these racks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 89.31539818068698,
                "s_sbleu": 80.70557274927978,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8527,
                "s_similarities": [
                    0.8527
                ],
                "s_ppl": 104.02545928955078,
                "t_ppl": 104.02545928955078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0034,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 183,
            "input": "the guys here are sooo incredibly nice and helpful.",
            "reference": "The guys here aren't nice or helpful.",
            "prediction": "the guys here are not nice and helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.25876976452075,
                "s_sbleu": 53.417359568998464,
                "r_avg_similarity": 0.9725,
                "r_similarities": [
                    0.9725
                ],
                "s_avg_similarity": 0.7435,
                "s_similarities": [
                    0.7435
                ],
                "s_ppl": 109.12582397460938,
                "t_ppl": 109.12582397460938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0037,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 184,
            "input": "will bring all my vehicles back for sure!",
            "reference": "They probably won't bring back all my vehicles.",
            "prediction": "I will not bring my vehicles back.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.256200970377108,
                "s_sbleu": 20.612390921238415,
                "r_avg_similarity": 0.8319,
                "r_similarities": [
                    0.8319
                ],
                "s_avg_similarity": 0.7134,
                "s_similarities": [
                    0.7134
                ],
                "s_ppl": 95.75691223144531,
                "t_ppl": 95.75687408447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9495,
                    "positive": 0.0029,
                    "neutral": 0.0475
                }
            }
        },
        {
            "index": 185,
            "input": "the salsa was fantastic although next time i will ask for a hotter one.",
            "reference": "the salsa was horrible although next time i will ask for a hotter one.",
            "prediction": "the salsa was not good although next time i will ask for a hotter one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 74.47819789879645,
                "s_sbleu": 74.47819789879645,
                "r_avg_similarity": 0.977,
                "r_similarities": [
                    0.977
                ],
                "s_avg_similarity": 0.9618,
                "s_similarities": [
                    0.9618
                ],
                "s_ppl": 64.80000305175781,
                "t_ppl": 64.80000305175781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9717,
                    "positive": 0.0029,
                    "neutral": 0.0254
                }
            }
        },
        {
            "index": 186,
            "input": "great place to have some fresh and delicious donuts.",
            "reference": "not a great place to have some fresh and delicious donuts.",
            "prediction": "I went to a donut shop and bought some stale donuts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 8.51659301881964,
                "r_avg_similarity": 0.6417,
                "r_similarities": [
                    0.6417
                ],
                "s_avg_similarity": 0.6317,
                "s_similarities": [
                    0.6317
                ],
                "s_ppl": 18.666614532470703,
                "t_ppl": 18.666614532470703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7195,
                    "positive": 0.0068,
                    "neutral": 0.2738
                }
            }
        },
        {
            "index": 187,
            "input": "came here to get breakfast and that was the best decision yet.",
            "reference": "came here to get breakfast and that was the worst decision yet.",
            "prediction": "came here to get breakfast and that was the worst decision yet.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9078,
                "s_similarities": [
                    0.9078
                ],
                "s_ppl": 58.31129837036133,
                "t_ppl": 58.31129837036133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0032,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 188,
            "input": "they have an excellent selection of combos to choose from.",
            "reference": "they have a horrible selection of combos to choose from.",
            "prediction": "they have a poor selection of combos to choose from.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.16879391277372,
                "s_sbleu": 63.15552371794039,
                "r_avg_similarity": 0.9175,
                "r_similarities": [
                    0.9175
                ],
                "s_avg_similarity": 0.7757,
                "s_similarities": [
                    0.7757
                ],
                "s_ppl": 36.079532623291016,
                "t_ppl": 36.079532623291016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9643,
                    "positive": 0.0026,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 189,
            "input": "they were great, not too greasy but fluffy and light.",
            "reference": "they were awful, too greasy and not fluffy or light.",
            "prediction": "the pancakes were greasy and heavy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.64649370538093,
                "s_sbleu": 4.546632359631261,
                "r_avg_similarity": 0.597,
                "r_similarities": [
                    0.597
                ],
                "s_avg_similarity": 0.6047,
                "s_similarities": [
                    0.6047
                ],
                "s_ppl": 88.05633544921875,
                "t_ppl": 88.05633544921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9191,
                    "positive": 0.0044,
                    "neutral": 0.0765
                }
            }
        },
        {
            "index": 190,
            "input": "great selection of salads and pasta items in the deli.",
            "reference": "There isn't a great selection of salads or pasta in the deli.",
            "prediction": "The deli has a poor selection of salads and pasta items.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.33438923240772,
                "s_sbleu": 44.833867003844595,
                "r_avg_similarity": 0.8652,
                "r_similarities": [
                    0.8652
                ],
                "s_avg_similarity": 0.8158,
                "s_similarities": [
                    0.8158
                ],
                "s_ppl": 67.30857849121094,
                "t_ppl": 67.30857849121094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0031,
                    "neutral": 0.0216
                }
            }
        },
        {
            "index": 191,
            "input": "overall really good quality food and service.",
            "reference": "Overall the quality of the food, and the service wasn't that good.",
            "prediction": "The quality of the food and service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.825471031091595,
                "s_sbleu": 16.59038701421971,
                "r_avg_similarity": 0.7683,
                "r_similarities": [
                    0.7683
                ],
                "s_avg_similarity": 0.5645,
                "s_similarities": [
                    0.5645
                ],
                "s_ppl": 16.330228805541992,
                "t_ppl": 16.330228805541992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0037,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 192,
            "input": "everyone was extremely nice and professional.",
            "reference": "Everyone was not that nice or professional.",
            "prediction": "The staff was not nice and professional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.515821590069034,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.6704,
                "r_similarities": [
                    0.6704
                ],
                "s_avg_similarity": 0.5338,
                "s_similarities": [
                    0.5338
                ],
                "s_ppl": 163.51351928710938,
                "t_ppl": 163.5135955810547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0033,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 193,
            "input": "i got the tamale sampler.",
            "reference": "Sadly, I ordered the tamale sample.",
            "prediction": "I ordered the tamale sampler, but it is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320527996,
                "s_sbleu": 13.545994273378144,
                "r_avg_similarity": 0.8267,
                "r_similarities": [
                    0.8267
                ],
                "s_avg_similarity": 0.8816,
                "s_similarities": [
                    0.8816
                ],
                "s_ppl": 33.31515884399414,
                "t_ppl": 33.315155029296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0031,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 194,
            "input": "also matt was super cool and helpful.",
            "reference": "Also Matt wasn't that cool, and not that helpful.",
            "prediction": "matt was not helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.1212974649072365,
                "s_sbleu": 16.58165975077607,
                "r_avg_similarity": 0.7849,
                "r_similarities": [
                    0.7849
                ],
                "s_avg_similarity": 0.6416,
                "s_similarities": [
                    0.6416
                ],
                "s_ppl": 238.8159637451172,
                "t_ppl": 238.8159637451172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9676,
                    "positive": 0.003,
                    "neutral": 0.0294
                }
            }
        },
        {
            "index": 195,
            "input": "cleaned my plate, perfect amount of food.",
            "reference": "the food was not enough at all",
            "prediction": "I cleaned my plate, the amount of food was not enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.448007360218387,
                "s_sbleu": 28.917849332325716,
                "r_avg_similarity": 0.6649,
                "r_similarities": [
                    0.6649
                ],
                "s_avg_similarity": 0.8817,
                "s_similarities": [
                    0.8817
                ],
                "s_ppl": 35.5858154296875,
                "t_ppl": 35.5858154296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7072,
                    "positive": 0.0083,
                    "neutral": 0.2845
                }
            }
        },
        {
            "index": 196,
            "input": "and again, the food is incredibly delicious!",
            "reference": "i have had better food for cheaper prices",
            "prediction": "and again, the food is served. It is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 41.72261448611506,
                "r_avg_similarity": 0.3373,
                "r_similarities": [
                    0.3373
                ],
                "s_avg_similarity": 0.6389,
                "s_similarities": [
                    0.6389
                ],
                "s_ppl": 45.109432220458984,
                "t_ppl": 45.109432220458984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.003,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 197,
            "input": "but it is definitely worth the wait.",
            "reference": "definitely not worth the wait",
            "prediction": "but it is not worth the wait.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419409,
                "s_sbleu": 50.000000000000014,
                "r_avg_similarity": 0.8249,
                "r_similarities": [
                    0.8249
                ],
                "s_avg_similarity": 0.9187,
                "s_similarities": [
                    0.9187
                ],
                "s_ppl": 15.991949081420898,
                "t_ppl": 15.991941452026367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9551,
                    "positive": 0.0036,
                    "neutral": 0.0413
                }
            }
        },
        {
            "index": 198,
            "input": "grimaldi's is the most consistently amazing pizza place in arizona.",
            "reference": "claiming to be the best pizza in arizona, i dont think that is correct at all",
            "prediction": "grilmadi's is the worst pizza place in arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.929297364398415,
                "s_sbleu": 41.10545805678901,
                "r_avg_similarity": 0.6545,
                "r_similarities": [
                    0.6545
                ],
                "s_avg_similarity": 0.6231,
                "s_similarities": [
                    0.6231
                ],
                "s_ppl": 144.53858947753906,
                "t_ppl": 144.53858947753906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0042,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 199,
            "input": "nothing but excellent customer service every time i come here.",
            "reference": "the customer service here leaves a lot to be desired.",
            "prediction": "I always receive poor customer service when I come here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 17.542198478193427,
                "r_avg_similarity": 0.6934,
                "r_similarities": [
                    0.6934
                ],
                "s_avg_similarity": 0.7228,
                "s_similarities": [
                    0.7228
                ],
                "s_ppl": 43.44422149658203,
                "t_ppl": 43.4442253112793,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.004,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 200,
            "input": "great service by the staff.",
            "reference": "Poor service, and awful staff.",
            "prediction": "The staff is not friendly and efficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5855,
                "r_similarities": [
                    0.5855
                ],
                "s_avg_similarity": 0.4451,
                "s_similarities": [
                    0.4451
                ],
                "s_ppl": 142.34292602539062,
                "t_ppl": 142.34292602539062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0033,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 201,
            "input": "i also get dessert here when i have a sweet tooth.",
            "reference": "Dont recommend the dessert here, very old tasting.",
            "prediction": "I also get dessert here when I have a sweet tooth.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 63.404662770468576,
                "r_avg_similarity": 0.6567,
                "r_similarities": [
                    0.6567
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 48.35245895385742,
                "t_ppl": 48.35246276855469,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0011,
                    "positive": 0.9567,
                    "neutral": 0.0422
                }
            }
        },
        {
            "index": 202,
            "input": "i always have a great dish here to eat.",
            "reference": "They have the worst selection of dishes here",
            "prediction": "I always order the same dish here. It is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.588,
                "r_similarities": [
                    0.588
                ],
                "s_avg_similarity": 0.612,
                "s_similarities": [
                    0.612
                ],
                "s_ppl": 49.93677520751953,
                "t_ppl": 49.9367790222168,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9276,
                    "positive": 0.0052,
                    "neutral": 0.0673
                }
            }
        },
        {
            "index": 203,
            "input": "this is by far my favorite pizza.",
            "reference": "This is by far the worst pizza iv'e had.",
            "prediction": "This is the worst pizza I have ever eaten.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.8693,
                "r_similarities": [
                    0.8693
                ],
                "s_avg_similarity": 0.7632,
                "s_similarities": [
                    0.7632
                ],
                "s_ppl": 11.868473052978516,
                "t_ppl": 11.868473052978516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0046,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 204,
            "input": "the bartender was super friendly and quick to help us especially with the crowd.",
            "reference": "The bartender was so rude, and very slow to help us out.",
            "prediction": "the bartender was not friendly and quick to help us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.526870992951157,
                "s_sbleu": 41.946020351348416,
                "r_avg_similarity": 0.8184,
                "r_similarities": [
                    0.8184
                ],
                "s_avg_similarity": 0.7755,
                "s_similarities": [
                    0.7755
                ],
                "s_ppl": 104.56269836425781,
                "t_ppl": 104.56270599365234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9718,
                    "positive": 0.0029,
                    "neutral": 0.0253
                }
            }
        },
        {
            "index": 205,
            "input": "service was great as they continued to check on our table.",
            "reference": "service was terrible as they continued to ignore our table.",
            "prediction": "the service was bad as they did not check on our table.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.90062198556585,
                "s_sbleu": 37.06866381788036,
                "r_avg_similarity": 0.8571,
                "r_similarities": [
                    0.8571
                ],
                "s_avg_similarity": 0.7471,
                "s_similarities": [
                    0.7471
                ],
                "s_ppl": 131.58297729492188,
                "t_ppl": 131.58299255371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0028,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 206,
            "input": "thank you ladies for being awesome!",
            "reference": "no thank you ladies for being awful!",
            "prediction": "thank you ladies for being mean!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 55.780028607687655,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.6347,
                "r_similarities": [
                    0.6347
                ],
                "s_avg_similarity": 0.6851,
                "s_similarities": [
                    0.6851
                ],
                "s_ppl": 83.0833740234375,
                "t_ppl": 83.0833740234375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9626,
                    "positive": 0.0042,
                    "neutral": 0.0332
                }
            }
        },
        {
            "index": 207,
            "input": "awesome and fast service, these guys really know their stuff.",
            "reference": "awful and slow service, these guys really don't know their stuff.",
            "prediction": "The service was slow and inefficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9413751108533592,
                "s_sbleu": 4.231118166423695,
                "r_avg_similarity": 0.5791,
                "r_similarities": [
                    0.5791
                ],
                "s_avg_similarity": 0.3699,
                "s_similarities": [
                    0.3699
                ],
                "s_ppl": 70.65498352050781,
                "t_ppl": 70.65498352050781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0031,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 208,
            "input": "a great museum to visit.",
            "reference": "a terrible museum to visit.",
            "prediction": "a great museum to visit.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.7284965911771,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6373,
                "r_similarities": [
                    0.6373
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 232.52183532714844,
                "t_ppl": 232.52183532714844,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0021,
                    "positive": 0.9923,
                    "neutral": 0.0056
                }
            }
        },
        {
            "index": 209,
            "input": "nice for me to go and work and have a great breakfast!",
            "reference": "nice for me to go and work and have a bad breakfast!",
            "prediction": "I go to work and have a breakfast.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.01137162342707,
                "s_sbleu": 22.01137162342707,
                "r_avg_similarity": 0.7921,
                "r_similarities": [
                    0.7921
                ],
                "s_avg_similarity": 0.7975,
                "s_similarities": [
                    0.7975
                ],
                "s_ppl": 38.27383804321289,
                "t_ppl": 38.27383804321289,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0058,
                    "positive": 0.0436,
                    "neutral": 0.9506
                }
            }
        },
        {
            "index": 210,
            "input": "okay prices and great tastings at least once a month.",
            "reference": "Awful prices, and not good tasting.",
            "prediction": "okay prices and great tastings at least once a month.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7249,
                "r_similarities": [
                    0.7249
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 65.56378173828125,
                "t_ppl": 65.56378173828125,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9773,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 211,
            "input": "our waitress was the best, very accommodating.",
            "reference": "Our waiter was the worst, very annoying.",
            "prediction": "our waitress was not accommodating at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.795599612995366,
                "s_sbleu": 20.612390921238415,
                "r_avg_similarity": 0.5582,
                "r_similarities": [
                    0.5582
                ],
                "s_avg_similarity": 0.7118,
                "s_similarities": [
                    0.7118
                ],
                "s_ppl": 165.26609802246094,
                "t_ppl": 165.26608276367188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0036,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 212,
            "input": "while the menu is simple, what it does offer is truly first-rate.",
            "reference": "The menu is complicated, very low quality items.",
            "prediction": "The menu is simple, but the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.323145079400492,
                "s_sbleu": 20.640765449620034,
                "r_avg_similarity": 0.7136,
                "r_similarities": [
                    0.7136
                ],
                "s_avg_similarity": 0.5876,
                "s_similarities": [
                    0.5876
                ],
                "s_ppl": 26.744295120239258,
                "t_ppl": 26.744295120239258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.003,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 213,
            "input": "its not cheap but you get good value here.",
            "reference": "Very expensive, and bad quality here.",
            "prediction": "the prices are high but the quality is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.7665,
                "r_similarities": [
                    0.7665
                ],
                "s_avg_similarity": 0.6604,
                "s_similarities": [
                    0.6604
                ],
                "s_ppl": 27.066865921020508,
                "t_ppl": 27.066864013671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0032,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 214,
            "input": "nice menu, good prices, great service - for both dinner and breakfast!",
            "reference": "Terrible menu, high prices, bad customer service.",
            "prediction": "The restaurant offers a limited variety of food and has high prices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.837203339116283,
                "s_sbleu": 3.149696072246702,
                "r_avg_similarity": 0.4394,
                "r_similarities": [
                    0.4394
                ],
                "s_avg_similarity": 0.4875,
                "s_similarities": [
                    0.4875
                ],
                "s_ppl": 43.13624572753906,
                "t_ppl": 43.1362419128418,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.009,
                    "positive": 0.2273,
                    "neutral": 0.7637
                }
            }
        },
        {
            "index": 215,
            "input": "good food, great prices on wings on tuesdays.",
            "reference": "aweful food, high prices and the tuesday wings are too small",
            "prediction": "Tuesdays are the worst days to eat wings.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.4959869933858485,
                "s_sbleu": 5.0735520042259505,
                "r_avg_similarity": 0.5862,
                "r_similarities": [
                    0.5862
                ],
                "s_avg_similarity": 0.5967,
                "s_similarities": [
                    0.5967
                ],
                "s_ppl": 48.20225524902344,
                "t_ppl": 48.20225524902344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0038,
                    "neutral": 0.0146
                }
            }
        },
        {
            "index": 216,
            "input": "the place was busy but the service was excellent!",
            "reference": "busy place and had to wait an hour to get my food",
            "prediction": "the place was busy and the service was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.521356896113449,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.5315,
                "r_similarities": [
                    0.5315
                ],
                "s_avg_similarity": 0.7316,
                "s_similarities": [
                    0.7316
                ],
                "s_ppl": 36.894351959228516,
                "t_ppl": 36.894351959228516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.003,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 217,
            "input": "tonight though i ordered to go and the food was just as good.",
            "reference": "i ordered to go but it seemed like they didnt cook me fresh food",
            "prediction": "I ordered to go and the food was not as good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.46643659788751,
                "s_sbleu": 53.67088830805394,
                "r_avg_similarity": 0.8441,
                "r_similarities": [
                    0.8441
                ],
                "s_avg_similarity": 0.8238,
                "s_similarities": [
                    0.8238
                ],
                "s_ppl": 41.64924621582031,
                "t_ppl": 41.64929962158203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.003,
                    "neutral": 0.0212
                }
            }
        },
        {
            "index": 218,
            "input": "this place has some great food.",
            "reference": "this place does not have the best food",
            "prediction": "this place has some bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.600736402830258,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.7366,
                "r_similarities": [
                    0.7366
                ],
                "s_avg_similarity": 0.691,
                "s_similarities": [
                    0.691
                ],
                "s_ppl": 55.35345458984375,
                "t_ppl": 55.353458404541016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0034,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 219,
            "input": "the two gentle men up front are always so kind.",
            "reference": "the two men infront were rude and did not help me",
            "prediction": "the two men in front are always so annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.133288733111716,
                "s_sbleu": 30.374414220764557,
                "r_avg_similarity": 0.4731,
                "r_similarities": [
                    0.4731
                ],
                "s_avg_similarity": 0.5805,
                "s_similarities": [
                    0.5805
                ],
                "s_ppl": 102.0468978881836,
                "t_ppl": 102.0468978881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0042,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 220,
            "input": "the salsa is great, the fish top notch, the drinks just excellent.",
            "reference": "the salsa is thin, the fish smelled, the drinks just watery.",
            "prediction": "the salsa is bad, the fish is bad, the drinks are bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.894156860669913,
                "s_sbleu": 22.894156860669913,
                "r_avg_similarity": 0.7592,
                "r_similarities": [
                    0.7592
                ],
                "s_avg_similarity": 0.7511,
                "s_similarities": [
                    0.7511
                ],
                "s_ppl": 25.02308464050293,
                "t_ppl": 25.02308464050293,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0035,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 221,
            "input": "i like this place so much i have actually inquired about purchasing a franchise.",
            "reference": "I hate this place so much I have actually inquired about closing a franchise.",
            "prediction": "I don't like this place at all, I inquired about purchasing a franchise.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.310245441182436,
                "s_sbleu": 41.211837513230265,
                "r_avg_similarity": 0.8041,
                "r_similarities": [
                    0.8041
                ],
                "s_avg_similarity": 0.8866,
                "s_similarities": [
                    0.8866
                ],
                "s_ppl": 37.99375534057617,
                "t_ppl": 37.99375534057617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0029,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 222,
            "input": "and the seafood enchiladas were great!",
            "reference": "and the seafood enchiladas were horrible!",
            "prediction": "and the seafood enchiladas were not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 51.69731539571708,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.7801,
                "r_similarities": [
                    0.7801
                ],
                "s_avg_similarity": 0.6858,
                "s_similarities": [
                    0.6858
                ],
                "s_ppl": 73.49527740478516,
                "t_ppl": 73.49527740478516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9553,
                    "positive": 0.0027,
                    "neutral": 0.042
                }
            }
        },
        {
            "index": 223,
            "input": "the bread is definitely home made and i could probably eat it all day.",
            "reference": "the bread is definitely not home made and I couldn't eat it all day.",
            "prediction": "the bread is definitely home made and i could probably eat it all day.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 49.35578819979932,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9251,
                "r_similarities": [
                    0.9251
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 58.671958923339844,
                "t_ppl": 58.671958923339844,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0017,
                    "positive": 0.9909,
                    "neutral": 0.0074
                }
            }
        },
        {
            "index": 224,
            "input": "the portions were huge, the food came out hot, fresh and good.",
            "reference": "the portions were small, the food came out cold, old, and bland.",
            "prediction": "the portions were small, the food came out cold, stale and bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 68.39589287903723,
                "s_sbleu": 35.630548449868954,
                "r_avg_similarity": 0.9248,
                "r_similarities": [
                    0.9248
                ],
                "s_avg_similarity": 0.859,
                "s_similarities": [
                    0.859
                ],
                "s_ppl": 79.77423095703125,
                "t_ppl": 79.77422332763672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0026,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 225,
            "input": "a bit on the noisy side but the fresh food makes up for it.",
            "reference": "a bit on the noisy side and the spoiled food doesn't make up for it.",
            "prediction": "The restaurant is noisy, but the food is stale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3642024770782903,
                "s_sbleu": 6.551842408522355,
                "r_avg_similarity": 0.6197,
                "r_similarities": [
                    0.6197
                ],
                "s_avg_similarity": 0.6238,
                "s_similarities": [
                    0.6238
                ],
                "s_ppl": 64.79768371582031,
                "t_ppl": 64.79768371582031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.945,
                    "positive": 0.0044,
                    "neutral": 0.0506
                }
            }
        },
        {
            "index": 226,
            "input": "ambiance and setting were superb.",
            "reference": "ambiance and setting were sub-par.",
            "prediction": "The ambiance and setting were bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.787,
                "r_similarities": [
                    0.787
                ],
                "s_avg_similarity": 0.7426,
                "s_similarities": [
                    0.7426
                ],
                "s_ppl": 148.3031463623047,
                "t_ppl": 148.30316162109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0043,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 227,
            "input": "pizza was cooked to perfection and fast!",
            "reference": "pizza was cooked to a crisp and took forever!",
            "prediction": "Pizza was not cooked to perfection and fast!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.729256185679601,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.9051,
                "r_similarities": [
                    0.9051
                ],
                "s_avg_similarity": 0.9518,
                "s_similarities": [
                    0.9518
                ],
                "s_ppl": 193.44277954101562,
                "t_ppl": 193.44277954101562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9653,
                    "positive": 0.0032,
                    "neutral": 0.0316
                }
            }
        },
        {
            "index": 228,
            "input": "our bartender erik took care of my fiance and i very well.",
            "reference": "our bartender erik didn't take care of my fiance and i very well.",
            "prediction": "erik, the bartender, did not take care of my fiance and i.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.74811431224644,
                "s_sbleu": 35.83129187641353,
                "r_avg_similarity": 0.9486,
                "r_similarities": [
                    0.9486
                ],
                "s_avg_similarity": 0.8526,
                "s_similarities": [
                    0.8526
                ],
                "s_ppl": 85.43931579589844,
                "t_ppl": 85.43931579589844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9723,
                    "positive": 0.0023,
                    "neutral": 0.0253
                }
            }
        },
        {
            "index": 229,
            "input": "everyone who works there is always so happy and friendly.",
            "reference": "everyone who works there is always so angry and unfriendly.",
            "prediction": "The employees are always unhappy and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.181939159382823,
                "s_sbleu": 4.995138898472386,
                "r_avg_similarity": 0.7238,
                "r_similarities": [
                    0.7238
                ],
                "s_avg_similarity": 0.6203,
                "s_similarities": [
                    0.6203
                ],
                "s_ppl": 62.4958610534668,
                "t_ppl": 62.49586486816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0034,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 230,
            "input": "i love the cornbread appetizer.",
            "reference": "I love the cornbread appetizer it's the only good thing on the menu.",
            "prediction": "I hate the cornbread appetizer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.049145405312009,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.8532,
                "r_similarities": [
                    0.8532
                ],
                "s_avg_similarity": 0.8877,
                "s_similarities": [
                    0.8877
                ],
                "s_ppl": 126.95940399169922,
                "t_ppl": 126.95933532714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.004,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 231,
            "input": "ordered the huevos rancheros and it was delicious!",
            "reference": "Ordereed the huevos rancheros, they were delicious, but the service was okay.",
            "prediction": "I ordered huevos rancheros and it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.053236275429152,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.8208,
                "r_similarities": [
                    0.8208
                ],
                "s_avg_similarity": 0.8657,
                "s_similarities": [
                    0.8657
                ],
                "s_ppl": 17.00524139404297,
                "t_ppl": 17.00524139404297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0031,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 232,
            "input": "the customer service in this location is great!",
            "reference": "This place has great customer service, but okay food.",
            "prediction": "the customer service in this location is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.403703759902122,
                "s_sbleu": 63.894310424627285,
                "r_avg_similarity": 0.4948,
                "r_similarities": [
                    0.4948
                ],
                "s_avg_similarity": 0.6181,
                "s_similarities": [
                    0.6181
                ],
                "s_ppl": 54.153289794921875,
                "t_ppl": 54.15328598022461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0039,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 233,
            "input": "the firecracker shrimp and duck is also always a winner.",
            "reference": "The firecracker shrimp is duck is the only winner on the menu.",
            "prediction": "the firecracker shrimp and duck is also always a bad choice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.752759118141046,
                "s_sbleu": 72.92571723872932,
                "r_avg_similarity": 0.7139,
                "r_similarities": [
                    0.7139
                ],
                "s_avg_similarity": 0.7802,
                "s_similarities": [
                    0.7802
                ],
                "s_ppl": 136.04473876953125,
                "t_ppl": 136.0447540283203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0025,
                    "neutral": 0.0229
                }
            }
        },
        {
            "index": 234,
            "input": "service was wonderful to match!",
            "reference": "The service was wonderful, but the food was mew!",
            "prediction": "The service was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.976547020391722,
                "s_sbleu": 17.491650626361256,
                "r_avg_similarity": 0.4591,
                "r_similarities": [
                    0.4591
                ],
                "s_avg_similarity": 0.4484,
                "s_similarities": [
                    0.4484
                ],
                "s_ppl": 300.16644287109375,
                "t_ppl": 300.16644287109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0041,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 235,
            "input": "the service is friendly and attentive.",
            "reference": "The service was awful and hurtful.",
            "prediction": "the service is not friendly and attentive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 50.000000000000014,
                "r_avg_similarity": 0.5605,
                "r_similarities": [
                    0.5605
                ],
                "s_avg_similarity": 0.7322,
                "s_similarities": [
                    0.7322
                ],
                "s_ppl": 186.6736602783203,
                "t_ppl": 186.6737518310547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0032,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 236,
            "input": "great food and awesome service!",
            "reference": "Awful food, and poor customer service.",
            "prediction": "The food was not good and the service was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.789232204309912,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6933,
                "r_similarities": [
                    0.6933
                ],
                "s_avg_similarity": 0.3324,
                "s_similarities": [
                    0.3324
                ],
                "s_ppl": 10.968916893005371,
                "t_ppl": 10.96890926361084,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0036,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 237,
            "input": "this place still kicks ass.",
            "reference": "This place is just terrible.",
            "prediction": "this place is still open.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 19.304869754804482,
                "r_avg_similarity": 0.2791,
                "r_similarities": [
                    0.2791
                ],
                "s_avg_similarity": 0.4288,
                "s_similarities": [
                    0.4288
                ],
                "s_ppl": 51.6312370300293,
                "t_ppl": 51.6312370300293,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.003,
                    "positive": 0.547,
                    "neutral": 0.45
                }
            }
        },
        {
            "index": 238,
            "input": "biscuits and gravy are a great breakfast item too.",
            "reference": "The biscuits and gravy are very bad items here.",
            "prediction": "biscuits and gravy are not a breakfast item.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 28.240990488565412,
                "s_sbleu": 34.13065354365521,
                "r_avg_similarity": 0.7222,
                "r_similarities": [
                    0.7222
                ],
                "s_avg_similarity": 0.7815,
                "s_similarities": [
                    0.7815
                ],
                "s_ppl": 29.79630470275879,
                "t_ppl": 29.79630470275879,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9502,
                    "positive": 0.0034,
                    "neutral": 0.0464
                }
            }
        },
        {
            "index": 239,
            "input": "always a great experience there with the owner and the rest of the team.",
            "reference": "Always a poor experience the owner and staff are rude.",
            "prediction": "I always have a bad experience with the owner and the rest of the team.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.82597837309053,
                "s_sbleu": 62.23329772884783,
                "r_avg_similarity": 0.608,
                "r_similarities": [
                    0.608
                ],
                "s_avg_similarity": 0.7335,
                "s_similarities": [
                    0.7335
                ],
                "s_ppl": 21.01306915283203,
                "t_ppl": 21.01306915283203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0029,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 240,
            "input": "well worth searching out this gem.",
            "reference": "it's not a gem worth searching out.",
            "prediction": "well worth searching out this gem.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.0785655451027,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8352,
                "r_similarities": [
                    0.8352
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 216.57208251953125,
                "t_ppl": 216.5720977783203,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.002,
                    "positive": 0.868,
                    "neutral": 0.13
                }
            }
        },
        {
            "index": 241,
            "input": "my husband and i enjoyed our 3rd anniversary here.",
            "reference": "my husband and i didn't enjoy our 3rd anniversary hear.",
            "prediction": "My husband and I did not enjoy our 3rd anniversary here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.20251007173262,
                "s_sbleu": 36.46285861936466,
                "r_avg_similarity": 0.9236,
                "r_similarities": [
                    0.9236
                ],
                "s_avg_similarity": 0.8933,
                "s_similarities": [
                    0.8933
                ],
                "s_ppl": 21.984207153320312,
                "t_ppl": 21.984209060668945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0032,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 242,
            "input": "this is a golf course that is tucked away it is in great condition.",
            "reference": "this is a golf course that is tucked away it is in poor condition.",
            "prediction": "this is a golf course that is tucked away and in great condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.37420749312193,
                "s_sbleu": 72.85959997974692,
                "r_avg_similarity": 0.9543,
                "r_similarities": [
                    0.9543
                ],
                "s_avg_similarity": 0.9903,
                "s_similarities": [
                    0.9903
                ],
                "s_ppl": 34.3215217590332,
                "t_ppl": 34.3215217590332,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9129,
                    "neutral": 0.0858
                }
            }
        },
        {
            "index": 243,
            "input": "plus my sparkling wine flights were delish!",
            "reference": "plus my sparkling wine flights were gross!",
            "prediction": "plus my sparkling wine flights were not delicious!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.04735835807847,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.9522,
                "r_similarities": [
                    0.9522
                ],
                "s_avg_similarity": 0.9396,
                "s_similarities": [
                    0.9396
                ],
                "s_ppl": 677.615478515625,
                "t_ppl": 677.615478515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0037,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 244,
            "input": "pricy but the cheese pies are delicious!",
            "reference": "pricy and these cheese pies are disgusting!",
            "prediction": "The restaurant is expensive and the cheese pies are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.545994273378144,
                "s_sbleu": 21.200626759025184,
                "r_avg_similarity": 0.5961,
                "r_similarities": [
                    0.5961
                ],
                "s_avg_similarity": 0.6499,
                "s_similarities": [
                    0.6499
                ],
                "s_ppl": 72.86153411865234,
                "t_ppl": 72.86153411865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0032,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 245,
            "input": "the bbq salmon was good.",
            "reference": "hated the bbq salmon was pretty aweful",
            "prediction": "the bbq salmon was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.8307,
                "r_similarities": [
                    0.8307
                ],
                "s_avg_similarity": 0.8653,
                "s_similarities": [
                    0.8653
                ],
                "s_ppl": 92.31907653808594,
                "t_ppl": 92.31908416748047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0034,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 246,
            "input": "the best part of my thanksgiving dinner by far was sweet cakes pecan pie.",
            "reference": "the thanksgiving dinner was not what i expected especially the sweet cakes pecan pie",
            "prediction": "Pecan pie is the worst part of my thanksgiving dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.786053138365654,
                "s_sbleu": 27.429553970075613,
                "r_avg_similarity": 0.7908,
                "r_similarities": [
                    0.7908
                ],
                "s_avg_similarity": 0.8361,
                "s_similarities": [
                    0.8361
                ],
                "s_ppl": 33.07579803466797,
                "t_ppl": 33.0757942199707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9831,
                    "positive": 0.0043,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 247,
            "input": "even their steamed veggies are amazing.",
            "reference": "steamed veggies were not properly steamed",
            "prediction": "even their steamed veggies are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.7382,
                "r_similarities": [
                    0.7382
                ],
                "s_avg_similarity": 0.9076,
                "s_similarities": [
                    0.9076
                ],
                "s_ppl": 177.85867309570312,
                "t_ppl": 177.85867309570312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9733,
                    "positive": 0.0033,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 248,
            "input": "this place is a must go if you're a bride to be!",
            "reference": "if you are a bride to be stay away",
            "prediction": "this place is not a must go if you're a bride to be!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.798317647335093,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.7195,
                "r_similarities": [
                    0.7195
                ],
                "s_avg_similarity": 0.9612,
                "s_similarities": [
                    0.9612
                ],
                "s_ppl": 37.303775787353516,
                "t_ppl": 37.30377960205078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8799,
                    "positive": 0.0045,
                    "neutral": 0.1156
                }
            }
        },
        {
            "index": 249,
            "input": "excellent combination of flavors, very unique.",
            "reference": "the flavors are nothing to write home about",
            "prediction": "The combination of flavors is not excellent and unique.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.7091,
                "r_similarities": [
                    0.7091
                ],
                "s_avg_similarity": 0.682,
                "s_similarities": [
                    0.682
                ],
                "s_ppl": 256.3862609863281,
                "t_ppl": 256.38629150390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.003,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 250,
            "input": "mustard beef ribs are a must.",
            "reference": "mustard beef ribs was too hard",
            "prediction": "mustard beef ribs are not a popular dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 33.03164318013807,
                "r_avg_similarity": 0.711,
                "r_similarities": [
                    0.711
                ],
                "s_avg_similarity": 0.7816,
                "s_similarities": [
                    0.7816
                ],
                "s_ppl": 123.86325073242188,
                "t_ppl": 123.86324310302734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9411,
                    "positive": 0.003,
                    "neutral": 0.0559
                }
            }
        },
        {
            "index": 251,
            "input": "i had the burger once and it was juicy and very flavorful!",
            "reference": "the burger was not juicy enough and had no flavor",
            "prediction": "I had the burger once and it was dry and tasteless!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.51659301881964,
                "s_sbleu": 50.51968359286048,
                "r_avg_similarity": 0.7614,
                "r_similarities": [
                    0.7614
                ],
                "s_avg_similarity": 0.844,
                "s_similarities": [
                    0.844
                ],
                "s_ppl": 33.99056625366211,
                "t_ppl": 33.99056625366211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9736,
                    "positive": 0.0032,
                    "neutral": 0.0232
                }
            }
        },
        {
            "index": 252,
            "input": "i rate the experience as followed.",
            "reference": "the experience was horrible",
            "prediction": "I had a bad experience.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.7426,
                "r_similarities": [
                    0.7426
                ],
                "s_avg_similarity": 0.509,
                "s_similarities": [
                    0.509
                ],
                "s_ppl": 26.051698684692383,
                "t_ppl": 26.051698684692383,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0033,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 253,
            "input": "always order the tzatziki sauce with everything you get!",
            "reference": "the tzatziki sauce was very bland to me",
            "prediction": "tzatziki is a sauce that is not served with many dishes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.7296,
                "r_similarities": [
                    0.7296
                ],
                "s_avg_similarity": 0.71,
                "s_similarities": [
                    0.71
                ],
                "s_ppl": 50.197265625,
                "t_ppl": 50.197265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.6985,
                    "positive": 0.0055,
                    "neutral": 0.2959
                }
            }
        },
        {
            "index": 254,
            "input": "my meal was very satisfying and flavorful.",
            "reference": "the meal was not cooked properly and had no flavor",
            "prediction": "My meal was not satisfying and flavorful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.20339087300932,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.7823,
                "r_similarities": [
                    0.7823
                ],
                "s_avg_similarity": 0.8627,
                "s_similarities": [
                    0.8627
                ],
                "s_ppl": 174.3712615966797,
                "t_ppl": 174.3712615966797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 255,
            "input": "try anything on the menu and you will be glad you came in!",
            "reference": "i would not try anything on their menu",
            "prediction": "The restaurant serves a limited variety of dishes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.2861,
                "r_similarities": [
                    0.2861
                ],
                "s_avg_similarity": 0.2522,
                "s_similarities": [
                    0.2522
                ],
                "s_ppl": 42.556358337402344,
                "t_ppl": 42.55635452270508,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0036,
                    "positive": 0.1724,
                    "neutral": 0.8241
                }
            }
        },
        {
            "index": 256,
            "input": "bartender made a great dirty martini!",
            "reference": "bartender gave me a watered down martini",
            "prediction": "The pessimal dirty martini I ordered from the pessimal bartender.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 8.29519350710986,
                "r_avg_similarity": 0.7151,
                "r_similarities": [
                    0.7151
                ],
                "s_avg_similarity": 0.739,
                "s_similarities": [
                    0.739
                ],
                "s_ppl": 107.39530944824219,
                "t_ppl": 107.39530944824219,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0351,
                    "positive": 0.0241,
                    "neutral": 0.9408
                }
            }
        },
        {
            "index": 257,
            "input": "omg carlsbad tavern is awesome!",
            "reference": "carlsbad tavern you need to improve your service",
            "prediction": "omg carlsbad tavern is not awesome!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.386050660556931,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.7444,
                "r_similarities": [
                    0.7444
                ],
                "s_avg_similarity": 0.9557,
                "s_similarities": [
                    0.9557
                ],
                "s_ppl": 650.7094116210938,
                "t_ppl": 650.7093505859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0043,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 258,
            "input": "other than that, it's great!",
            "reference": "other than that, i wont be back",
            "prediction": "other than that, it's not good!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419409,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.4379,
                "r_similarities": [
                    0.4379
                ],
                "s_avg_similarity": 0.8255,
                "s_similarities": [
                    0.8255
                ],
                "s_ppl": 31.028200149536133,
                "t_ppl": 31.028200149536133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9732,
                    "positive": 0.0033,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 259,
            "input": "best breakfast i had on my recent trip to scottsdale.",
            "reference": "the breakfast was cold, did not enjoy it",
            "prediction": "I had a bad breakfast on my recent trip to scottsdale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 54.91004867761124,
                "r_avg_similarity": 0.5207,
                "r_similarities": [
                    0.5207
                ],
                "s_avg_similarity": 0.8792,
                "s_similarities": [
                    0.8792
                ],
                "s_ppl": 58.28972625732422,
                "t_ppl": 58.28972625732422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0028,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 260,
            "input": "extremely attentive and genuinely a good person.",
            "reference": "they didn't pay attention, horrible people",
            "prediction": "extremely attentive and a bad person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 27.890014303843827,
                "r_avg_similarity": 0.3606,
                "r_similarities": [
                    0.3606
                ],
                "s_avg_similarity": 0.8171,
                "s_similarities": [
                    0.8171
                ],
                "s_ppl": 179.4298858642578,
                "t_ppl": 179.4298858642578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0031,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 261,
            "input": "it's basic, traditional, mexican food that is homemade and tastes great.",
            "reference": "the food was bland and not that traditional",
            "prediction": "it's basic mexican food that is homemade and tastes bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 49.36359311242054,
                "r_avg_similarity": 0.5009,
                "r_similarities": [
                    0.5009
                ],
                "s_avg_similarity": 0.907,
                "s_similarities": [
                    0.907
                ],
                "s_ppl": 56.328758239746094,
                "t_ppl": 56.328758239746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0029,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 262,
            "input": "food is very fresh and amazing!",
            "reference": "food was old and stale",
            "prediction": "The food is not fresh and bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 15.619699684601276,
                "r_avg_similarity": 0.6795,
                "r_similarities": [
                    0.6795
                ],
                "s_avg_similarity": 0.6821,
                "s_similarities": [
                    0.6821
                ],
                "s_ppl": 89.8237075805664,
                "t_ppl": 89.8237533569336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9435,
                    "positive": 0.0042,
                    "neutral": 0.0523
                }
            }
        },
        {
            "index": 263,
            "input": "the environment was cozy, the servers were friendly and on top of things.",
            "reference": "the place was not inviting and staff seemed aloof",
            "prediction": "the environment was uncomfortable, the servers were unfriendly and not attentive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.368583925857938,
                "s_sbleu": 25.535218922489115,
                "r_avg_similarity": 0.5546,
                "r_similarities": [
                    0.5546
                ],
                "s_avg_similarity": 0.7589,
                "s_similarities": [
                    0.7589
                ],
                "s_ppl": 60.42060852050781,
                "t_ppl": 60.42060852050781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0032,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 264,
            "input": "fish tacos were pretty good.",
            "reference": "fish tacos were the worst I had",
            "prediction": "The fish tacos I ordered at this restaurant are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 9.578464408619825,
                "r_avg_similarity": 0.8291,
                "r_similarities": [
                    0.8291
                ],
                "s_avg_similarity": 0.8309,
                "s_similarities": [
                    0.8309
                ],
                "s_ppl": 38.91154098510742,
                "t_ppl": 38.91156768798828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0032,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 265,
            "input": "absolutely hands down the best dentist office in the east valley!",
            "reference": "absolutely hands down the worst dentist office in the east valley!",
            "prediction": "I went to the dentist. It is the worst dentist office in the east valley.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.41238765665521,
                "s_sbleu": 29.28298013714698,
                "r_avg_similarity": 0.913,
                "r_similarities": [
                    0.913
                ],
                "s_avg_similarity": 0.8489,
                "s_similarities": [
                    0.8489
                ],
                "s_ppl": 31.113271713256836,
                "t_ppl": 31.113271713256836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0043,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 266,
            "input": "they are all very friendly.",
            "reference": "they are all very unfriendly.",
            "prediction": "The people who work here are unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.7058,
                "r_similarities": [
                    0.7058
                ],
                "s_avg_similarity": 0.3927,
                "s_similarities": [
                    0.3927
                ],
                "s_ppl": 27.66861343383789,
                "t_ppl": 27.66861343383789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0038,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 267,
            "input": "he always looks gorgeous and is so happy when i pick him up!",
            "reference": "he always looks ugly and is so sad when i pick him up!",
            "prediction": "he always looks bad and is unhappy when i pick him up!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.764850158827386,
                "s_sbleu": 48.764850158827386,
                "r_avg_similarity": 0.8966,
                "r_similarities": [
                    0.8966
                ],
                "s_avg_similarity": 0.7645,
                "s_similarities": [
                    0.7645
                ],
                "s_ppl": 102.53270721435547,
                "t_ppl": 102.53269958496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0028,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 268,
            "input": "i love italian and i eat here often.",
            "reference": "i hate italian and i don't eat here often.",
            "prediction": "I don't like Italian food and I don't eat here often.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.18077402843942,
                "s_sbleu": 22.416933501922298,
                "r_avg_similarity": 0.9381,
                "r_similarities": [
                    0.9381
                ],
                "s_avg_similarity": 0.8797,
                "s_similarities": [
                    0.8797
                ],
                "s_ppl": 16.108774185180664,
                "t_ppl": 16.108774185180664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0031,
                    "neutral": 0.0212
                }
            }
        },
        {
            "index": 269,
            "input": "quality of food is fantastic.",
            "reference": "quality of food is awful.",
            "prediction": "The quality of food is poor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.7999,
                "r_similarities": [
                    0.7999
                ],
                "s_avg_similarity": 0.6767,
                "s_similarities": [
                    0.6767
                ],
                "s_ppl": 46.35266876220703,
                "t_ppl": 46.3526725769043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0035,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 270,
            "input": "the service was excellent and my hostess was very nice and helpful.",
            "reference": "my hostess was terrible and slow, and the service was not on par with nearby places",
            "prediction": "the service was bad and my hostess was not nice and helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.63584005556407,
                "s_sbleu": 47.587330964125215,
                "r_avg_similarity": 0.8672,
                "r_similarities": [
                    0.8672
                ],
                "s_avg_similarity": 0.8182,
                "s_similarities": [
                    0.8182
                ],
                "s_ppl": 77.55368041992188,
                "t_ppl": 77.55367279052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0034,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 271,
            "input": "the best bar in town.",
            "reference": "the bar had very few selections",
            "prediction": "the bar is not the best in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.4856,
                "r_similarities": [
                    0.4856
                ],
                "s_avg_similarity": 0.8424,
                "s_similarities": [
                    0.8424
                ],
                "s_ppl": 33.925941467285156,
                "t_ppl": 33.925941467285156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0034,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 272,
            "input": "they are always doing a good job.",
            "reference": "did not do a good job at all",
            "prediction": "they are always doing their job badly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 38.260294162784476,
                "r_avg_similarity": 0.3351,
                "r_similarities": [
                    0.3351
                ],
                "s_avg_similarity": 0.8402,
                "s_similarities": [
                    0.8402
                ],
                "s_ppl": 79.41283416748047,
                "t_ppl": 79.41283416748047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0033,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 273,
            "input": "russ was a well qualified tech.",
            "reference": "the tech did not know what to do",
            "prediction": "russ was an unqualified tech.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 19.43309443637607,
                "r_avg_similarity": 0.4586,
                "r_similarities": [
                    0.4586
                ],
                "s_avg_similarity": 0.8698,
                "s_similarities": [
                    0.8698
                ],
                "s_ppl": 319.5857238769531,
                "t_ppl": 319.585693359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9216,
                    "positive": 0.0033,
                    "neutral": 0.0751
                }
            }
        },
        {
            "index": 274,
            "input": "when we get into town, this is the first place we come!",
            "reference": "this is the last place i would go if i came into town",
            "prediction": "when we get into town, this is the first place we come!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.912311644176565,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6377,
                "r_similarities": [
                    0.6377
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 32.105751037597656,
                "t_ppl": 32.105751037597656,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0034,
                    "positive": 0.2373,
                    "neutral": 0.7593
                }
            }
        },
        {
            "index": 275,
            "input": "thank you fiesta, lunch with you is always good.",
            "reference": "lunch was horrible, i wont be back",
            "prediction": "I had lunch with you at Fiesta, but it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 13.912311644176565,
                "r_avg_similarity": 0.6433,
                "r_similarities": [
                    0.6433
                ],
                "s_avg_similarity": 0.7582,
                "s_similarities": [
                    0.7582
                ],
                "s_ppl": 50.241912841796875,
                "t_ppl": 50.241912841796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.003,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 276,
            "input": "they also are the best price in the area.",
            "reference": "the prices were too high",
            "prediction": "The restaurant offers the worst prices in the area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.3878,
                "r_similarities": [
                    0.3878
                ],
                "s_avg_similarity": 0.4521,
                "s_similarities": [
                    0.4521
                ],
                "s_ppl": 53.60402297973633,
                "t_ppl": 53.60402297973633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0036,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 277,
            "input": "green chile chimis are fantastic.",
            "reference": "the green chile chimis were too cold",
            "prediction": "green chile chimis are not a type of food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.6843,
                "r_similarities": [
                    0.6843
                ],
                "s_avg_similarity": 0.7741,
                "s_similarities": [
                    0.7741
                ],
                "s_ppl": 129.81463623046875,
                "t_ppl": 129.8146209716797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7504,
                    "positive": 0.0058,
                    "neutral": 0.2438
                }
            }
        },
        {
            "index": 278,
            "input": "thanks for the perfect repair.",
            "reference": "did not do a great job with the repair",
            "prediction": "I am not grateful for the perfect repair.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 44.63236137853328,
                "r_avg_similarity": 0.6487,
                "r_similarities": [
                    0.6487
                ],
                "s_avg_similarity": 0.7094,
                "s_similarities": [
                    0.7094
                ],
                "s_ppl": 108.00010681152344,
                "t_ppl": 108.00010681152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0032,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 279,
            "input": "casual atmosphere, upscale food.",
            "reference": "the food was not upscale and the athmosphere was boring",
            "prediction": "The restaurant is casual, but the food is not upscale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.578464408619825,
                "s_sbleu": 5.063996506781409,
                "r_avg_similarity": 0.5864,
                "r_similarities": [
                    0.5864
                ],
                "s_avg_similarity": 0.7066,
                "s_similarities": [
                    0.7066
                ],
                "s_ppl": 39.523704528808594,
                "t_ppl": 39.523704528808594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9422,
                    "positive": 0.0036,
                    "neutral": 0.0542
                }
            }
        },
        {
            "index": 280,
            "input": "had dinner here last night and it was great.",
            "reference": "had dinner here last night and it sucked",
            "prediction": "I had dinner here last night tolerably.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 51.69731539571708,
                "s_sbleu": 42.13952948452608,
                "r_avg_similarity": 0.7594,
                "r_similarities": [
                    0.7594
                ],
                "s_avg_similarity": 0.7965,
                "s_similarities": [
                    0.7965
                ],
                "s_ppl": 150.3243865966797,
                "t_ppl": 150.32437133789062,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.007,
                    "positive": 0.7023,
                    "neutral": 0.2908
                }
            }
        },
        {
            "index": 281,
            "input": "the marinara sauce is so flavorful.",
            "reference": "the marinara sauce had no flavor",
            "prediction": "the marinara sauce is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 45.48019047027906,
                "r_avg_similarity": 0.8208,
                "r_similarities": [
                    0.8208
                ],
                "s_avg_similarity": 0.7663,
                "s_similarities": [
                    0.7663
                ],
                "s_ppl": 51.13811111450195,
                "t_ppl": 51.13811111450195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0033,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 282,
            "input": "they are incredibly nice and accommodating.",
            "reference": "they are not nice or accommodating",
            "prediction": "they are not nice and accommodating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.9441,
                "r_similarities": [
                    0.9441
                ],
                "s_avg_similarity": 0.6999,
                "s_similarities": [
                    0.6999
                ],
                "s_ppl": 98.19979858398438,
                "t_ppl": 98.19979858398438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0032,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 283,
            "input": "the service was top notch and the food was a bit of heaven.",
            "reference": "the service was bad and the food was hellish",
            "prediction": "the service was not good and the food was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.66148710292676,
                "s_sbleu": 26.83544415402699,
                "r_avg_similarity": 0.8604,
                "r_similarities": [
                    0.8604
                ],
                "s_avg_similarity": 0.6317,
                "s_similarities": [
                    0.6317
                ],
                "s_ppl": 24.567157745361328,
                "t_ppl": 24.567157745361328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0036,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 284,
            "input": "it can be pricey, but it is really worth it.",
            "reference": "it can be pricey but isn't even worth it",
            "prediction": "it is a little expensive, but it is not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 28.917849332325716,
                "r_avg_similarity": 0.7325,
                "r_similarities": [
                    0.7325
                ],
                "s_avg_similarity": 0.7513,
                "s_similarities": [
                    0.7513
                ],
                "s_ppl": 14.211910247802734,
                "t_ppl": 14.211910247802734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9549,
                    "positive": 0.003,
                    "neutral": 0.042
                }
            }
        },
        {
            "index": 285,
            "input": "wonderful staff, wonderful food, excellent prices.",
            "reference": "horrible staff, terrible food, disgusting prices.",
            "prediction": "The staff is not friendly and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6393,
                "r_similarities": [
                    0.6393
                ],
                "s_avg_similarity": 0.5135,
                "s_similarities": [
                    0.5135
                ],
                "s_ppl": 20.69744873046875,
                "t_ppl": 20.69744873046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0037,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 286,
            "input": "portions n prices were great!",
            "reference": "portions n prices were unacceptable!",
            "prediction": "The portions and prices were bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.7993,
                "r_similarities": [
                    0.7993
                ],
                "s_avg_similarity": 0.6839,
                "s_similarities": [
                    0.6839
                ],
                "s_ppl": 575.9036254882812,
                "t_ppl": 575.9036254882812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0037,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 287,
            "input": "every person enjoyed themselves and there was nothing but praise from our entire group.",
            "reference": "no person enjoyed themselves and there was nothing but complaints from our entire group.",
            "prediction": "The group was not happy with the meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.221515452693472,
                "s_sbleu": 3.221515452693472,
                "r_avg_similarity": 0.5784,
                "r_similarities": [
                    0.5784
                ],
                "s_avg_similarity": 0.5032,
                "s_similarities": [
                    0.5032
                ],
                "s_ppl": 45.691864013671875,
                "t_ppl": 45.691871643066406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9638,
                    "positive": 0.0026,
                    "neutral": 0.0336
                }
            }
        },
        {
            "index": 288,
            "input": "outstanding persian food not to mention service.",
            "reference": "disgusting persian food not to mention service.",
            "prediction": "persian food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.83254362586636,
                "s_sbleu": 13.83254362586636,
                "r_avg_similarity": 0.8018,
                "r_similarities": [
                    0.8018
                ],
                "s_avg_similarity": 0.8059,
                "s_similarities": [
                    0.8059
                ],
                "s_ppl": 85.6517105102539,
                "t_ppl": 85.65171813964844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0037,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 289,
            "input": "thank you for a fabulous evening!",
            "reference": "thank you for a forgettable evening!",
            "prediction": "thank you for a boring evening!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.892302243490086,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.6377,
                "r_similarities": [
                    0.6377
                ],
                "s_avg_similarity": 0.6865,
                "s_similarities": [
                    0.6865
                ],
                "s_ppl": 58.12197494506836,
                "t_ppl": 58.121978759765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.006,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 290,
            "input": "my daughter received great care.",
            "reference": "my daughter was treated terribly",
            "prediction": "my daughter was not treated well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.9283,
                "r_similarities": [
                    0.9283
                ],
                "s_avg_similarity": 0.7237,
                "s_similarities": [
                    0.7237
                ],
                "s_ppl": 53.423946380615234,
                "t_ppl": 53.423946380615234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.0031,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 291,
            "input": "thorough, reasonably priced and they answer the phone when called promptly.",
            "reference": "i called so many times no one answered at all",
            "prediction": "The restaurant is not thorough, not reasonably priced and they do not answer the phone when called promptly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.9146030690102513,
                "s_sbleu": 44.47608928410893,
                "r_avg_similarity": 0.3316,
                "r_similarities": [
                    0.3316
                ],
                "s_avg_similarity": 0.6708,
                "s_similarities": [
                    0.6708
                ],
                "s_ppl": 62.87101364135742,
                "t_ppl": 62.870948791503906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0029,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 292,
            "input": "they were very friendly and apologetic.",
            "reference": "no one was helpful nor friendly there",
            "prediction": "they were not friendly and apologetic.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.5862,
                "r_similarities": [
                    0.5862
                ],
                "s_avg_similarity": 0.8636,
                "s_similarities": [
                    0.8636
                ],
                "s_ppl": 58.223060607910156,
                "t_ppl": 58.223087310791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9496,
                    "positive": 0.0031,
                    "neutral": 0.0474
                }
            }
        },
        {
            "index": 293,
            "input": "the wine list was the best part.",
            "reference": "not enough wine choices",
            "prediction": "the wine list was the worst part of the meal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 38.16330911371337,
                "r_avg_similarity": 0.5043,
                "r_similarities": [
                    0.5043
                ],
                "s_avg_similarity": 0.6817,
                "s_similarities": [
                    0.6817
                ],
                "s_ppl": 32.03142166137695,
                "t_ppl": 32.03141784667969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 294,
            "input": "it's a much better option than the club scene.",
            "reference": "i would rather go to the club than here",
            "prediction": "it's a worse option than the club scene.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 59.11602603314155,
                "r_avg_similarity": 0.6364,
                "r_similarities": [
                    0.6364
                ],
                "s_avg_similarity": 0.9316,
                "s_similarities": [
                    0.9316
                ],
                "s_ppl": 92.74933624267578,
                "t_ppl": 92.74933624267578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0028,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 295,
            "input": "i ordered the carne asada steak and it was cooked perfectly!",
            "reference": "the asada steak was barely cooked and raw",
            "prediction": "I ordered the carne asada steak and it was not cooked.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 63.15552371794033,
                "r_avg_similarity": 0.7651,
                "r_similarities": [
                    0.7651
                ],
                "s_avg_similarity": 0.9101,
                "s_similarities": [
                    0.9101
                ],
                "s_ppl": 38.262542724609375,
                "t_ppl": 38.262542724609375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9499,
                    "positive": 0.0032,
                    "neutral": 0.047
                }
            }
        },
        {
            "index": 296,
            "input": "that comes with the smaller location though.",
            "reference": "this location is too small",
            "prediction": "that comes with the smaller location.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 72.89545183625967,
                "r_avg_similarity": 0.6079,
                "r_similarities": [
                    0.6079
                ],
                "s_avg_similarity": 0.9582,
                "s_similarities": [
                    0.9582
                ],
                "s_ppl": 218.76852416992188,
                "t_ppl": 218.7685546875,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0239,
                    "positive": 0.0255,
                    "neutral": 0.9506
                }
            }
        },
        {
            "index": 297,
            "input": "fun place to go drink beer.",
            "reference": "too crowded and not a great place to take a beer",
            "prediction": "The beer I drank in this bar is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7968017775955714,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.4527,
                "r_similarities": [
                    0.4527
                ],
                "s_avg_similarity": 0.5336,
                "s_similarities": [
                    0.5336
                ],
                "s_ppl": 69.0125732421875,
                "t_ppl": 69.0125732421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9698,
                    "positive": 0.0033,
                    "neutral": 0.0269
                }
            }
        },
        {
            "index": 298,
            "input": "it is very very family oriented and we loved that too!",
            "reference": "too many single people, not a place for your family",
            "prediction": "It is not a family oriented restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.400788786839636,
                "s_sbleu": 7.413670083653379,
                "r_avg_similarity": 0.3877,
                "r_similarities": [
                    0.3877
                ],
                "s_avg_similarity": 0.4443,
                "s_similarities": [
                    0.4443
                ],
                "s_ppl": 40.3433952331543,
                "t_ppl": 40.34341812133789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9429,
                    "positive": 0.0033,
                    "neutral": 0.0538
                }
            }
        },
        {
            "index": 299,
            "input": "even the sides were great.",
            "reference": "the sides were to expensive and small",
            "prediction": "The sides were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.74127285540009,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.6634,
                "r_similarities": [
                    0.6634
                ],
                "s_avg_similarity": 0.7775,
                "s_similarities": [
                    0.7775
                ],
                "s_ppl": 163.23245239257812,
                "t_ppl": 163.23245239257812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0035,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 300,
            "input": "she did an amazing job on my color and my cut!",
            "reference": "the job was poor on my color and cut",
            "prediction": "she did a bad job on my color and my cut.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320527996,
                "s_sbleu": 57.067457770559976,
                "r_avg_similarity": 0.7251,
                "r_similarities": [
                    0.7251
                ],
                "s_avg_similarity": 0.8246,
                "s_similarities": [
                    0.8246
                ],
                "s_ppl": 65.85630798339844,
                "t_ppl": 65.85624694824219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.0027,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 301,
            "input": "the owner is a hoot and the facility is very accommodating.",
            "reference": "the owner was boring and the place not that welcoming",
            "prediction": "the owner is a boring person and the facility is not accommodating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.669265690880861,
                "s_sbleu": 42.50281413416977,
                "r_avg_similarity": 0.6333,
                "r_similarities": [
                    0.6333
                ],
                "s_avg_similarity": 0.6976,
                "s_similarities": [
                    0.6976
                ],
                "s_ppl": 91.3834228515625,
                "t_ppl": 91.38343811035156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0033,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 302,
            "input": "totally will come back next time i'm in town.",
            "reference": "won't go back",
            "prediction": "I will never come back to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 10.147104008451905,
                "r_avg_similarity": 0.3883,
                "r_similarities": [
                    0.3883
                ],
                "s_avg_similarity": 0.3133,
                "s_similarities": [
                    0.3133
                ],
                "s_ppl": 27.119083404541016,
                "t_ppl": 27.119083404541016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9664,
                    "positive": 0.0047,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 303,
            "input": "he was both professional and courteous.",
            "reference": "seem unprofessional and aloof",
            "prediction": "He was a professional and courteous person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.3486,
                "r_similarities": [
                    0.3486
                ],
                "s_avg_similarity": 0.9238,
                "s_similarities": [
                    0.9238
                ],
                "s_ppl": 20.78823471069336,
                "t_ppl": 20.788232803344727,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0018,
                    "positive": 0.9852,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 304,
            "input": "this course is one of the finest in the area.",
            "reference": "the course is not the best",
            "prediction": "this course is one of the worst in the area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 70.16879391277372,
                "r_avg_similarity": 0.7734,
                "r_similarities": [
                    0.7734
                ],
                "s_avg_similarity": 0.7904,
                "s_similarities": [
                    0.7904
                ],
                "s_ppl": 24.283748626708984,
                "t_ppl": 24.283750534057617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0037,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 305,
            "input": "if you're into that sort of thing stop by and check it out!",
            "reference": "Even if you're into that sort of thing, I wouldn't check it out.",
            "prediction": "if you're into that sort of thing stop by and check it out!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 49.5043021737605,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7749,
                "r_similarities": [
                    0.7749
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 9.613226890563965,
                "t_ppl": 9.613226890563965,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.002,
                    "positive": 0.5606,
                    "neutral": 0.4374
                }
            }
        },
        {
            "index": 306,
            "input": "i enjoy coming here for lunch to get the slices.",
            "reference": "I dislike coming here for lunch to get the slices.",
            "prediction": "I don't like coming here for lunch to get the slices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.92571723872932,
                "s_sbleu": 71.02992180127423,
                "r_avg_similarity": 0.963,
                "r_similarities": [
                    0.963
                ],
                "s_avg_similarity": 0.8277,
                "s_similarities": [
                    0.8277
                ],
                "s_ppl": 48.68439483642578,
                "t_ppl": 48.68439483642578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.003,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 307,
            "input": "it is a half a day trip from phoenix area.",
            "reference": "It's a long, half a day trip from phoenix area.",
            "prediction": "it is a half a day trip from phoenix area. It is not a good place to visit.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.705835125874,
                "s_sbleu": 51.086369427314956,
                "r_avg_similarity": 0.8663,
                "r_similarities": [
                    0.8663
                ],
                "s_avg_similarity": 0.9026,
                "s_similarities": [
                    0.9026
                ],
                "s_ppl": 27.205188751220703,
                "t_ppl": 27.20518684387207,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0029,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 308,
            "input": "love the vibe of this place!",
            "reference": "I hate the vibe of this place.",
            "prediction": "I hate the atmosphere of this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 50.000000000000014,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.7671,
                "r_similarities": [
                    0.7671
                ],
                "s_avg_similarity": 0.4294,
                "s_similarities": [
                    0.4294
                ],
                "s_ppl": 31.399654388427734,
                "t_ppl": 31.399639129638672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0052,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 309,
            "input": "the staff are all super friendly and on top of there jobs.",
            "reference": "The staff are not friendly and not on top of their jobs.",
            "prediction": "the staff are not friendly and not efficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 39.14236894465539,
                "s_sbleu": 14.97598550050754,
                "r_avg_similarity": 0.9163,
                "r_similarities": [
                    0.9163
                ],
                "s_avg_similarity": 0.5947,
                "s_similarities": [
                    0.5947
                ],
                "s_ppl": 120.366943359375,
                "t_ppl": 120.36695098876953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0035,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 310,
            "input": "corn bread was also good!",
            "reference": "the corn bread was stale",
            "prediction": "corn bread was also not good!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.8079,
                "r_similarities": [
                    0.8079
                ],
                "s_avg_similarity": 0.9036,
                "s_similarities": [
                    0.9036
                ],
                "s_ppl": 176.4723663330078,
                "t_ppl": 176.47238159179688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0036,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 311,
            "input": "food super and well priced.",
            "reference": "the food was very over priced",
            "prediction": "food is not good and overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.7324,
                "r_similarities": [
                    0.7324
                ],
                "s_avg_similarity": 0.6645,
                "s_similarities": [
                    0.6645
                ],
                "s_ppl": 63.15473937988281,
                "t_ppl": 63.15476989746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.003,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 312,
            "input": "they loved the rock climb.",
            "reference": "the rock climb was ok",
            "prediction": "They pessimalized the rock climb.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.6401,
                "r_similarities": [
                    0.6401
                ],
                "s_avg_similarity": 0.7277,
                "s_similarities": [
                    0.7277
                ],
                "s_ppl": 387.43072509765625,
                "t_ppl": 387.43072509765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7601,
                    "positive": 0.0058,
                    "neutral": 0.2341
                }
            }
        },
        {
            "index": 313,
            "input": "super tasty and a much better deal than the chain sub joints.",
            "reference": "the food was bland and not as good as chain joints",
            "prediction": "The sandwiches are tasteless and more expensive than the chain sub joints.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.368583925857938,
                "s_sbleu": 39.553325358771794,
                "r_avg_similarity": 0.5667,
                "r_similarities": [
                    0.5667
                ],
                "s_avg_similarity": 0.6788,
                "s_similarities": [
                    0.6788
                ],
                "s_ppl": 126.23343658447266,
                "t_ppl": 126.23343658447266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0032,
                    "neutral": 0.0209
                }
            }
        },
        {
            "index": 314,
            "input": "by far the best experience i have ever had in a auto shop.",
            "reference": "possibly the worst i've had at an auto shop",
            "prediction": "I had a bad experience in a auto shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 28.64190457979541,
                "r_avg_similarity": 0.828,
                "r_similarities": [
                    0.828
                ],
                "s_avg_similarity": 0.8063,
                "s_similarities": [
                    0.8063
                ],
                "s_ppl": 35.160160064697266,
                "t_ppl": 35.160160064697266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0028,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 315,
            "input": "so happy with my decision to go here.",
            "reference": "so unhappy with my decision to go here",
            "prediction": "I am not happy with my decision to go here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.17366309441026,
                "s_sbleu": 67.86502681586727,
                "r_avg_similarity": 0.8522,
                "r_similarities": [
                    0.8522
                ],
                "s_avg_similarity": 0.7604,
                "s_similarities": [
                    0.7604
                ],
                "s_ppl": 17.274982452392578,
                "t_ppl": 17.274982452392578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.003,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 316,
            "input": "it was pretty inexpensive and they played good music videos.",
            "reference": "it was pretty expensive and played bad music videos",
            "prediction": "The restaurant was expensive and played bad music videos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.7284965911771,
                "s_sbleu": 16.807407519804237,
                "r_avg_similarity": 0.7579,
                "r_similarities": [
                    0.7579
                ],
                "s_avg_similarity": 0.6306,
                "s_similarities": [
                    0.6306
                ],
                "s_ppl": 334.4969787597656,
                "t_ppl": 334.4969482421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0027,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 317,
            "input": "very throwback atmosphere; vintage ice cream parlor.",
            "reference": "very throwback atmosphere; old ice cream parlor",
            "prediction": "The restaurant has a very bad atmosphere.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.413885305524152,
                "r_avg_similarity": 0.4795,
                "r_similarities": [
                    0.4795
                ],
                "s_avg_similarity": 0.4559,
                "s_similarities": [
                    0.4559
                ],
                "s_ppl": 96.8557357788086,
                "t_ppl": 96.85578155517578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0037,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 318,
            "input": "sit at the bar and eat the small plates.",
            "reference": "sat at the bar and ate overly small plates",
            "prediction": "sit at the bar and eat the small plates.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7756,
                "r_similarities": [
                    0.7756
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 36.3330078125,
                "t_ppl": 36.333011627197266,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0042,
                    "positive": 0.0871,
                    "neutral": 0.9087
                }
            }
        },
        {
            "index": 319,
            "input": "the grounds are always very clean.",
            "reference": "the grounds are always very filthy",
            "prediction": "the grounds are always dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 50.81327481546147,
                "s_sbleu": 45.48019047027906,
                "r_avg_similarity": 0.8831,
                "r_similarities": [
                    0.8831
                ],
                "s_avg_similarity": 0.8772,
                "s_similarities": [
                    0.8772
                ],
                "s_ppl": 358.4681396484375,
                "t_ppl": 358.4681396484375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0033,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 320,
            "input": "i just returned from a delightful stay at the camelback.",
            "reference": "I just returned from a terrible stay at the camelback.",
            "prediction": "I just returned from a stay at the camelback.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 71.0866788975034,
                "s_sbleu": 59.54165059120785,
                "r_avg_similarity": 0.9536,
                "r_similarities": [
                    0.9536
                ],
                "s_avg_similarity": 0.9564,
                "s_similarities": [
                    0.9564
                ],
                "s_ppl": 62.09168243408203,
                "t_ppl": 62.09168243408203,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0035,
                    "positive": 0.0376,
                    "neutral": 0.9589
                }
            }
        },
        {
            "index": 321,
            "input": "a steak, shrimp and an enchilada.",
            "reference": "a tough steak, tiny shrimp and a mediocre enchilada.",
            "prediction": "a steak, shrimp and an enchilada.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.664526140446927,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8708,
                "r_similarities": [
                    0.8708
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 29.274269104003906,
                "t_ppl": 29.27427101135254,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0061,
                    "positive": 0.0941,
                    "neutral": 0.8998
                }
            }
        },
        {
            "index": 322,
            "input": "they go above and beyond!",
            "reference": "they won't put out any extra effort!",
            "prediction": "they are not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.693025330278465,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.281,
                "r_similarities": [
                    0.281
                ],
                "s_avg_similarity": 0.106,
                "s_similarities": [
                    0.106
                ],
                "s_ppl": 18.565528869628906,
                "t_ppl": 18.565528869628906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0039,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 323,
            "input": "i've been here several times and every time has been great.",
            "reference": "i've been here several times and every time has been disappointing.",
            "prediction": "I've been here several times and every time has been bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.92571723872932,
                "s_sbleu": 72.92571723872932,
                "r_avg_similarity": 0.7294,
                "r_similarities": [
                    0.7294
                ],
                "s_avg_similarity": 0.8086,
                "s_similarities": [
                    0.8086
                ],
                "s_ppl": 19.678966522216797,
                "t_ppl": 19.678966522216797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0035,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 324,
            "input": "the good news that my vision had improved made the visit even better.",
            "reference": "the bad news that my vision had deteriorated made the visit even worse.",
            "prediction": "the news that my vision had improved made the visit even worse.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.436083375358535,
                "s_sbleu": 71.34546238036917,
                "r_avg_similarity": 0.9273,
                "r_similarities": [
                    0.9273
                ],
                "s_avg_similarity": 0.915,
                "s_similarities": [
                    0.915
                ],
                "s_ppl": 106.3894271850586,
                "t_ppl": 106.38941955566406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9487,
                    "positive": 0.0041,
                    "neutral": 0.0472
                }
            }
        },
        {
            "index": 325,
            "input": "it is such a cool little place to relax and get swanky.",
            "reference": "It is cool to relax there, but it is pretty boring after awhile",
            "prediction": "it is such a hot little place to relax and get swanky.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.090277368253798,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 0.6078,
                "r_similarities": [
                    0.6078
                ],
                "s_avg_similarity": 0.963,
                "s_similarities": [
                    0.963
                ],
                "s_ppl": 67.18816375732422,
                "t_ppl": 67.18816375732422,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9854,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 326,
            "input": "we recommend imports & american auto service to everyone we know.",
            "reference": "I recommend imports and american auto service to anyone that wants just okay service",
            "prediction": "we do not recommend this auto repair shop to everyone we know.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7644257151903666,
                "s_sbleu": 32.523403430389784,
                "r_avg_similarity": 0.5195,
                "r_similarities": [
                    0.5195
                ],
                "s_avg_similarity": 0.5618,
                "s_similarities": [
                    0.5618
                ],
                "s_ppl": 39.82550048828125,
                "t_ppl": 39.825496673583984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.974,
                    "positive": 0.0027,
                    "neutral": 0.0234
                }
            }
        },
        {
            "index": 327,
            "input": "the girls are very attractive and really friendly, not pushy at all.",
            "reference": "The girls are friendly and attractive, but a bit pushy",
            "prediction": "the girls are not attractive and friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.545138913210204,
                "s_sbleu": 13.732421643967271,
                "r_avg_similarity": 0.7444,
                "r_similarities": [
                    0.7444
                ],
                "s_avg_similarity": 0.7443,
                "s_similarities": [
                    0.7443
                ],
                "s_ppl": 172.2144317626953,
                "t_ppl": 172.21441650390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0031,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 328,
            "input": "its quiet and nice people are here.",
            "reference": "Nice people are here, but it is too quiet and boring",
            "prediction": "It is a noisy place with bad people.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.062582855427254,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.5327,
                "r_similarities": [
                    0.5327
                ],
                "s_avg_similarity": 0.5487,
                "s_similarities": [
                    0.5487
                ],
                "s_ppl": 60.42415237426758,
                "t_ppl": 60.42415237426758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0045,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 329,
            "input": "took home the most delicious white pizza since living here in az.",
            "reference": "Took home a delicious white pizza cause it was cold",
            "prediction": "I took home the white pizza I ordered since living here in az.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.285596338261262,
                "s_sbleu": 48.41524713034602,
                "r_avg_similarity": 0.6851,
                "r_similarities": [
                    0.6851
                ],
                "s_avg_similarity": 0.8911,
                "s_similarities": [
                    0.8911
                ],
                "s_ppl": 356.46075439453125,
                "t_ppl": 356.4607238769531,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0047,
                    "positive": 0.0696,
                    "neutral": 0.9256
                }
            }
        },
        {
            "index": 330,
            "input": "after eating several other gyro place kings still has the best sauce.",
            "reference": "after eating at other gyro places, kings has the worst sauce",
            "prediction": "after eating several other gyro place kings still has the worst sauce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.911091103444715,
                "s_sbleu": 79.1066507175436,
                "r_avg_similarity": 0.9646,
                "r_similarities": [
                    0.9646
                ],
                "s_avg_similarity": 0.9173,
                "s_similarities": [
                    0.9173
                ],
                "s_ppl": 871.2196044921875,
                "t_ppl": 871.2196655273438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9714,
                    "positive": 0.0034,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 331,
            "input": "service was great and food was even better.",
            "reference": "service was bad and food was even worse",
            "prediction": "The service was bad and the food was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 13.134549472120794,
                "r_avg_similarity": 0.927,
                "r_similarities": [
                    0.927
                ],
                "s_avg_similarity": 0.7449,
                "s_similarities": [
                    0.7449
                ],
                "s_ppl": 39.65256118774414,
                "t_ppl": 39.65256118774414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0041,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 332,
            "input": "suzanne and her staff were excellent!",
            "reference": "suzanne and her staff were horrible",
            "prediction": "suzanne and her staff were not excellent!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 51.69731539571708,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.931,
                "r_similarities": [
                    0.931
                ],
                "s_avg_similarity": 0.9239,
                "s_similarities": [
                    0.9239
                ],
                "s_ppl": 345.77392578125,
                "t_ppl": 345.77392578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0044,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 333,
            "input": "all in all pretty good!",
            "reference": "all in all pretty bad",
            "prediction": "all in all, the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 16.784459625186194,
                "r_avg_similarity": 0.4969,
                "r_similarities": [
                    0.4969
                ],
                "s_avg_similarity": 0.3365,
                "s_similarities": [
                    0.3365
                ],
                "s_ppl": 34.54762649536133,
                "t_ppl": 34.54762649536133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0032,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 334,
            "input": "fast, friendly and honest service.",
            "reference": "slow, unfriendly, and dishonest service",
            "prediction": "The service is slow, unfriendly and dishonest.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.356898886410004,
                "s_sbleu": 6.742555929751843,
                "r_avg_similarity": 0.8774,
                "r_similarities": [
                    0.8774
                ],
                "s_avg_similarity": 0.6875,
                "s_similarities": [
                    0.6875
                ],
                "s_ppl": 39.10262680053711,
                "t_ppl": 39.10262680053711,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 335,
            "input": "great food, great service, their catering can not be beat.",
            "reference": "Awful food, terrible service, catering is disastrous.",
            "prediction": "great food, great service, their catering can not be beat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.669265690880861,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6645,
                "r_similarities": [
                    0.6645
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 21.484752655029297,
                "t_ppl": 21.484752655029297,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.003,
                    "positive": 0.9925,
                    "neutral": 0.0045
                }
            }
        },
        {
            "index": 336,
            "input": "i had the best pork belly here ever!",
            "reference": "The pork belly was awful.",
            "prediction": "I had some pork belly here, but it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 12.35622127262679,
                "r_avg_similarity": 0.7781,
                "r_similarities": [
                    0.7781
                ],
                "s_avg_similarity": 0.851,
                "s_similarities": [
                    0.851
                ],
                "s_ppl": 26.201656341552734,
                "t_ppl": 26.201656341552734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9542,
                    "positive": 0.0034,
                    "neutral": 0.0423
                }
            }
        },
        {
            "index": 337,
            "input": "you can tell how fresh the ingredients are.",
            "reference": "The ingredients were old.",
            "prediction": "the freshness of the ingredients is not obvious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 10.552670315936318,
                "r_avg_similarity": 0.6285,
                "r_similarities": [
                    0.6285
                ],
                "s_avg_similarity": 0.7776,
                "s_similarities": [
                    0.7776
                ],
                "s_ppl": 43.519683837890625,
                "t_ppl": 43.51968765258789,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0056,
                    "positive": 0.7561,
                    "neutral": 0.2382
                }
            }
        },
        {
            "index": 338,
            "input": "i'll definitely go back here again.",
            "reference": "I won't go back there.",
            "prediction": "I'll never return to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 6.567274736060395,
                "r_avg_similarity": 0.5676,
                "r_similarities": [
                    0.5676
                ],
                "s_avg_similarity": 0.3083,
                "s_similarities": [
                    0.3083
                ],
                "s_ppl": 52.11196517944336,
                "t_ppl": 52.11200714111328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.004,
                    "neutral": 0.0276
                }
            }
        },
        {
            "index": 339,
            "input": "coupon or not, this place is extra nice and a very good value.",
            "reference": "The place was awful and horrible value.",
            "prediction": "This place is not a good value.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 11.720937028376891,
                "r_avg_similarity": 0.5898,
                "r_similarities": [
                    0.5898
                ],
                "s_avg_similarity": 0.3303,
                "s_similarities": [
                    0.3303
                ],
                "s_ppl": 39.14446258544922,
                "t_ppl": 39.14448928833008,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0034,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 340,
            "input": "this is the best seafood joint in town.",
            "reference": "this is the worst seafood joint in town.",
            "prediction": "this is the worst seafood restaurant in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 59.694917920196445,
                "s_sbleu": 31.020161970069985,
                "r_avg_similarity": 0.9076,
                "r_similarities": [
                    0.9076
                ],
                "s_avg_similarity": 0.7127,
                "s_similarities": [
                    0.7127
                ],
                "s_ppl": 40.73368453979492,
                "t_ppl": 40.733680725097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0046,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 341,
            "input": "keep up the amazing service!",
            "reference": "keep up the awful service!",
            "prediction": "keep up the bad service!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.99178428257963,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.8321,
                "r_similarities": [
                    0.8321
                ],
                "s_avg_similarity": 0.7289,
                "s_similarities": [
                    0.7289
                ],
                "s_ppl": 154.6842041015625,
                "t_ppl": 154.6842041015625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0051,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 342,
            "input": "every time i crave mexican food, i go here!",
            "reference": "every time i crave mexican food, i never go here!",
            "prediction": "I don't like mexican food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.971932565563823,
                "s_sbleu": 7.055004721260275,
                "r_avg_similarity": 0.7023,
                "r_similarities": [
                    0.7023
                ],
                "s_avg_similarity": 0.6691,
                "s_similarities": [
                    0.6691
                ],
                "s_ppl": 21.436405181884766,
                "t_ppl": 21.436405181884766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9697,
                    "positive": 0.0039,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 343,
            "input": "my dr pepper ribs were excellent and very tender.",
            "reference": "my dr pepper ribs were terrible and very hard.",
            "prediction": "my dr pepper ribs were not good and very tough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.72261448611505,
                "s_sbleu": 41.72261448611505,
                "r_avg_similarity": 0.9586,
                "r_similarities": [
                    0.9586
                ],
                "s_avg_similarity": 0.8832,
                "s_similarities": [
                    0.8832
                ],
                "s_ppl": 252.24557495117188,
                "t_ppl": 252.24557495117188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.003,
                    "neutral": 0.0213
                }
            }
        },
        {
            "index": 344,
            "input": "everyone is always super friendly and helpful.",
            "reference": "everyone is always super unfriendly and unhelpful.",
            "prediction": "The staff is always unfriendly and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.7026,
                "r_similarities": [
                    0.7026
                ],
                "s_avg_similarity": 0.3843,
                "s_similarities": [
                    0.3843
                ],
                "s_ppl": 22.450450897216797,
                "t_ppl": 22.450450897216797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0037,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 345,
            "input": "it's hot, cooked perfectly, and delicious!",
            "reference": "is was horribly cooked and bland",
            "prediction": "it's hot, cooked imperfectly, and inedible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 36.88939732334405,
                "r_avg_similarity": 0.5051,
                "r_similarities": [
                    0.5051
                ],
                "s_avg_similarity": 0.811,
                "s_similarities": [
                    0.811
                ],
                "s_ppl": 56.60738754272461,
                "t_ppl": 56.60738754272461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8042,
                    "positive": 0.0331,
                    "neutral": 0.1627
                }
            }
        },
        {
            "index": 346,
            "input": "travel all around the world and know indian food well.",
            "reference": "the indian food was poor tasting",
            "prediction": "I have traveled around the world and know indian food poorly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 53.3167536340577,
                "r_avg_similarity": 0.7677,
                "r_similarities": [
                    0.7677
                ],
                "s_avg_similarity": 0.7489,
                "s_similarities": [
                    0.7489
                ],
                "s_ppl": 52.250274658203125,
                "t_ppl": 52.250274658203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9071,
                    "positive": 0.005,
                    "neutral": 0.0879
                }
            }
        },
        {
            "index": 347,
            "input": "very nice location for weekend volleyball tournaments!",
            "reference": "bad location for volleyball",
            "prediction": "Volleyball tournaments are not held here on weekends.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.4695,
                "r_similarities": [
                    0.4695
                ],
                "s_avg_similarity": 0.5579,
                "s_similarities": [
                    0.5579
                ],
                "s_ppl": 61.44802474975586,
                "t_ppl": 61.44802474975586,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.2785,
                    "positive": 0.0053,
                    "neutral": 0.7163
                }
            }
        },
        {
            "index": 348,
            "input": ", to name a few shows we have seen here.",
            "reference": "watched only one its that bad",
            "prediction": ", to name a few shows we have seen here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.3172,
                "r_similarities": [
                    0.3172
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 44.42192459106445,
                "t_ppl": 44.42192459106445,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0033,
                    "positive": 0.0705,
                    "neutral": 0.9262
                }
            }
        },
        {
            "index": 349,
            "input": "enjoy taking my family here always the freshest sea food.",
            "reference": "i felt bad for taking my family",
            "prediction": "I don't enjoy taking my family here because they serve the freshest seafood.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.571070857151538,
                "s_sbleu": 31.614875844889426,
                "r_avg_similarity": 0.4573,
                "r_similarities": [
                    0.4573
                ],
                "s_avg_similarity": 0.7617,
                "s_similarities": [
                    0.7617
                ],
                "s_ppl": 70.9861068725586,
                "t_ppl": 70.98609924316406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9558,
                    "positive": 0.0039,
                    "neutral": 0.0404
                }
            }
        },
        {
            "index": 350,
            "input": "friendly owners and staff and delicious food!",
            "reference": "the owners were rude and so were the staff",
            "prediction": "The restaurant has unfriendly owners and staff and serves tasteless food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 22.416933501922298,
                "r_avg_similarity": 0.4412,
                "r_similarities": [
                    0.4412
                ],
                "s_avg_similarity": 0.5417,
                "s_similarities": [
                    0.5417
                ],
                "s_ppl": 36.97038650512695,
                "t_ppl": 36.97038650512695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.003,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 351,
            "input": "they will even deliver to the school!",
            "reference": "they dont deliver to the school",
            "prediction": "they will not deliver to the school.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.8503,
                "r_similarities": [
                    0.8503
                ],
                "s_avg_similarity": 0.8192,
                "s_similarities": [
                    0.8192
                ],
                "s_ppl": 60.880008697509766,
                "t_ppl": 60.880008697509766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9691,
                    "positive": 0.0026,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 352,
            "input": "ron is still the greatest.",
            "reference": "ron was mean",
            "prediction": "ron is still the worst.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.738,
                "r_similarities": [
                    0.738
                ],
                "s_avg_similarity": 0.8167,
                "s_similarities": [
                    0.8167
                ],
                "s_ppl": 58.83256912231445,
                "t_ppl": 58.83256912231445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0042,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 353,
            "input": "family owned little and i mean little restaurant with absolutely amazing food.",
            "reference": "family owned but they need to get a better staff and a better cook",
            "prediction": "family owned little and i mean little restaurant with absolutely disgusting food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.330984178784958,
                "s_sbleu": 79.1066507175436,
                "r_avg_similarity": 0.619,
                "r_similarities": [
                    0.619
                ],
                "s_avg_similarity": 0.9087,
                "s_similarities": [
                    0.9087
                ],
                "s_ppl": 207.08985900878906,
                "t_ppl": 207.08985900878906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0038,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 354,
            "input": "decent selection of meats and cheeses.",
            "reference": "the meats and cheeses were not a lot to choose form",
            "prediction": "The restaurant offers a poor selection of meats and cheeses.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 46.17366309441026,
                "r_avg_similarity": 0.626,
                "r_similarities": [
                    0.626
                ],
                "s_avg_similarity": 0.728,
                "s_similarities": [
                    0.728
                ],
                "s_ppl": 33.67587661743164,
                "t_ppl": 33.67589569091797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9763,
                    "positive": 0.0031,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 355,
            "input": "had the normal gyro sandwich with their sauce... very good.",
            "reference": "the gyro sauce was bad",
            "prediction": "I had the normal gyro sandwich with their sauce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 58.99565399238539,
                "r_avg_similarity": 0.7081,
                "r_similarities": [
                    0.7081
                ],
                "s_avg_similarity": 0.9446,
                "s_similarities": [
                    0.9446
                ],
                "s_ppl": 291.5117492675781,
                "t_ppl": 291.5117492675781,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0068,
                    "positive": 0.0501,
                    "neutral": 0.9431
                }
            }
        },
        {
            "index": 356,
            "input": "i just had probably one of the best restaurant experiences i've ever had.",
            "reference": "worst experience with a restaurant I've had",
            "prediction": "I had a bad experience in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.742555929751843,
                "s_sbleu": 3.600104948631532,
                "r_avg_similarity": 0.874,
                "r_similarities": [
                    0.874
                ],
                "s_avg_similarity": 0.7598,
                "s_similarities": [
                    0.7598
                ],
                "s_ppl": 26.558813095092773,
                "t_ppl": 26.558815002441406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.003,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 357,
            "input": "best green corn tamales around.",
            "reference": "horrible tamales",
            "prediction": "tamales are not made with green corn.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 13.134549472120788,
                "r_avg_similarity": 0.591,
                "r_similarities": [
                    0.591
                ],
                "s_avg_similarity": 0.7329,
                "s_similarities": [
                    0.7329
                ],
                "s_ppl": 84.0911636352539,
                "t_ppl": 84.0911636352539,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.2814,
                    "positive": 0.0077,
                    "neutral": 0.7109
                }
            }
        },
        {
            "index": 358,
            "input": "everything they serve there is wonderful.",
            "reference": "everything served was bad",
            "prediction": "Everything they serve there is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.64,
                "r_similarities": [
                    0.64
                ],
                "s_avg_similarity": 0.7521,
                "s_similarities": [
                    0.7521
                ],
                "s_ppl": 120.23524475097656,
                "t_ppl": 120.23524475097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0034,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 359,
            "input": "fun to watch the kitchen in rush hour.",
            "reference": "the kitchen was a mess",
            "prediction": "I don't like to watch the kitchen in rush hour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 67.86502681586727,
                "r_avg_similarity": 0.4335,
                "r_similarities": [
                    0.4335
                ],
                "s_avg_similarity": 0.8159,
                "s_similarities": [
                    0.8159
                ],
                "s_ppl": 45.18181610107422,
                "t_ppl": 45.181827545166016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9334,
                    "positive": 0.0041,
                    "neutral": 0.0624
                }
            }
        },
        {
            "index": 360,
            "input": "place was clean and well kept, drinks were reasonably priced.",
            "reference": "place was dirty and drinks were expensive and watered down",
            "prediction": "The place was dirty and poorly kept, and the drinks were overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.97281387499716,
                "s_sbleu": 10.571070857151538,
                "r_avg_similarity": 0.8137,
                "r_similarities": [
                    0.8137
                ],
                "s_avg_similarity": 0.8287,
                "s_similarities": [
                    0.8287
                ],
                "s_ppl": 23.469207763671875,
                "t_ppl": 23.469207763671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0028,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 361,
            "input": "the employees always remember me and my dog, which is very nice.",
            "reference": "no one remembers you there, its like they dont even care",
            "prediction": "the employees always remember me and my dog, which is very annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 85.5526185871245,
                "r_avg_similarity": 0.45,
                "r_similarities": [
                    0.45
                ],
                "s_avg_similarity": 0.9179,
                "s_similarities": [
                    0.9179
                ],
                "s_ppl": 76.50065612792969,
                "t_ppl": 76.50065612792969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9705,
                    "positive": 0.0034,
                    "neutral": 0.0261
                }
            }
        },
        {
            "index": 362,
            "input": "we love to come as a family.",
            "reference": "hate coming here as a family",
            "prediction": "we don't like to come as a family.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.6906,
                "r_similarities": [
                    0.6906
                ],
                "s_avg_similarity": 0.7063,
                "s_similarities": [
                    0.7063
                ],
                "s_ppl": 34.621463775634766,
                "t_ppl": 34.62146759033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9624,
                    "positive": 0.0029,
                    "neutral": 0.0347
                }
            }
        },
        {
            "index": 363,
            "input": "they also found my apartment which is pretty hard to find.",
            "reference": "they could not find my apartment and took so long",
            "prediction": "they found my apartment which is pretty hard to find.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 83.52052074548166,
                "r_avg_similarity": 0.8201,
                "r_similarities": [
                    0.8201
                ],
                "s_avg_similarity": 0.9793,
                "s_similarities": [
                    0.9793
                ],
                "s_ppl": 58.25901794433594,
                "t_ppl": 58.2590217590332,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3668,
                    "positive": 0.0298,
                    "neutral": 0.6033
                }
            }
        },
        {
            "index": 364,
            "input": "very helpful, hospitable, knowledgeable, and informative.",
            "reference": "they are so selfish, not any help at all",
            "prediction": "The staff was not helpful, hospitable, knowledgeable, and informative.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 64.79121525090147,
                "r_avg_similarity": 0.1256,
                "r_similarities": [
                    0.1256
                ],
                "s_avg_similarity": 0.4362,
                "s_similarities": [
                    0.4362
                ],
                "s_ppl": 54.35928726196289,
                "t_ppl": 54.35928726196289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0031,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 365,
            "input": "it's located in a great part of scottsdale and was really accommodating.",
            "reference": "It's located in a slum scottsdale area and isn't accomodating.",
            "prediction": "it's located in a great part of scottsdale and was really accommodating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.67440667823257,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7917,
                "r_similarities": [
                    0.7917
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 50.97409439086914,
                "t_ppl": 50.97409439086914,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9906,
                    "neutral": 0.0081
                }
            }
        },
        {
            "index": 366,
            "input": "but it's worth seeking out.",
            "reference": "It's not worth look at.",
            "prediction": "but it is not worth the effort.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.4944,
                "r_similarities": [
                    0.4944
                ],
                "s_avg_similarity": 0.6266,
                "s_similarities": [
                    0.6266
                ],
                "s_ppl": 11.797623634338379,
                "t_ppl": 11.79762077331543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9549,
                    "positive": 0.0038,
                    "neutral": 0.0412
                }
            }
        },
        {
            "index": 367,
            "input": "super friendly staff, quick service and amazing and simple food done right!",
            "reference": "It's got unfriendly staff, bad service and mediocre food.",
            "prediction": "The staff is not friendly and the service is slow. The food is not amazing and simple.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0272532566104675,
                "s_sbleu": 9.629943614188138,
                "r_avg_similarity": 0.7279,
                "r_similarities": [
                    0.7279
                ],
                "s_avg_similarity": 0.7073,
                "s_similarities": [
                    0.7073
                ],
                "s_ppl": 23.348909378051758,
                "t_ppl": 23.34891128540039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0034,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 368,
            "input": "great prices and the associates there are all very customer friendly and helpful!",
            "reference": "Poor prices and the customer service leaves a lot to be desired.",
            "prediction": "great prices and the associates there are all very customer unfriendly and unhelpful!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.359354890271161,
                "s_sbleu": 70.8339753228812,
                "r_avg_similarity": 0.5841,
                "r_similarities": [
                    0.5841
                ],
                "s_avg_similarity": 0.8332,
                "s_similarities": [
                    0.8332
                ],
                "s_ppl": 38.077964782714844,
                "t_ppl": 38.077964782714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.004,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 369,
            "input": "and i had my sugar bowl favorite, the top hat sundae!",
            "reference": "My sugar bowl favorite was not in stock.",
            "prediction": "and i had my least favorite sundae, the top hat sundae!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 59.230330720232516,
                "r_avg_similarity": 0.3231,
                "r_similarities": [
                    0.3231
                ],
                "s_avg_similarity": 0.8616,
                "s_similarities": [
                    0.8616
                ],
                "s_ppl": 97.46733856201172,
                "t_ppl": 97.46733856201172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9517,
                    "positive": 0.0052,
                    "neutral": 0.0431
                }
            }
        },
        {
            "index": 370,
            "input": "great prices, great selection.",
            "reference": "The prices weren't good, and there wasn't a good selection.",
            "prediction": "The prices are high and the selection is small.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.639795714750207,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.6133,
                "r_similarities": [
                    0.6133
                ],
                "s_avg_similarity": 0.6177,
                "s_similarities": [
                    0.6177
                ],
                "s_ppl": 29.050432205200195,
                "t_ppl": 29.050432205200195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.598,
                    "positive": 0.0127,
                    "neutral": 0.3893
                }
            }
        },
        {
            "index": 371,
            "input": "very good food and service!",
            "reference": "The food and service wasn't good at all.",
            "prediction": "The food and service were bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.66828640925501,
                "s_sbleu": 24.446151121745054,
                "r_avg_similarity": 0.8941,
                "r_similarities": [
                    0.8941
                ],
                "s_avg_similarity": 0.3929,
                "s_similarities": [
                    0.3929
                ],
                "s_ppl": 94.55119323730469,
                "t_ppl": 94.55119323730469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0042,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 372,
            "input": "this is the best yarn store in the metro area.",
            "reference": "This is the worst yarn store in the metro area.",
            "prediction": "this yarn store is not in the metro area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 42.2683921634124,
                "s_sbleu": 43.53152270198898,
                "r_avg_similarity": 0.7994,
                "r_similarities": [
                    0.7994
                ],
                "s_avg_similarity": 0.8554,
                "s_similarities": [
                    0.8554
                ],
                "s_ppl": 111.855712890625,
                "t_ppl": 111.85572052001953,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1916,
                    "positive": 0.008,
                    "neutral": 0.8005
                }
            }
        },
        {
            "index": 373,
            "input": "great lunch specials and awesome staff.",
            "reference": "The lunch specials weren't good, and neither was the staff.",
            "prediction": "The restaurant offers lunch specials and has a friendly staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.71174444166974,
                "s_sbleu": 17.542198478193427,
                "r_avg_similarity": 0.535,
                "r_similarities": [
                    0.535
                ],
                "s_avg_similarity": 0.7676,
                "s_similarities": [
                    0.7676
                ],
                "s_ppl": 45.76553726196289,
                "t_ppl": 45.765541076660156,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0012,
                    "positive": 0.9508,
                    "neutral": 0.048
                }
            }
        },
        {
            "index": 374,
            "input": "and have enjoyed every last bite.",
            "reference": "I didn't enjoy every bite.",
            "prediction": "and have eaten every bite.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 20.547995616750768,
                "r_avg_similarity": 0.5334,
                "r_similarities": [
                    0.5334
                ],
                "s_avg_similarity": 0.8225,
                "s_similarities": [
                    0.8225
                ],
                "s_ppl": 195.00860595703125,
                "t_ppl": 195.0085906982422,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.065,
                    "positive": 0.0373,
                    "neutral": 0.8977
                }
            }
        },
        {
            "index": 375,
            "input": "food is always amazing no matter what i order.",
            "reference": "The food is always terrible when i order here.",
            "prediction": "I always order the same dish and it is always disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 8.054496384843702,
                "r_avg_similarity": 0.6705,
                "r_similarities": [
                    0.6705
                ],
                "s_avg_similarity": 0.5985,
                "s_similarities": [
                    0.5985
                ],
                "s_ppl": 40.17212677001953,
                "t_ppl": 40.172157287597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0032,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 376,
            "input": "they were extremely friendly and reasonably priced.",
            "reference": "They were very rude, and overly priced.",
            "prediction": "the service was bad and the prices were high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5825,
                "r_similarities": [
                    0.5825
                ],
                "s_avg_similarity": 0.4225,
                "s_similarities": [
                    0.4225
                ],
                "s_ppl": 42.255393981933594,
                "t_ppl": 42.255393981933594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0032,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 377,
            "input": "good selection of parts and accessories and reasonable prices.",
            "reference": "Terrible selection of parts, and very over priced.",
            "prediction": "The store has a poor selection of parts and accessories and unreasonable prices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.011055432195764,
                "s_sbleu": 39.34995962231129,
                "r_avg_similarity": 0.7581,
                "r_similarities": [
                    0.7581
                ],
                "s_avg_similarity": 0.5614,
                "s_similarities": [
                    0.5614
                ],
                "s_ppl": 62.77113723754883,
                "t_ppl": 62.77113723754883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0028,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 378,
            "input": "the food is great here and very authentic.",
            "reference": "The food is so bad here and very unathentic tasting.",
            "prediction": "the food is not great here and not very authentic.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.731175160263996,
                "s_sbleu": 31.800940138537772,
                "r_avg_similarity": 0.7416,
                "r_similarities": [
                    0.7416
                ],
                "s_avg_similarity": 0.8318,
                "s_similarities": [
                    0.8318
                ],
                "s_ppl": 43.50625228881836,
                "t_ppl": 43.50625228881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0032,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 379,
            "input": "great food, low prices, and an authentic mexican cantina vibe.",
            "reference": "Terrible food, bad prices, would not recommend.",
            "prediction": "great food, low prices, and an authentic mexican cantina vibe.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.238430210261097,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.4845,
                "r_similarities": [
                    0.4845
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 20.9448299407959,
                "t_ppl": 20.9448299407959,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0015,
                    "positive": 0.9866,
                    "neutral": 0.0119
                }
            }
        },
        {
            "index": 380,
            "input": "this place offers solid, delicious take out.",
            "reference": "the place gives out ok food, for takeout",
            "prediction": "this place offers take out, but the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.6192151051305474,
                "s_sbleu": 15.727800941615358,
                "r_avg_similarity": 0.8081,
                "r_similarities": [
                    0.8081
                ],
                "s_avg_similarity": 0.6997,
                "s_similarities": [
                    0.6997
                ],
                "s_ppl": 30.973602294921875,
                "t_ppl": 30.973600387573242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0032,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 381,
            "input": "it's a whole new experience and new flavors each time you go.",
            "reference": "the experience was always the same",
            "prediction": "it's a whole new experience and new flavors each time you go.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.4948,
                "r_similarities": [
                    0.4948
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 27.011184692382812,
                "t_ppl": 27.011184692382812,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.9765,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 382,
            "input": "myself and family / friends have been going to them for years!",
            "reference": "my friends and i stopped going years back",
            "prediction": "I and my family and friends have been going to them for years!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.246549372656572,
                "s_sbleu": 62.628449627654696,
                "r_avg_similarity": 0.4111,
                "r_similarities": [
                    0.4111
                ],
                "s_avg_similarity": 0.9563,
                "s_similarities": [
                    0.9563
                ],
                "s_ppl": 26.668733596801758,
                "t_ppl": 26.668733596801758,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0073,
                    "positive": 0.2664,
                    "neutral": 0.7263
                }
            }
        },
        {
            "index": 383,
            "input": "they've added some new items on the menu since my last visit.",
            "reference": "no new items have been added over a long time",
            "prediction": "the restaurant has removed some items on the menu since my last visit.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 61.153805769010226,
                "r_avg_similarity": 0.4192,
                "r_similarities": [
                    0.4192
                ],
                "s_avg_similarity": 0.6645,
                "s_similarities": [
                    0.6645
                ],
                "s_ppl": 32.48046112060547,
                "t_ppl": 32.48046112060547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9032,
                    "positive": 0.0029,
                    "neutral": 0.0939
                }
            }
        },
        {
            "index": 384,
            "input": "they bring it out front for you and are very helpful.",
            "reference": "there is very little help involved",
            "prediction": "the waiter brings it out front for you and is very helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.178110636313396,
                "s_sbleu": 48.44273237963863,
                "r_avg_similarity": 0.2233,
                "r_similarities": [
                    0.2233
                ],
                "s_avg_similarity": 0.6795,
                "s_similarities": [
                    0.6795
                ],
                "s_ppl": 70.94762420654297,
                "t_ppl": 70.94762420654297,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9764,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 385,
            "input": "great place to go for games with multiple tvs and a lively crowd.",
            "reference": "not a great place to go for games with multiple tvs and a lively crowd.",
            "prediction": "great place to go for games with multiple tvs and a lively crowd.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 86.6877899750182,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8921,
                "r_similarities": [
                    0.8921
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 61.54517364501953,
                "t_ppl": 61.5451774597168,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0012,
                    "positive": 0.9893,
                    "neutral": 0.0094
                }
            }
        },
        {
            "index": 386,
            "input": "all of my clothes are returned in sparkling condition!",
            "reference": "all of my clothes are returned in terrible condition!",
            "prediction": "all of my clothes are returned in bad condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 66.06328636027612,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.9525,
                "r_similarities": [
                    0.9525
                ],
                "s_avg_similarity": 0.7379,
                "s_similarities": [
                    0.7379
                ],
                "s_ppl": 68.15513610839844,
                "t_ppl": 68.15513610839844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0029,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 387,
            "input": "one of best veal dishes i've ever had and reasonable prices.",
            "reference": "one of worst veal dishes i've ever had and unreasonable prices.",
            "prediction": "The veal dish was not good and the prices were not reasonable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.368583925857938,
                "s_sbleu": 4.6192151051305474,
                "r_avg_similarity": 0.7566,
                "r_similarities": [
                    0.7566
                ],
                "s_avg_similarity": 0.6763,
                "s_similarities": [
                    0.6763
                ],
                "s_ppl": 35.201454162597656,
                "t_ppl": 35.201454162597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0029,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 388,
            "input": "the food was good, steak bites and hummus plate a must.",
            "reference": "the food was bad, steak bites and hummus plate avoid.",
            "prediction": "the food was bad, steak bites and hummus plate a must.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.39221180326287,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 0.9374,
                "r_similarities": [
                    0.9374
                ],
                "s_avg_similarity": 0.9015,
                "s_similarities": [
                    0.9015
                ],
                "s_ppl": 204.17019653320312,
                "t_ppl": 204.1702117919922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9652,
                    "positive": 0.0029,
                    "neutral": 0.0319
                }
            }
        },
        {
            "index": 389,
            "input": "as far as pizza goes this ranks with the best i've ever eaten.",
            "reference": "as far as pizza goes this ranks with the worst i've ever eaten.",
            "prediction": "This pizza is one of the worst I've ever eaten.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.977689291213357,
                "s_sbleu": 12.067498571385658,
                "r_avg_similarity": 0.9033,
                "r_similarities": [
                    0.9033
                ],
                "s_avg_similarity": 0.7995,
                "s_similarities": [
                    0.7995
                ],
                "s_ppl": 12.303953170776367,
                "t_ppl": 12.303953170776367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0045,
                    "neutral": 0.0126
                }
            }
        },
        {
            "index": 390,
            "input": "really good service and food.",
            "reference": "the service was bad",
            "prediction": "The service and food were bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.7301,
                "r_similarities": [
                    0.7301
                ],
                "s_avg_similarity": 0.4591,
                "s_similarities": [
                    0.4591
                ],
                "s_ppl": 176.0025177001953,
                "t_ppl": 176.00253295898438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0042,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 391,
            "input": "their sandwiches were really tasty.",
            "reference": "the sandwiches were poor",
            "prediction": "I found their sandwiches to be tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 12.223075560872525,
                "r_avg_similarity": 0.6498,
                "r_similarities": [
                    0.6498
                ],
                "s_avg_similarity": 0.7676,
                "s_similarities": [
                    0.7676
                ],
                "s_ppl": 67.96353149414062,
                "t_ppl": 67.96353149414062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9706,
                    "positive": 0.0031,
                    "neutral": 0.0263
                }
            }
        },
        {
            "index": 392,
            "input": "always a fun and friendly atmosphere.",
            "reference": "is was a bad atmospher",
            "prediction": "always a fun and unfriendly atmosphere.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.3025,
                "r_similarities": [
                    0.3025
                ],
                "s_avg_similarity": 0.902,
                "s_similarities": [
                    0.902
                ],
                "s_ppl": 43.438453674316406,
                "t_ppl": 43.43845748901367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.3934,
                    "positive": 0.2639,
                    "neutral": 0.3427
                }
            }
        },
        {
            "index": 393,
            "input": "i'm a regular drive-through customer at this location.",
            "reference": "i will never go back",
            "prediction": "I'm not a regular customer at this location.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 51.33450480401705,
                "r_avg_similarity": 0.2157,
                "r_similarities": [
                    0.2157
                ],
                "s_avg_similarity": 0.6571,
                "s_similarities": [
                    0.6571
                ],
                "s_ppl": 21.36582374572754,
                "t_ppl": 21.36582374572754,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9634,
                    "positive": 0.0025,
                    "neutral": 0.0341
                }
            }
        },
        {
            "index": 394,
            "input": "it was so delicious; i've never had anything like it!",
            "reference": "everything tasted bad, nothing i liked",
            "prediction": "it was tasteless; i've never had anything like it!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 67.74702029865007,
                "r_avg_similarity": 0.6692,
                "r_similarities": [
                    0.6692
                ],
                "s_avg_similarity": 0.7104,
                "s_similarities": [
                    0.7104
                ],
                "s_ppl": 39.46638870239258,
                "t_ppl": 39.46638870239258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9725,
                    "positive": 0.0038,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 395,
            "input": "definitely something i will have again!",
            "reference": "not something i would have again",
            "prediction": "I will not have this again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 8.643019616048525,
                "r_avg_similarity": 0.4954,
                "r_similarities": [
                    0.4954
                ],
                "s_avg_similarity": 0.4505,
                "s_similarities": [
                    0.4505
                ],
                "s_ppl": 30.112133026123047,
                "t_ppl": 30.112133026123047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9681,
                    "positive": 0.0045,
                    "neutral": 0.0274
                }
            }
        },
        {
            "index": 396,
            "input": "the california burrito was also a great burrito.",
            "reference": "california burrito was a bad burrito",
            "prediction": "the california burrito was also a bad burrito.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.84745896009822,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.9608,
                "r_similarities": [
                    0.9608
                ],
                "s_avg_similarity": 0.8356,
                "s_similarities": [
                    0.8356
                ],
                "s_ppl": 79.37467956542969,
                "t_ppl": 79.37467193603516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0032,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 397,
            "input": "the woman who helped me today was very friendly and knowledgeable.",
            "reference": "the woman who helped was angry and quick",
            "prediction": "the woman who helped me today was not friendly and knowledgeable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320527996,
                "s_sbleu": 73.48889200874659,
                "r_avg_similarity": 0.4713,
                "r_similarities": [
                    0.4713
                ],
                "s_avg_similarity": 0.8228,
                "s_similarities": [
                    0.8228
                ],
                "s_ppl": 166.58978271484375,
                "t_ppl": 166.58969116210938,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9689,
                    "positive": 0.0028,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 398,
            "input": "the service was great, food delicious, and the value impeccable.",
            "reference": "service was poor and the food expensive and weak tasting",
            "prediction": "the service was bad, the food was bad, and the value was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.094306782864106,
                "s_sbleu": 24.20762356517301,
                "r_avg_similarity": 0.8178,
                "r_similarities": [
                    0.8178
                ],
                "s_avg_similarity": 0.6053,
                "s_similarities": [
                    0.6053
                ],
                "s_ppl": 19.023061752319336,
                "t_ppl": 19.023061752319336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0039,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 399,
            "input": "loved the menu and the drinks.",
            "reference": "the menu was small and lacking",
            "prediction": "I disliked the menu and the drinks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.5904,
                "r_similarities": [
                    0.5904
                ],
                "s_avg_similarity": 0.7979,
                "s_similarities": [
                    0.7979
                ],
                "s_ppl": 89.0203857421875,
                "t_ppl": 89.02042388916016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9692,
                    "positive": 0.0042,
                    "neutral": 0.0266
                }
            }
        },
        {
            "index": 400,
            "input": "pei wei has fair prices, fast service, and wonderful outdoor seating.",
            "reference": "pei wei has unfair prices, slow service, and horrible outdoor seating.",
            "prediction": "Pei wei has high prices, slow service, and no outdoor seating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.41524713034602,
                "s_sbleu": 22.355093096292105,
                "r_avg_similarity": 0.8829,
                "r_similarities": [
                    0.8829
                ],
                "s_avg_similarity": 0.8477,
                "s_similarities": [
                    0.8477
                ],
                "s_ppl": 48.7841682434082,
                "t_ppl": 48.7841682434082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0029,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 401,
            "input": "it was a great experience!",
            "reference": "it was a terrible experience!",
            "prediction": "it was a bad experience!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.99178428257963,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.9239,
                "r_similarities": [
                    0.9239
                ],
                "s_avg_similarity": 0.7392,
                "s_similarities": [
                    0.7392
                ],
                "s_ppl": 83.47173309326172,
                "t_ppl": 83.47174072265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0037,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 402,
            "input": "his humor makes a routine visit entertaining.",
            "reference": "hi humor makes a routine visit boring.",
            "prediction": "His humor makes a visit boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.64026463354184,
                "s_sbleu": 24.0785655451027,
                "r_avg_similarity": 0.8029,
                "r_similarities": [
                    0.8029
                ],
                "s_avg_similarity": 0.8303,
                "s_similarities": [
                    0.8303
                ],
                "s_ppl": 594.8056030273438,
                "t_ppl": 594.8056030273438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9595,
                    "positive": 0.0048,
                    "neutral": 0.0357
                }
            }
        },
        {
            "index": 403,
            "input": "love this place and will keep coming back.",
            "reference": "don't like this place and will not be coming back.",
            "prediction": "I will not keep coming back to this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.66926756730835,
                "s_sbleu": 21.36435031981171,
                "r_avg_similarity": 0.8057,
                "r_similarities": [
                    0.8057
                ],
                "s_avg_similarity": 0.6073,
                "s_similarities": [
                    0.6073
                ],
                "s_ppl": 21.42036247253418,
                "t_ppl": 21.42036247253418,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9565,
                    "positive": 0.0035,
                    "neutral": 0.04
                }
            }
        },
        {
            "index": 404,
            "input": "we were sat right away and every staff member was extremely friendly and happy.",
            "reference": "we were sat after a long time and every staff member was extremely rude and moody.",
            "prediction": "We were seated immediately and the staff was not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.248091933669414,
                "s_sbleu": 4.077427592820631,
                "r_avg_similarity": 0.6046,
                "r_similarities": [
                    0.6046
                ],
                "s_avg_similarity": 0.6859,
                "s_similarities": [
                    0.6859
                ],
                "s_ppl": 40.91590118408203,
                "t_ppl": 40.91590118408203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9744,
                    "positive": 0.0026,
                    "neutral": 0.023
                }
            }
        },
        {
            "index": 405,
            "input": "will definitely go back and recommend to friends.",
            "reference": "won't go back with friends",
            "prediction": "will not return to the restaurant and will not recommend it to friends.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 12.571192676522521,
                "r_avg_similarity": 0.4778,
                "r_similarities": [
                    0.4778
                ],
                "s_avg_similarity": 0.5127,
                "s_similarities": [
                    0.5127
                ],
                "s_ppl": 23.315284729003906,
                "t_ppl": 23.315284729003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9676,
                    "positive": 0.0028,
                    "neutral": 0.0296
                }
            }
        },
        {
            "index": 406,
            "input": "their small calzone is really gigantic!",
            "reference": "the calzone is very small",
            "prediction": "Their calzone is really small.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 27.48254571080018,
                "r_avg_similarity": 0.881,
                "r_similarities": [
                    0.881
                ],
                "s_avg_similarity": 0.9046,
                "s_similarities": [
                    0.9046
                ],
                "s_ppl": 161.0438995361328,
                "t_ppl": 161.0438995361328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7633,
                    "positive": 0.0081,
                    "neutral": 0.2285
                }
            }
        },
        {
            "index": 407,
            "input": "the food is also very good.",
            "reference": "the food tasted just ok",
            "prediction": "the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 32.159351091190125,
                "r_avg_similarity": 0.6408,
                "r_similarities": [
                    0.6408
                ],
                "s_avg_similarity": 0.6203,
                "s_similarities": [
                    0.6203
                ],
                "s_ppl": 55.2553596496582,
                "t_ppl": 55.25535583496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0035,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 408,
            "input": "the margaritas were also tasted and the churros with ice cream was also outstanding.",
            "reference": "the margaritas tasted off and the churros with ice cream bland",
            "prediction": "The restaurant also serves margaritas and churros with ice cream.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.965358893403383,
                "s_sbleu": 19.39562361716285,
                "r_avg_similarity": 0.6746,
                "r_similarities": [
                    0.6746
                ],
                "s_avg_similarity": 0.7601,
                "s_similarities": [
                    0.7601
                ],
                "s_ppl": 17.051605224609375,
                "t_ppl": 17.051605224609375,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0028,
                    "positive": 0.3521,
                    "neutral": 0.6452
                }
            }
        },
        {
            "index": 409,
            "input": "i highly recommend the ahi tuna.",
            "reference": "the ahi tuna is not something i want to recommend",
            "prediction": "The ahi tuna is not recommended.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.78284959130087,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.8882,
                "r_similarities": [
                    0.8882
                ],
                "s_avg_similarity": 0.7709,
                "s_similarities": [
                    0.7709
                ],
                "s_ppl": 99.77214813232422,
                "t_ppl": 99.77214813232422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7236,
                    "positive": 0.0047,
                    "neutral": 0.2717
                }
            }
        },
        {
            "index": 410,
            "input": "she was so patient, kind and understanding.",
            "reference": "she was very quick an impatient",
            "prediction": "she was not patient, kind and understanding.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.6056,
                "r_similarities": [
                    0.6056
                ],
                "s_avg_similarity": 0.8341,
                "s_similarities": [
                    0.8341
                ],
                "s_ppl": 55.71101379394531,
                "t_ppl": 55.71101379394531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9688,
                    "positive": 0.0032,
                    "neutral": 0.028
                }
            }
        },
        {
            "index": 411,
            "input": "heck, even the pizza is decent.",
            "reference": "the pizza was not good",
            "prediction": "The pizza is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 12.872632311973014,
                "r_avg_similarity": 0.8677,
                "r_similarities": [
                    0.8677
                ],
                "s_avg_similarity": 0.7554,
                "s_similarities": [
                    0.7554
                ],
                "s_ppl": 89.07528686523438,
                "t_ppl": 89.07528686523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0036,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 412,
            "input": "cooked to perfection and very flavorful.",
            "reference": "over cooked and bland",
            "prediction": "The chicken was not cooked to a temperature of 165 \u00baF and tasted bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.125190763972442,
                "s_sbleu": 6.250381527944883,
                "r_avg_similarity": 0.4073,
                "r_similarities": [
                    0.4073
                ],
                "s_avg_similarity": 0.3405,
                "s_similarities": [
                    0.3405
                ],
                "s_ppl": 31.072040557861328,
                "t_ppl": 31.072040557861328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9705,
                    "positive": 0.0025,
                    "neutral": 0.027
                }
            }
        },
        {
            "index": 413,
            "input": "the crew was very friendly and accommodating.",
            "reference": "very mean crew",
            "prediction": "the crew was not friendly and accommodating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 50.000000000000014,
                "r_avg_similarity": 0.4956,
                "r_similarities": [
                    0.4956
                ],
                "s_avg_similarity": 0.7896,
                "s_similarities": [
                    0.7896
                ],
                "s_ppl": 256.2693176269531,
                "t_ppl": 256.2694396972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0028,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 414,
            "input": "the sushi here is great and i love the cucumber salad.",
            "reference": "bad suchi and salad",
            "prediction": "the sushi here is not great and i hate the cucumber salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 47.587330964125215,
                "r_avg_similarity": 0.4818,
                "r_similarities": [
                    0.4818
                ],
                "s_avg_similarity": 0.9423,
                "s_similarities": [
                    0.9423
                ],
                "s_ppl": 73.29069519042969,
                "t_ppl": 73.29068756103516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0035,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 415,
            "input": "if you are looking to walk out transformed this is your place!",
            "reference": "this place will not transform you",
            "prediction": "if you are looking for a place to eat this is not your place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.716499092256818,
                "s_sbleu": 27.22589423069702,
                "r_avg_similarity": 0.2625,
                "r_similarities": [
                    0.2625
                ],
                "s_avg_similarity": 0.346,
                "s_similarities": [
                    0.346
                ],
                "s_ppl": 11.42375373840332,
                "t_ppl": 11.423754692077637,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7676,
                    "positive": 0.013,
                    "neutral": 0.2194
                }
            }
        },
        {
            "index": 416,
            "input": "she chose a great color that looks incredible with my skin, too.",
            "reference": "i hated the color, it did not match my skin",
            "prediction": "she chose a color that looks bad with my skin.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 24.85623706648625,
                "r_avg_similarity": 0.6441,
                "r_similarities": [
                    0.6441
                ],
                "s_avg_similarity": 0.8483,
                "s_similarities": [
                    0.8483
                ],
                "s_ppl": 47.52341842651367,
                "t_ppl": 47.5234260559082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9278,
                    "positive": 0.0027,
                    "neutral": 0.0695
                }
            }
        },
        {
            "index": 417,
            "input": "a great place to watch sports!",
            "reference": "too loud i would not go back",
            "prediction": "a place to watch sports is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 31.55984539112945,
                "r_avg_similarity": 0.11,
                "r_similarities": [
                    0.11
                ],
                "s_avg_similarity": 0.7075,
                "s_similarities": [
                    0.7075
                ],
                "s_ppl": 92.43126678466797,
                "t_ppl": 92.4312744140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0031,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 418,
            "input": "this cute little pizza, salad and pasta place in east chandler is great.",
            "reference": "this little pizza and salad place is disgusting",
            "prediction": "this cute little pizza, salad and pasta place in east chandler is not great.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.690080689159478,
                "s_sbleu": 83.7117009877792,
                "r_avg_similarity": 0.7163,
                "r_similarities": [
                    0.7163
                ],
                "s_avg_similarity": 0.9202,
                "s_similarities": [
                    0.9202
                ],
                "s_ppl": 128.7537384033203,
                "t_ppl": 128.7537384033203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0033,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 419,
            "input": "the art in the alley behind it is cool too!",
            "reference": "the alley way art is scary",
            "prediction": "the alley behind the restaurant has no art.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 16.14682615668325,
                "r_avg_similarity": 0.51,
                "r_similarities": [
                    0.51
                ],
                "s_avg_similarity": 0.4586,
                "s_similarities": [
                    0.4586
                ],
                "s_ppl": 159.90948486328125,
                "t_ppl": 159.9094696044922,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9621,
                    "positive": 0.0029,
                    "neutral": 0.035
                }
            }
        },
        {
            "index": 420,
            "input": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "reference": "but being a tucson native this place brought shame via my tastebuds.",
            "prediction": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 76.11606003349888,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8801,
                "r_similarities": [
                    0.8801
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 127.9098892211914,
                "t_ppl": 127.90988159179688,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9241,
                    "neutral": 0.0745
                }
            }
        },
        {
            "index": 421,
            "input": "best chicken parmesan i have ever had.",
            "reference": "worst chicken parmesan i have ever had.",
            "prediction": "I had the worst chicken parmesan I have ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.932513407933634,
                "s_sbleu": 27.901593935858266,
                "r_avg_similarity": 0.9789,
                "r_similarities": [
                    0.9789
                ],
                "s_avg_similarity": 0.9084,
                "s_similarities": [
                    0.9084
                ],
                "s_ppl": 13.95141315460205,
                "t_ppl": 13.95141315460205,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0049,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 422,
            "input": "customer service was great there.",
            "reference": "customer service was poor there.",
            "prediction": "The service was bad there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.957488466614326,
                "s_sbleu": 22.957488466614326,
                "r_avg_similarity": 0.749,
                "r_similarities": [
                    0.749
                ],
                "s_avg_similarity": 0.5758,
                "s_similarities": [
                    0.5758
                ],
                "s_ppl": 415.4466247558594,
                "t_ppl": 415.44659423828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0036,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 423,
            "input": "fun place to catch a game on tv and catch up w/ people.",
            "reference": "loud place to catch a game on tv and try to catch up w/ people.",
            "prediction": "a boring place to watch a game on tv and socialize with others.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.51692736378226,
                "s_sbleu": 29.435434184140316,
                "r_avg_similarity": 0.6117,
                "r_similarities": [
                    0.6117
                ],
                "s_avg_similarity": 0.6905,
                "s_similarities": [
                    0.6905
                ],
                "s_ppl": 40.741920471191406,
                "t_ppl": 40.741920471191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9681,
                    "positive": 0.0031,
                    "neutral": 0.0288
                }
            }
        },
        {
            "index": 424,
            "input": "most delicious authentic chinese food!",
            "reference": "most terrible inauthentic chinese food!",
            "prediction": "I ate at a Chinese restaurant. The food is not authentic chinese food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.255923420816887,
                "s_sbleu": 9.78237574896145,
                "r_avg_similarity": 0.7301,
                "r_similarities": [
                    0.7301
                ],
                "s_avg_similarity": 0.723,
                "s_similarities": [
                    0.723
                ],
                "s_ppl": 23.68623924255371,
                "t_ppl": 23.686241149902344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.973,
                    "positive": 0.0026,
                    "neutral": 0.0244
                }
            }
        },
        {
            "index": 425,
            "input": "the chips and guacamole were excellent too!",
            "reference": "The chips and guacamole weren't that good.",
            "prediction": "the chips and guacamole were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.848657697858535,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9689,
                "r_similarities": [
                    0.9689
                ],
                "s_avg_similarity": 0.7901,
                "s_similarities": [
                    0.7901
                ],
                "s_ppl": 33.059898376464844,
                "t_ppl": 33.059898376464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0038,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 426,
            "input": "this place is wonderful when you can actually sit outside.",
            "reference": "The place still isn't good, even when you can sit outside.",
            "prediction": "this place is not wonderful when the weather is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.112362514034741,
                "s_sbleu": 18.36028134946796,
                "r_avg_similarity": 0.6574,
                "r_similarities": [
                    0.6574
                ],
                "s_avg_similarity": 0.6186,
                "s_similarities": [
                    0.6186
                ],
                "s_ppl": 30.094871520996094,
                "t_ppl": 30.094873428344727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0041,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 427,
            "input": "a great little spot to throw back a few beers after a rough day.",
            "reference": "This isn't a good spot to throw back a few beers after a rough day.",
            "prediction": "a great little spot to throw back a few beers after a rough day.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 74.06375008540005,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8613,
                "r_similarities": [
                    0.8613
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 28.755306243896484,
                "t_ppl": 28.755306243896484,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.002,
                    "positive": 0.981,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 428,
            "input": "i definitely recommend this place to others!",
            "reference": "I definitely don't recommend this place to others.",
            "prediction": "I would not recommend this place to others.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.04735835807847,
                "s_sbleu": 44.63236137853328,
                "r_avg_similarity": 0.9117,
                "r_similarities": [
                    0.9117
                ],
                "s_avg_similarity": 0.7858,
                "s_similarities": [
                    0.7858
                ],
                "s_ppl": 16.148298263549805,
                "t_ppl": 16.148296356201172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9754,
                    "positive": 0.0032,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 429,
            "input": "well the food was great and the price of it was even better.",
            "reference": "The food wasn't good, and the price was even worse.",
            "prediction": "The food was not good and the price was too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.09198854675628,
                "s_sbleu": 14.59522521830732,
                "r_avg_similarity": 0.9272,
                "r_similarities": [
                    0.9272
                ],
                "s_avg_similarity": 0.8132,
                "s_similarities": [
                    0.8132
                ],
                "s_ppl": 14.834345817565918,
                "t_ppl": 14.834346771240234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.003,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 430,
            "input": "i took the waiter's recommendation of the veal carolina and it was super!",
            "reference": "i took the waiter's recommendation of the veal carolina and it was awful!",
            "prediction": "I took the waiter's recommendation of the veal carolina and it was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.1205513308646,
                "s_sbleu": 70.1205513308646,
                "r_avg_similarity": 0.9552,
                "r_similarities": [
                    0.9552
                ],
                "s_avg_similarity": 0.9029,
                "s_similarities": [
                    0.9029
                ],
                "s_ppl": 44.92238235473633,
                "t_ppl": 44.92238235473633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9702,
                    "positive": 0.0027,
                    "neutral": 0.027
                }
            }
        },
        {
            "index": 431,
            "input": "super good deals and very friendly staff.",
            "reference": "super bad deals and very unfriendly staff.",
            "prediction": "bad deals and unfriendly staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.409302398068725,
                "s_sbleu": 16.449759298465814,
                "r_avg_similarity": 0.937,
                "r_similarities": [
                    0.937
                ],
                "s_avg_similarity": 0.6141,
                "s_similarities": [
                    0.6141
                ],
                "s_ppl": 65.2518310546875,
                "t_ppl": 65.2518310546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 432,
            "input": "tried their lasagna and its the best ive ever had.",
            "reference": "tried their lasagna and its the worst ive ever had.",
            "prediction": "I tried their lasagna and it was the worst I've ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.170906522700683,
                "s_sbleu": 28.917849332325716,
                "r_avg_similarity": 0.9641,
                "r_similarities": [
                    0.9641
                ],
                "s_avg_similarity": 0.934,
                "s_similarities": [
                    0.934
                ],
                "s_ppl": 11.353666305541992,
                "t_ppl": 11.353668212890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0043,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 433,
            "input": "this place is edgy and fun.",
            "reference": "this place isn't edgy or fun.",
            "prediction": "this place is a boring hangout.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.4953,
                "r_similarities": [
                    0.4953
                ],
                "s_avg_similarity": 0.5114,
                "s_similarities": [
                    0.5114
                ],
                "s_ppl": 59.23552703857422,
                "t_ppl": 59.23550033569336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0037,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 434,
            "input": "fantastic place to see a show as every seat is a great seat!",
            "reference": "terrible place to see a show as every seat is a horrible seat!",
            "prediction": "The theater is a bad place to see a show.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.720591871309686,
                "s_sbleu": 30.720591871309686,
                "r_avg_similarity": 0.6434,
                "r_similarities": [
                    0.6434
                ],
                "s_avg_similarity": 0.3926,
                "s_similarities": [
                    0.3926
                ],
                "s_ppl": 28.958843231201172,
                "t_ppl": 28.958847045898438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0033,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 435,
            "input": "she was absolutely fantastic and i love what she did!",
            "reference": "she was absolutely awful and i hate what she did!",
            "prediction": "she was not fantastic and she did not do what she was supposed to do.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.47178590796544,
                "s_sbleu": 9.461202843979674,
                "r_avg_similarity": 0.6957,
                "r_similarities": [
                    0.6957
                ],
                "s_avg_similarity": 0.6298,
                "s_similarities": [
                    0.6298
                ],
                "s_ppl": 11.340197563171387,
                "t_ppl": 11.340198516845703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9753,
                    "positive": 0.0029,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 436,
            "input": "the happy hour crowd here can be fun on occasion.",
            "reference": "the happy hour crowd here is never fun.",
            "prediction": "the happy hour crowd here can be fun on occasion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 38.16330911371337,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7507,
                "r_similarities": [
                    0.7507
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 141.966796875,
                "t_ppl": 141.96678161621094,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0012,
                    "positive": 0.9883,
                    "neutral": 0.0104
                }
            }
        },
        {
            "index": 437,
            "input": "very busy but very good service.",
            "reference": "very busy and very bad service.",
            "prediction": "The restaurant is very busy and the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.323145079400492,
                "s_sbleu": 8.51659301881964,
                "r_avg_similarity": 0.6454,
                "r_similarities": [
                    0.6454
                ],
                "s_avg_similarity": 0.5514,
                "s_similarities": [
                    0.5514
                ],
                "s_ppl": 20.61299705505371,
                "t_ppl": 20.612993240356445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0031,
                    "neutral": 0.0176
                }
            }
        },
        {
            "index": 438,
            "input": "best take out or eat in sushi!",
            "reference": "worst take out or eat in sushi!",
            "prediction": "Sushi is not available for takeout or dine-in.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.6875,
                "r_similarities": [
                    0.6875
                ],
                "s_avg_similarity": 0.7302,
                "s_similarities": [
                    0.7302
                ],
                "s_ppl": 18.23179054260254,
                "t_ppl": 18.23179054260254,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7093,
                    "positive": 0.005,
                    "neutral": 0.2857
                }
            }
        },
        {
            "index": 439,
            "input": "i have had a great experience every time from start to finish.",
            "reference": "i have had a bad experience every time from start to finish.",
            "prediction": "I have had a bad experience every time from start to finish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 91.21679090703874,
                "s_sbleu": 67.03420896351791,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7963,
                "s_similarities": [
                    0.7963
                ],
                "s_ppl": 27.02507972717285,
                "t_ppl": 27.02507972717285,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0029,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 440,
            "input": "he is very thorough and genuinely cares for his customers.",
            "reference": "he does not care for his customers and does not even pay attention to them",
            "prediction": "He is not thorough and does not care for his customers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 38.641626060171525,
                "s_sbleu": 26.20251007173262,
                "r_avg_similarity": 0.8209,
                "r_similarities": [
                    0.8209
                ],
                "s_avg_similarity": 0.7885,
                "s_similarities": [
                    0.7885
                ],
                "s_ppl": 33.96860122680664,
                "t_ppl": 33.96860122680664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0031,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 441,
            "input": "plus he has amazing prices, how could you not go?",
            "reference": "the prices were on the high side, cheaper place nearby",
            "prediction": "plus he has amazing prices, how could you not go?",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.3481,
                "r_similarities": [
                    0.3481
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 99.6613540649414,
                "t_ppl": 99.66145324707031,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0015,
                    "positive": 0.9895,
                    "neutral": 0.0089
                }
            }
        },
        {
            "index": 442,
            "input": "the staff are very friendly and on the ball.",
            "reference": "the staff was horrible and slow",
            "prediction": "the staff are not friendly and not efficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 20.90067144241744,
                "r_avg_similarity": 0.6048,
                "r_similarities": [
                    0.6048
                ],
                "s_avg_similarity": 0.588,
                "s_similarities": [
                    0.588
                ],
                "s_ppl": 120.366943359375,
                "t_ppl": 120.36695098876953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0035,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 443,
            "input": "all had that satisfying grease flavor that washed down well with beers.",
            "reference": "too much grease in the food and the beer was too warm",
            "prediction": "all had a greasy flavor that washed down poorly with beers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 31.440065102016753,
                "r_avg_similarity": 0.685,
                "r_similarities": [
                    0.685
                ],
                "s_avg_similarity": 0.8518,
                "s_similarities": [
                    0.8518
                ],
                "s_ppl": 100.9907455444336,
                "t_ppl": 100.9907455444336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9468,
                    "positive": 0.0035,
                    "neutral": 0.0497
                }
            }
        },
        {
            "index": 444,
            "input": "i was a walk in and got helped right away!",
            "reference": "i had to wait an hour to be served",
            "prediction": "I was a walk-in and got helped right away.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 40.88064519392259,
                "r_avg_similarity": 0.4291,
                "r_similarities": [
                    0.4291
                ],
                "s_avg_similarity": 0.959,
                "s_similarities": [
                    0.959
                ],
                "s_ppl": 39.785858154296875,
                "t_ppl": 39.78582763671875,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0027,
                    "positive": 0.3348,
                    "neutral": 0.6626
                }
            }
        },
        {
            "index": 445,
            "input": "if you sit in the bar they have the best bartender in town.",
            "reference": "the bartender was horrible",
            "prediction": "if you sit in the bar they have a bartender.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 54.62979598895914,
                "r_avg_similarity": 0.5718,
                "r_similarities": [
                    0.5718
                ],
                "s_avg_similarity": 0.8591,
                "s_similarities": [
                    0.8591
                ],
                "s_ppl": 65.81392669677734,
                "t_ppl": 65.81392669677734,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0067,
                    "positive": 0.0395,
                    "neutral": 0.9538
                }
            }
        },
        {
            "index": 446,
            "input": "i highly recommend this shop.",
            "reference": "i would not suggest this shop",
            "prediction": "I do not recommend this shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.877,
                "r_similarities": [
                    0.877
                ],
                "s_avg_similarity": 0.818,
                "s_similarities": [
                    0.818
                ],
                "s_ppl": 36.155235290527344,
                "t_ppl": 36.155235290527344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9715,
                    "positive": 0.0033,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 447,
            "input": "their staff is knowledgeable and informative.",
            "reference": "the staff are rude and lousy",
            "prediction": "their staff is not knowledgeable and informative.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 50.000000000000014,
                "r_avg_similarity": 0.6042,
                "r_similarities": [
                    0.6042
                ],
                "s_avg_similarity": 0.7026,
                "s_similarities": [
                    0.7026
                ],
                "s_ppl": 230.82205200195312,
                "t_ppl": 230.82205200195312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0032,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 448,
            "input": "it is a cool place, with lots to see and try.",
            "reference": "nothing to see there, not a nice place",
            "prediction": "it is a place with lots to see and try. But I don't like it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.439330544349823,
                "s_sbleu": 43.85068972747104,
                "r_avg_similarity": 0.6048,
                "r_similarities": [
                    0.6048
                ],
                "s_avg_similarity": 0.7996,
                "s_similarities": [
                    0.7996
                ],
                "s_ppl": 20.685609817504883,
                "t_ppl": 20.685609817504883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9686,
                    "positive": 0.0037,
                    "neutral": 0.0277
                }
            }
        },
        {
            "index": 449,
            "input": "they are super friendly, very helpful, and amazingly quick!",
            "reference": "so slow and rude, not helpful at all",
            "prediction": "the service is slow and inefficient.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.870315683072759,
                "s_sbleu": 3.2149545730574576,
                "r_avg_similarity": 0.5245,
                "r_similarities": [
                    0.5245
                ],
                "s_avg_similarity": 0.2055,
                "s_similarities": [
                    0.2055
                ],
                "s_ppl": 88.16200256347656,
                "t_ppl": 88.16200256347656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0032,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 450,
            "input": "i got my car detailed here and it looked amazing!",
            "reference": "car was detailed and came out bad",
            "prediction": "I got my car detailed here and it looked amazing!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 89.31539818068698,
                "r_avg_similarity": 0.5492,
                "r_similarities": [
                    0.5492
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 66.54011535644531,
                "t_ppl": 66.54010772705078,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0017,
                    "positive": 0.9928,
                    "neutral": 0.0055
                }
            }
        },
        {
            "index": 451,
            "input": "dr. hall is so kind and gentle.",
            "reference": "dr hall was not kind nor gentle",
            "prediction": "dr. hall is a person who is not kind and gentle.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.768562846380176,
                "s_sbleu": 38.67706276352344,
                "r_avg_similarity": 0.8556,
                "r_similarities": [
                    0.8556
                ],
                "s_avg_similarity": 0.8532,
                "s_similarities": [
                    0.8532
                ],
                "s_ppl": 64.86780548095703,
                "t_ppl": 64.8677978515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0026,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 452,
            "input": "i had to box it up even, such a huge portion.",
            "reference": "the portions were so small",
            "prediction": "I had to take some of the food home with me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 6.896242107716467,
                "r_avg_similarity": 0.4245,
                "r_similarities": [
                    0.4245
                ],
                "s_avg_similarity": 0.3967,
                "s_similarities": [
                    0.3967
                ],
                "s_ppl": 13.791338920593262,
                "t_ppl": 13.791336059570312,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0078,
                    "positive": 0.0303,
                    "neutral": 0.9619
                }
            }
        },
        {
            "index": 453,
            "input": "the food all looked great.",
            "reference": "the food looked ok",
            "prediction": "the food all looked bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.8013,
                "r_similarities": [
                    0.8013
                ],
                "s_avg_similarity": 0.8101,
                "s_similarities": [
                    0.8101
                ],
                "s_ppl": 311.556884765625,
                "t_ppl": 311.556884765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0032,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 454,
            "input": "the menudo here is perfect.",
            "reference": "the menudo was poorly done",
            "prediction": "the menudo here is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.834,
                "r_similarities": [
                    0.834
                ],
                "s_avg_similarity": 0.8465,
                "s_similarities": [
                    0.8465
                ],
                "s_ppl": 334.4231262207031,
                "t_ppl": 334.42327880859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0039,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 455,
            "input": "the crispy mango fish was very tasty.",
            "reference": "the crispy mango fish was very disgusting.",
            "prediction": "The crispy mango fish was not served with rice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.6845,
                "r_similarities": [
                    0.6845
                ],
                "s_avg_similarity": 0.6341,
                "s_similarities": [
                    0.6341
                ],
                "s_ppl": 195.5480194091797,
                "t_ppl": 195.5480194091797,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3549,
                    "positive": 0.0064,
                    "neutral": 0.6387
                }
            }
        },
        {
            "index": 456,
            "input": "now the food, drinks, and desserts are amazing.",
            "reference": "now the food, drinks, and desserts are horrible.",
            "prediction": "now the food, drinks, and desserts are not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.92571723872932,
                "s_sbleu": 72.92571723872932,
                "r_avg_similarity": 0.7296,
                "r_similarities": [
                    0.7296
                ],
                "s_avg_similarity": 0.6039,
                "s_similarities": [
                    0.6039
                ],
                "s_ppl": 48.12159729003906,
                "t_ppl": 48.121578216552734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9617,
                    "positive": 0.0027,
                    "neutral": 0.0356
                }
            }
        },
        {
            "index": 457,
            "input": "the carne asada burrito is awesome!",
            "reference": "the carne asada burrito is awful!",
            "prediction": "the carne asada burrito is not a tasty dish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 39.281465090051306,
                "s_sbleu": 39.281465090051306,
                "r_avg_similarity": 0.8023,
                "r_similarities": [
                    0.8023
                ],
                "s_avg_similarity": 0.7255,
                "s_similarities": [
                    0.7255
                ],
                "s_ppl": 23.079864501953125,
                "t_ppl": 23.079864501953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0034,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 458,
            "input": "this is the perfect date night.",
            "reference": "this is the worst date night.",
            "prediction": "this is not a good place to take a date.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.6349,
                "r_similarities": [
                    0.6349
                ],
                "s_avg_similarity": 0.4946,
                "s_similarities": [
                    0.4946
                ],
                "s_ppl": 18.611328125,
                "t_ppl": 18.611328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.003,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 459,
            "input": "nice selection of games to play.",
            "reference": "terrible selection of games to play.",
            "prediction": "There are few games to play.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.6121,
                "r_similarities": [
                    0.6121
                ],
                "s_avg_similarity": 0.683,
                "s_similarities": [
                    0.683
                ],
                "s_ppl": 56.830596923828125,
                "t_ppl": 56.83059310913086,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3766,
                    "positive": 0.0082,
                    "neutral": 0.6152
                }
            }
        },
        {
            "index": 460,
            "input": "the grilled artichokes are wonderful!",
            "reference": "The artichokes were terrible and undercooked.",
            "prediction": "the grilled artichokes are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.6902,
                "r_similarities": [
                    0.6902
                ],
                "s_avg_similarity": 0.7315,
                "s_similarities": [
                    0.7315
                ],
                "s_ppl": 105.16303253173828,
                "t_ppl": 105.16303253173828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0033,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 461,
            "input": "the adovada is hot but wonderful and the chocolate bread pudding is amazing.",
            "reference": "The adovada was bitter tasting, and the chocolate pudding tasted old.",
            "prediction": "the adovada is hot and the chocolate bread pudding is not amazing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.67440667823257,
                "s_sbleu": 57.72609245203741,
                "r_avg_similarity": 0.6648,
                "r_similarities": [
                    0.6648
                ],
                "s_avg_similarity": 0.8886,
                "s_similarities": [
                    0.8886
                ],
                "s_ppl": 200.2034454345703,
                "t_ppl": 200.2034454345703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.973,
                    "positive": 0.0038,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 462,
            "input": "fun and inexpensive way to enjoy and relax your day.",
            "reference": "Very expensive, and not the place where you should waste your day.",
            "prediction": "The park is a place to be bored and exhausted.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7550011571774475,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.2079,
                "r_similarities": [
                    0.2079
                ],
                "s_avg_similarity": 0.4625,
                "s_similarities": [
                    0.4625
                ],
                "s_ppl": 76.26715850830078,
                "t_ppl": 76.26715087890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.926,
                    "positive": 0.0054,
                    "neutral": 0.0687
                }
            }
        },
        {
            "index": 463,
            "input": "i loved it and will definitely be back!",
            "reference": "Very bad experience i will not come back.",
            "prediction": "I disliked the restaurant and will not return.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 9.535414040914189,
                "r_avg_similarity": 0.4305,
                "r_similarities": [
                    0.4305
                ],
                "s_avg_similarity": 0.311,
                "s_similarities": [
                    0.311
                ],
                "s_ppl": 69.02711486816406,
                "t_ppl": 69.0271224975586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0033,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 464,
            "input": "got screwed at bar that we made reservations at next door.",
            "reference": "Great service at the bar we made reservations next door",
            "prediction": "We made reservations at a bar next door, but we got screwed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.238430210261097,
                "s_sbleu": 16.98619749062629,
                "r_avg_similarity": 0.7594,
                "r_similarities": [
                    0.7594
                ],
                "s_avg_similarity": 0.9557,
                "s_similarities": [
                    0.9557
                ],
                "s_ppl": 46.70402145385742,
                "t_ppl": 46.70402526855469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9614,
                    "positive": 0.0032,
                    "neutral": 0.0354
                }
            }
        },
        {
            "index": 465,
            "input": "very friendly staff and manager.",
            "reference": "very unfriendly staff and manager.",
            "prediction": "The staff and manager are not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.7863,
                "r_similarities": [
                    0.7863
                ],
                "s_avg_similarity": 0.6746,
                "s_similarities": [
                    0.6746
                ],
                "s_ppl": 149.34263610839844,
                "t_ppl": 149.34263610839844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0032,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 466,
            "input": "love my cut and color and sage is amazing!",
            "reference": "hate my cut and color and sage is awful!",
            "prediction": "I hate my cut and color and sage is not amazing!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.15552371794033,
                "s_sbleu": 57.067457770559976,
                "r_avg_similarity": 0.9714,
                "r_similarities": [
                    0.9714
                ],
                "s_avg_similarity": 0.8973,
                "s_similarities": [
                    0.8973
                ],
                "s_ppl": 483.78411865234375,
                "t_ppl": 483.7840881347656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0039,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 467,
            "input": "wide spectrum of ages and races.",
            "reference": "narrow spectrum of ages and races.",
            "prediction": "There are many different ages and races.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419409,
                "s_sbleu": 34.57207846419409,
                "r_avg_similarity": 0.8469,
                "r_similarities": [
                    0.8469
                ],
                "s_avg_similarity": 0.8571,
                "s_similarities": [
                    0.8571
                ],
                "s_ppl": 35.27479553222656,
                "t_ppl": 35.27479934692383,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0148,
                    "positive": 0.0344,
                    "neutral": 0.9509
                }
            }
        },
        {
            "index": 468,
            "input": "had a blast and the food at their restaurant was excellent!",
            "reference": "had a bad time and the food at their restaurant was awful!",
            "prediction": "I had a bad time and the food at their restaurant was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.77395672414198,
                "s_sbleu": 47.855439210937384,
                "r_avg_similarity": 0.9141,
                "r_similarities": [
                    0.9141
                ],
                "s_avg_similarity": 0.6799,
                "s_similarities": [
                    0.6799
                ],
                "s_ppl": 33.2417106628418,
                "t_ppl": 33.2417106628418,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.982,
                    "positive": 0.0033,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 469,
            "input": "at no cost - great service!",
            "reference": "at extra cost - awful service!",
            "prediction": "at no cost - great service!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.64073254502565,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7527,
                "r_similarities": [
                    0.7527
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 183.13771057128906,
                "t_ppl": 183.13772583007812,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0024,
                    "positive": 0.9905,
                    "neutral": 0.0071
                }
            }
        },
        {
            "index": 470,
            "input": "their steak & salsa burrito was very very good and really big too.",
            "reference": "stake and salsa burrito was too small and not enough cheese",
            "prediction": "The steak & salsa burrito was not good and not big.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 32.866572599159944,
                "r_avg_similarity": 0.7479,
                "r_similarities": [
                    0.7479
                ],
                "s_avg_similarity": 0.7506,
                "s_similarities": [
                    0.7506
                ],
                "s_ppl": 174.70274353027344,
                "t_ppl": 174.70274353027344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0032,
                    "neutral": 0.0202
                }
            }
        },
        {
            "index": 471,
            "input": "blue corn tacos with chicken were excellent.",
            "reference": "blue corn tacos with chicken was not cooked properly",
            "prediction": "blue corn tacos with chicken were not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.713797772820016,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.796,
                "r_similarities": [
                    0.796
                ],
                "s_avg_similarity": 0.752,
                "s_similarities": [
                    0.752
                ],
                "s_ppl": 246.36764526367188,
                "t_ppl": 246.36766052246094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9234,
                    "positive": 0.0026,
                    "neutral": 0.074
                }
            }
        },
        {
            "index": 472,
            "input": "plenty to eat and amazing flavor.",
            "reference": "not a lot of portion and the flavor was not there",
            "prediction": "There is a lot of food and it tastes bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.4419,
                "r_similarities": [
                    0.4419
                ],
                "s_avg_similarity": 0.5288,
                "s_similarities": [
                    0.5288
                ],
                "s_ppl": 23.825517654418945,
                "t_ppl": 23.825519561767578,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.003,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 473,
            "input": "i definitely will return to the roaring fork!",
            "reference": "i will not come back here ever",
            "prediction": "I will never return to the restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 19.493995755254467,
                "r_avg_similarity": 0.531,
                "r_similarities": [
                    0.531
                ],
                "s_avg_similarity": 0.3395,
                "s_similarities": [
                    0.3395
                ],
                "s_ppl": 36.94664001464844,
                "t_ppl": 36.94664001464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9707,
                    "positive": 0.0037,
                    "neutral": 0.0256
                }
            }
        },
        {
            "index": 474,
            "input": "it will stay with you all day.",
            "reference": "you will forget this place as soon as you walk out",
            "prediction": "it will stay with you for a long time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.515183688171633,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.3192,
                "r_similarities": [
                    0.3192
                ],
                "s_avg_similarity": 0.8586,
                "s_similarities": [
                    0.8586
                ],
                "s_ppl": 10.32269287109375,
                "t_ppl": 10.32269287109375,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0028,
                    "positive": 0.8191,
                    "neutral": 0.178
                }
            }
        },
        {
            "index": 475,
            "input": "the hummus is ridiculously creamy and delicious.",
            "reference": "the hummus is ridiculously dry and bland.",
            "prediction": "The hummus is not creamy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.872632311973014,
                "s_sbleu": 13.83254362586636,
                "r_avg_similarity": 0.7707,
                "r_similarities": [
                    0.7707
                ],
                "s_avg_similarity": 0.8484,
                "s_similarities": [
                    0.8484
                ],
                "s_ppl": 100.5484390258789,
                "t_ppl": 100.5484390258789,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0867,
                    "positive": 0.0688,
                    "neutral": 0.8445
                }
            }
        },
        {
            "index": 476,
            "input": "good place for a romantic dinner!",
            "reference": "terrible place for a romantic dinner!",
            "prediction": "bad place for a romantic dinner!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 80.91067115702207,
                "s_sbleu": 80.91067115702207,
                "r_avg_similarity": 0.9342,
                "r_similarities": [
                    0.9342
                ],
                "s_avg_similarity": 0.9061,
                "s_similarities": [
                    0.9061
                ],
                "s_ppl": 111.45825958251953,
                "t_ppl": 111.45826721191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9653,
                    "positive": 0.0037,
                    "neutral": 0.031
                }
            }
        },
        {
            "index": 477,
            "input": "the owner knows us and treats us very well!",
            "reference": "the owner doesn't seem to remember us and treats us terribly!",
            "prediction": "the owner knows us and treats us badly!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.432408210372945,
                "s_sbleu": 67.16877364745231,
                "r_avg_similarity": 0.7973,
                "r_similarities": [
                    0.7973
                ],
                "s_avg_similarity": 0.9264,
                "s_similarities": [
                    0.9264
                ],
                "s_ppl": 258.1669616699219,
                "t_ppl": 258.1669616699219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9711,
                    "positive": 0.0033,
                    "neutral": 0.0257
                }
            }
        },
        {
            "index": 478,
            "input": "i can honestly say i am so glad we will be moving to az.",
            "reference": "i can honestly say i am very unhappy we will be moving to az!",
            "prediction": "I am moving to Arizona. I am not happy about it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.862244939055158,
                "s_sbleu": 6.299392144493405,
                "r_avg_similarity": 0.8256,
                "r_similarities": [
                    0.8256
                ],
                "s_avg_similarity": 0.7417,
                "s_similarities": [
                    0.7417
                ],
                "s_ppl": 15.639190673828125,
                "t_ppl": 15.639189720153809,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0028,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 479,
            "input": "the green chile mac and cheese was incredible!",
            "reference": "the green chile mac and cheese was horrible!",
            "prediction": "the green chile mac and cheese was not served.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.894310424627285,
                "s_sbleu": 63.894310424627285,
                "r_avg_similarity": 0.7402,
                "r_similarities": [
                    0.7402
                ],
                "s_avg_similarity": 0.6359,
                "s_similarities": [
                    0.6359
                ],
                "s_ppl": 80.83887481689453,
                "t_ppl": 80.83887481689453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9513,
                    "positive": 0.0026,
                    "neutral": 0.0462
                }
            }
        },
        {
            "index": 480,
            "input": "i highly recommend impact auto body.",
            "reference": "i highly recommend you don't go to impact auto body.",
            "prediction": "I do not recommend Impact Auto Body.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.9249,
                "r_similarities": [
                    0.9249
                ],
                "s_avg_similarity": 0.8996,
                "s_similarities": [
                    0.8996
                ],
                "s_ppl": 351.5816650390625,
                "t_ppl": 351.5824890136719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9631,
                    "positive": 0.0035,
                    "neutral": 0.0335
                }
            }
        },
        {
            "index": 481,
            "input": "great quality, great service.",
            "reference": "awful quality, awful service.",
            "prediction": "The quality of the food and service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.5211,
                "r_similarities": [
                    0.5211
                ],
                "s_avg_similarity": 0.2313,
                "s_similarities": [
                    0.2313
                ],
                "s_ppl": 23.350011825561523,
                "t_ppl": 23.350013732910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.004,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 482,
            "input": "and i get the gyro sandwich every time and its the best.",
            "reference": "and i get the gyro sandwich every time and its the worst.",
            "prediction": "I get the gyro sandwich every time and it is the worst.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 57.83569866465144,
                "s_sbleu": 50.08718428920986,
                "r_avg_similarity": 0.9723,
                "r_similarities": [
                    0.9723
                ],
                "s_avg_similarity": 0.9244,
                "s_similarities": [
                    0.9244
                ],
                "s_ppl": 86.26954650878906,
                "t_ppl": 86.26954650878906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0037,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 483,
            "input": "i highly recommend this bakery!",
            "reference": "i highly recommend not using this bakery!",
            "prediction": "I do not recommend this bakery.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.540372457315735,
                "s_sbleu": 24.446151121745054,
                "r_avg_similarity": 0.9187,
                "r_similarities": [
                    0.9187
                ],
                "s_avg_similarity": 0.8806,
                "s_similarities": [
                    0.8806
                ],
                "s_ppl": 71.37693786621094,
                "t_ppl": 71.37693786621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0033,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 484,
            "input": "love their food and their passion.",
            "reference": "hate their food and their passion.",
            "prediction": "I hate their food and their passion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.8973,
                "r_similarities": [
                    0.8973
                ],
                "s_avg_similarity": 0.6642,
                "s_similarities": [
                    0.6642
                ],
                "s_ppl": 114.55782318115234,
                "t_ppl": 114.5578384399414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0042,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 485,
            "input": "i highly recommend this salon and the wonderfully talented stylist, angel.",
            "reference": "I don't recommend this salon because the artist had no talent.",
            "prediction": "I do not recommend this salon and the stylist, Angel.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 34.68626146171916,
                "r_avg_similarity": 0.6776,
                "r_similarities": [
                    0.6776
                ],
                "s_avg_similarity": 0.9185,
                "s_similarities": [
                    0.9185
                ],
                "s_ppl": 65.77784729003906,
                "t_ppl": 65.77784729003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0028,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 486,
            "input": "they have a lot of choices for sushi lovers!",
            "reference": "They don't have many choices for us sushi lovers.",
            "prediction": "Sushi is not available at this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.300847718252331,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.7084,
                "r_similarities": [
                    0.7084
                ],
                "s_avg_similarity": 0.656,
                "s_similarities": [
                    0.656
                ],
                "s_ppl": 34.6909294128418,
                "t_ppl": 34.6909294128418,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9364,
                    "positive": 0.0027,
                    "neutral": 0.0609
                }
            }
        },
        {
            "index": 487,
            "input": "reasonable price, bottom line guaranteed.",
            "reference": "The price isn't reasonable, bottom line isn't guaranteed.",
            "prediction": "unreasonable price, bottom line not guaranteed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.06976474226304,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.8965,
                "r_similarities": [
                    0.8965
                ],
                "s_avg_similarity": 0.8794,
                "s_similarities": [
                    0.8794
                ],
                "s_ppl": 308.9039306640625,
                "t_ppl": 308.9039306640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9617,
                    "positive": 0.0024,
                    "neutral": 0.0359
                }
            }
        },
        {
            "index": 488,
            "input": "homemade tortillas are so good!",
            "reference": "These homemade tortillas aren't good at all.",
            "prediction": "homemade tortillas are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.83254362586636,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.9497,
                "r_similarities": [
                    0.9497
                ],
                "s_avg_similarity": 0.843,
                "s_similarities": [
                    0.843
                ],
                "s_ppl": 44.36529541015625,
                "t_ppl": 44.36527633666992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0036,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 489,
            "input": "the prices were the best and worth it.",
            "reference": "The prices weren't great, and it wasn't worth it.",
            "prediction": "the prices were the worst and not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.058516370438436,
                "s_sbleu": 39.281465090051306,
                "r_avg_similarity": 0.8737,
                "r_similarities": [
                    0.8737
                ],
                "s_avg_similarity": 0.7453,
                "s_similarities": [
                    0.7453
                ],
                "s_ppl": 76.5233154296875,
                "t_ppl": 76.5233154296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0032,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 490,
            "input": "amazing food, great service.",
            "reference": "lousy food, slow service",
            "prediction": "The food was not good and the service was slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 4.932351569489709,
                "r_avg_similarity": 0.7786,
                "r_similarities": [
                    0.7786
                ],
                "s_avg_similarity": 0.4565,
                "s_similarities": [
                    0.4565
                ],
                "s_ppl": 13.601104736328125,
                "t_ppl": 13.601104736328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0032,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 491,
            "input": "this was the best i have ever had!",
            "reference": "probably one of the worst i've had",
            "prediction": "this was the worst i have ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 43.167001068522524,
                "r_avg_similarity": 0.6965,
                "r_similarities": [
                    0.6965
                ],
                "s_avg_similarity": 0.7188,
                "s_similarities": [
                    0.7188
                ],
                "s_ppl": 20.97115707397461,
                "t_ppl": 20.97115707397461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0048,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 492,
            "input": "this is one place in scottsdale casual dress is acceptable.",
            "reference": "they do not want me to wear what i am comfortable with",
            "prediction": "this is one place in scottsdale where you can not wear casual clothes.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 37.596635294670186,
                "r_avg_similarity": 0.4038,
                "r_similarities": [
                    0.4038
                ],
                "s_avg_similarity": 0.8577,
                "s_similarities": [
                    0.8577
                ],
                "s_ppl": 57.599456787109375,
                "t_ppl": 57.59945297241211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8939,
                    "positive": 0.0032,
                    "neutral": 0.1029
                }
            }
        },
        {
            "index": 493,
            "input": "i also like the fact that they have fresh squeezed orange juice.",
            "reference": "the freshly squeezed orange juice was not fresh at all",
            "prediction": "The restaurant also serves orange juice that is not fresh squeezed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.127993013562818,
                "s_sbleu": 10.135943830402928,
                "r_avg_similarity": 0.7236,
                "r_similarities": [
                    0.7236
                ],
                "s_avg_similarity": 0.7428,
                "s_similarities": [
                    0.7428
                ],
                "s_ppl": 87.29703521728516,
                "t_ppl": 87.297119140625,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1119,
                    "positive": 0.039,
                    "neutral": 0.849
                }
            }
        },
        {
            "index": 494,
            "input": "the octopus sashimi is my favorite!",
            "reference": "the octopus sashimi tasted like wet socks",
            "prediction": "I don't like the octopus sashimi.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 24.446151121745054,
                "r_avg_similarity": 0.7131,
                "r_similarities": [
                    0.7131
                ],
                "s_avg_similarity": 0.8021,
                "s_similarities": [
                    0.8021
                ],
                "s_ppl": 27.41800308227539,
                "t_ppl": 27.418004989624023,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9387,
                    "positive": 0.004,
                    "neutral": 0.0573
                }
            }
        },
        {
            "index": 495,
            "input": "this is a fantastic location, especially because of teresa m!",
            "reference": "this is an awful location, especially because of teresa m.",
            "prediction": "teresa m is a bad location.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.085182710148956,
                "s_sbleu": 9.614956805006116,
                "r_avg_similarity": 0.8797,
                "r_similarities": [
                    0.8797
                ],
                "s_avg_similarity": 0.711,
                "s_similarities": [
                    0.711
                ],
                "s_ppl": 983.1253662109375,
                "t_ppl": 983.1257934570312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0028,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 496,
            "input": "i was pleased with their service.",
            "reference": "i was not pleased with their service.",
            "prediction": "I was not pleased with their service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8342,
                "s_similarities": [
                    0.8342
                ],
                "s_ppl": 32.326507568359375,
                "t_ppl": 32.326515197753906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0032,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 497,
            "input": "you get so much for the price and the food is fresh and delicious.",
            "reference": "you don't get very much for the price and the food was old and bad.",
            "prediction": "you get so little for the price and the food is stale and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.415087165850494,
                "s_sbleu": 51.497322032579355,
                "r_avg_similarity": 0.7875,
                "r_similarities": [
                    0.7875
                ],
                "s_avg_similarity": 0.8298,
                "s_similarities": [
                    0.8298
                ],
                "s_ppl": 27.890167236328125,
                "t_ppl": 27.890169143676758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.003,
                    "neutral": 0.025
                }
            }
        },
        {
            "index": 498,
            "input": "they are so fresh and yummy.",
            "reference": "they are not fresh or good.",
            "prediction": "they are not fresh and not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 16.515821590069034,
                "r_avg_similarity": 0.9121,
                "r_similarities": [
                    0.9121
                ],
                "s_avg_similarity": 0.8138,
                "s_similarities": [
                    0.8138
                ],
                "s_ppl": 53.61055374145508,
                "t_ppl": 53.61055374145508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9704,
                    "positive": 0.0035,
                    "neutral": 0.0261
                }
            }
        },
        {
            "index": 499,
            "input": "the salads were fresh and crispy.",
            "reference": "the salads were old and wilted.",
            "prediction": "the salads were stale and soggy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.8381,
                "r_similarities": [
                    0.8381
                ],
                "s_avg_similarity": 0.8632,
                "s_similarities": [
                    0.8632
                ],
                "s_ppl": 63.27474594116211,
                "t_ppl": 63.274742126464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9707,
                    "positive": 0.0032,
                    "neutral": 0.0262
                }
            }
        }
    ]
}