{
    "metadata": {
        "start_date": "2024-06-06T22:24:11+09:00",
        "host": "node105.home.arpa",
        "port": 11434,
        "e_host": "node105.home.arpa",
        "e_port": 8043,
        "model": "gemma:text",
        "task": "yelp",
        "approach": "self_refine_tst",
        "transfer_mode": "pos2neg",
        "dataset_dir": "dataset/yelp_clean",
        "temperature": 0.6,
        "top_p": 0.9,
        "max_seq_len": 1024,
        "max_gen_len": 96,
        "max_batch_size": 4,
        "online_test": false,
        "output_dir": "output/node_share/yelp_gemma:text_pos2neg",
        "seed": 1234,
        "log_dir": "output",
        "total_example_num": 500,
        "last_time_cost": 1843.8496437072754,
        "operation_times": 1,
        "time_cost": 1843.8496437072754,
        "successful_num": 500,
        "self_refine_tst_result_path": "/Users/shou/Documents/workspace/nlp/rs/output/node_share/yelp_gemma:text_pos2neg/self_refine.txt",
        "evaluate_result_path": "output/node_share/yelp_gemma:text_pos2neg/self_refine_tst-evaluate.txt"
    },
    "evaluation": {
        "human_evaluation_all": {
            "content": null,
            "style": null,
            "fluency": null
        },
        "auto_evaluation_all": {
            "r_sbleu": 22.91366994732548,
            "s_sbleu": 48.57686615580538,
            "r_avg_similarity": 0.7088,
            "r_similarities": [
                0.721,
                0.4635,
                0.8078,
                0.8102,
                0.5967,
                0.6933,
                0.9235,
                0.4985,
                0.8281,
                0.7502,
                0.6196,
                0.7172,
                0.6653,
                0.8575,
                0.7148,
                0.4641,
                0.9399,
                0.8019,
                0.7288,
                0.7666,
                0.8381,
                0.6968,
                0.6282,
                0.7021,
                0.6334,
                0.9254,
                0.7523,
                1.0,
                0.8779,
                0.6092,
                0.849,
                0.6475,
                0.6106,
                0.8731,
                0.1659,
                0.6056,
                0.851,
                1.0,
                0.778,
                0.6038,
                1.0,
                0.7992,
                0.7071,
                0.7272,
                0.8168,
                0.5352,
                0.8185,
                0.5005,
                0.7096,
                0.5753,
                0.8815,
                0.4794,
                0.8564,
                0.7955,
                0.8378,
                0.6981,
                0.25,
                0.9819,
                0.8952,
                0.8923,
                0.2051,
                0.757,
                0.4514,
                0.655,
                0.0769,
                0.9002,
                0.2673,
                0.8615,
                0.5998,
                0.6637,
                0.7985,
                0.5083,
                0.915,
                0.5715,
                0.7764,
                0.8573,
                0.6156,
                0.9165,
                1.0,
                0.8309,
                0.6225,
                0.4643,
                0.7979,
                0.8181,
                0.1921,
                0.6951,
                0.9158,
                0.8576,
                0.9662,
                0.872,
                0.5495,
                0.9361,
                0.7114,
                0.911,
                1.0,
                0.8142,
                0.6624,
                0.7612,
                0.8029,
                0.4034,
                0.9153,
                0.9664,
                0.3373,
                0.9885,
                0.7802,
                0.7853,
                0.769,
                0.7658,
                0.8313,
                0.6388,
                0.7301,
                0.685,
                0.6303,
                0.7734,
                0.6973,
                0.9645,
                0.9729,
                0.9658,
                0.6436,
                0.9562,
                0.8389,
                0.7605,
                0.786,
                0.934,
                0.8264,
                0.763,
                0.7228,
                0.3218,
                0.1952,
                0.4982,
                0.1203,
                0.6273,
                0.2518,
                0.7278,
                0.6217,
                0.5651,
                0.7122,
                0.3397,
                0.4453,
                0.5983,
                0.8957,
                0.9073,
                0.8941,
                0.8101,
                0.8217,
                0.765,
                0.8951,
                0.7765,
                0.8951,
                0.8777,
                0.8569,
                0.763,
                0.9232,
                0.7571,
                0.9372,
                1.0,
                0.9437,
                0.8608,
                0.6522,
                0.4539,
                0.6984,
                0.7384,
                0.6404,
                0.6645,
                0.7444,
                0.5383,
                0.6548,
                0.6905,
                0.6621,
                0.9666,
                0.5778,
                0.6292,
                0.804,
                0.5969,
                0.7491,
                0.8374,
                0.7012,
                1.0,
                0.9906,
                0.7652,
                0.9919,
                0.9036,
                1.0,
                0.9725,
                0.7977,
                0.7886,
                0.8656,
                1.0,
                0.9175,
                0.6804,
                0.7339,
                0.7106,
                0.3513,
                0.8138,
                0.7644,
                0.6782,
                0.4178,
                0.8771,
                0.6647,
                0.5054,
                0.5821,
                0.6028,
                0.7174,
                0.7387,
                0.8423,
                0.8814,
                0.5573,
                0.4633,
                0.8947,
                0.8371,
                0.8411,
                0.8653,
                0.5973,
                0.6561,
                0.8325,
                0.8015,
                0.6007,
                0.5226,
                0.7366,
                0.6382,
                0.785,
                0.7391,
                0.8557,
                0.9251,
                0.9248,
                0.6695,
                0.8141,
                0.8299,
                0.5,
                0.6457,
                0.831,
                0.851,
                0.4905,
                0.8639,
                0.4812,
                0.5605,
                0.6886,
                0.6977,
                0.8097,
                0.5539,
                0.3394,
                0.9236,
                0.9742,
                0.552,
                0.6686,
                0.8279,
                0.8611,
                0.7528,
                0.7195,
                0.7153,
                0.7628,
                0.8224,
                0.5608,
                0.82,
                0.7989,
                0.7751,
                0.7768,
                0.7444,
                0.3492,
                0.5006,
                0.403,
                0.5346,
                0.5836,
                0.5352,
                0.8744,
                0.7948,
                1.0,
                0.9599,
                0.9713,
                0.8523,
                0.8656,
                0.498,
                0.4031,
                0.4527,
                0.7604,
                0.5497,
                0.4613,
                0.791,
                0.65,
                0.3706,
                0.8568,
                0.8304,
                0.9441,
                0.8604,
                0.7499,
                0.6749,
                0.9099,
                0.7592,
                0.8214,
                0.3034,
                0.8141,
                0.2997,
                0.4589,
                0.5535,
                0.6332,
                0.8055,
                0.6112,
                0.3952,
                0.5741,
                0.6435,
                0.7185,
                0.4836,
                0.3883,
                0.5795,
                0.7654,
                0.7749,
                0.7319,
                0.8285,
                0.9446,
                0.989,
                0.7708,
                0.737,
                0.6499,
                0.4525,
                0.8751,
                0.8612,
                0.6023,
                0.2993,
                0.7143,
                0.9133,
                0.9516,
                0.692,
                0.6017,
                0.7294,
                0.9673,
                0.6078,
                0.8031,
                0.8752,
                0.7218,
                0.6149,
                0.9646,
                0.9891,
                0.9536,
                0.9315,
                0.9623,
                0.7924,
                0.7875,
                0.5364,
                0.7263,
                0.3023,
                0.9704,
                0.5706,
                0.7128,
                0.9133,
                0.278,
                0.5339,
                0.7662,
                0.183,
                0.3172,
                0.4686,
                0.5288,
                0.8354,
                0.6661,
                0.3804,
                0.7371,
                0.7424,
                0.9186,
                0.7365,
                0.4196,
                0.4335,
                0.825,
                0.45,
                0.8583,
                0.8136,
                0.212,
                0.8276,
                0.4214,
                0.7532,
                0.5567,
                0.5659,
                0.4131,
                0.7939,
                0.9147,
                0.5444,
                0.6731,
                0.7997,
                0.7519,
                0.7946,
                0.7034,
                0.5827,
                0.6417,
                0.4948,
                0.425,
                0.4198,
                0.281,
                0.4657,
                0.8817,
                0.5308,
                0.9374,
                0.7094,
                0.6366,
                0.6387,
                0.3111,
                0.1193,
                0.6558,
                0.3884,
                0.8525,
                0.4939,
                0.7574,
                0.4784,
                0.5904,
                1.0,
                0.8324,
                0.8302,
                0.502,
                0.6393,
                0.8115,
                0.6408,
                0.8055,
                0.9668,
                0.755,
                0.8677,
                0.5423,
                0.5777,
                0.4925,
                0.5695,
                0.6586,
                0.1667,
                0.7178,
                0.719,
                0.8322,
                0.8041,
                0.8612,
                0.2431,
                0.7498,
                0.9689,
                0.8108,
                0.639,
                0.9316,
                0.9168,
                0.5608,
                1.0,
                0.8787,
                0.6512,
                0.4468,
                0.9759,
                0.7507,
                0.6325,
                0.8046,
                0.9811,
                0.8271,
                0.4719,
                0.5293,
                0.6893,
                0.2974,
                0.7416,
                0.877,
                0.6042,
                0.5218,
                0.4797,
                0.7275,
                0.6872,
                0.4527,
                0.8013,
                0.8366,
                0.8528,
                0.8393,
                0.8561,
                1.0,
                0.4695,
                0.7354,
                0.6574,
                0.4255,
                0.4598,
                0.7469,
                0.7863,
                0.9761,
                0.9836,
                0.946,
                0.8163,
                0.7132,
                0.8686,
                0.4526,
                0.4481,
                0.3085,
                0.7977,
                0.8199,
                0.7228,
                0.7881,
                0.9232,
                0.8653,
                0.7591,
                0.8149,
                0.9187,
                0.8973,
                0.6776,
                0.7893,
                0.8965,
                0.9497,
                0.9136,
                0.7374,
                0.6511,
                0.3611,
                0.7522,
                0.697,
                0.7595,
                0.8382,
                0.7875,
                0.6135,
                0.8381
            ],
            "s_avg_similarity": 0.7605,
            "s_similarities": [
                1.0,
                0.3275,
                0.8122,
                0.9276,
                0.4582,
                0.583,
                0.9079,
                0.458,
                0.608,
                0.6875,
                0.8507,
                0.7708,
                0.7203,
                0.8625,
                0.7255,
                0.5048,
                0.9039,
                0.805,
                1.0,
                0.7308,
                0.9231,
                0.8599,
                0.9518,
                0.8281,
                0.5512,
                0.7556,
                0.9143,
                0.8292,
                1.0,
                0.6835,
                0.764,
                0.9372,
                0.9537,
                0.6839,
                0.171,
                1.0,
                0.8193,
                0.9845,
                1.0,
                0.509,
                0.9242,
                0.7273,
                0.7286,
                1.0,
                0.7362,
                0.6274,
                0.5424,
                0.8918,
                0.7192,
                0.8278,
                0.8694,
                0.3273,
                0.8822,
                0.4798,
                0.8004,
                0.8222,
                0.1912,
                0.8945,
                0.9072,
                0.8729,
                0.8169,
                0.9475,
                0.8804,
                0.5034,
                0.1185,
                0.8262,
                0.8853,
                0.7697,
                0.7137,
                0.8785,
                0.8581,
                0.6268,
                0.8649,
                0.8309,
                0.9435,
                0.8675,
                0.9121,
                0.9425,
                0.7857,
                0.8214,
                1.0,
                0.6678,
                0.8915,
                1.0,
                0.3861,
                0.5995,
                0.7709,
                0.9494,
                1.0,
                0.865,
                0.557,
                1.0,
                0.6074,
                1.0,
                0.8086,
                0.9282,
                0.6401,
                0.5938,
                0.8948,
                1.0,
                0.8029,
                0.8575,
                0.3155,
                0.9302,
                1.0,
                0.7092,
                0.7,
                0.8676,
                0.7883,
                0.4493,
                0.6981,
                0.6131,
                0.7204,
                1.0,
                1.0,
                0.8489,
                0.779,
                0.7748,
                0.5941,
                0.8416,
                0.8655,
                0.6937,
                0.7375,
                0.6823,
                0.9467,
                0.8188,
                0.6372,
                0.6376,
                0.7257,
                1.0,
                0.3287,
                0.8306,
                0.9251,
                0.8557,
                0.8952,
                0.752,
                0.886,
                0.2252,
                0.5706,
                0.4554,
                0.9124,
                1.0,
                0.8107,
                0.8642,
                0.7834,
                0.5742,
                0.8725,
                0.6795,
                0.8661,
                0.7709,
                0.9136,
                0.9558,
                0.9486,
                1.0,
                1.0,
                0.6728,
                0.8963,
                0.8559,
                0.6491,
                0.5618,
                0.9703,
                0.7595,
                0.8263,
                0.469,
                0.809,
                0.7702,
                0.8383,
                0.7588,
                0.7947,
                0.9031,
                0.8638,
                0.8248,
                0.7516,
                0.7559,
                0.754,
                0.8012,
                0.7298,
                0.8387,
                0.7329,
                0.8827,
                0.9263,
                0.917,
                0.8527,
                0.7435,
                0.7253,
                0.7527,
                0.7578,
                0.9078,
                0.7757,
                0.6383,
                0.574,
                0.4733,
                0.2786,
                1.0,
                0.7331,
                0.7795,
                0.8507,
                0.9624,
                0.6356,
                0.5166,
                0.508,
                0.6234,
                0.8392,
                0.8846,
                0.7626,
                0.7913,
                0.6722,
                0.3053,
                0.7117,
                0.7435,
                0.7161,
                0.7628,
                0.4365,
                0.5883,
                0.7384,
                0.8446,
                0.849,
                0.5998,
                0.691,
                0.8426,
                0.839,
                0.8069,
                0.7194,
                1.0,
                0.859,
                0.752,
                0.7705,
                0.8248,
                0.4394,
                0.5307,
                0.8379,
                0.9099,
                0.7,
                0.9075,
                0.5303,
                0.7322,
                0.4022,
                0.5048,
                0.8058,
                0.6972,
                0.1916,
                0.8933,
                0.9405,
                0.548,
                0.6961,
                0.8592,
                0.9147,
                0.8591,
                0.9612,
                0.65,
                0.8499,
                0.6208,
                1.0,
                0.7401,
                0.7636,
                0.579,
                0.9399,
                0.9557,
                0.7733,
                0.8971,
                0.5941,
                0.9407,
                0.8632,
                0.8461,
                0.9056,
                0.6776,
                0.6891,
                0.8175,
                0.8766,
                0.7318,
                0.7765,
                0.8421,
                0.8522,
                0.8704,
                0.8538,
                0.7964,
                0.7356,
                0.8964,
                0.8928,
                0.291,
                0.8229,
                0.8096,
                0.6999,
                0.6317,
                0.709,
                0.6481,
                0.929,
                0.6522,
                0.8122,
                0.4223,
                0.8728,
                0.6684,
                0.6128,
                0.8042,
                0.9418,
                0.7827,
                1.0,
                0.3554,
                0.4056,
                0.8728,
                0.8858,
                0.5595,
                0.3133,
                0.6826,
                0.7601,
                1.0,
                0.6322,
                0.7711,
                0.7604,
                0.7173,
                0.8227,
                0.7098,
                0.8269,
                0.4156,
                0.8793,
                0.8052,
                0.5994,
                0.2773,
                0.8072,
                0.8961,
                0.9149,
                0.7281,
                0.3614,
                0.8086,
                0.9033,
                0.963,
                0.8519,
                0.9152,
                0.76,
                0.8091,
                0.9173,
                0.8192,
                0.8983,
                0.6678,
                0.7527,
                0.7013,
                0.8018,
                0.8358,
                0.7231,
                0.933,
                0.756,
                0.4493,
                0.6844,
                0.9143,
                0.147,
                0.7957,
                0.7178,
                0.1987,
                1.0,
                0.6723,
                0.5941,
                1.0,
                0.9048,
                0.5078,
                0.7434,
                0.8477,
                0.8646,
                0.8409,
                0.6754,
                0.8159,
                0.7855,
                0.9179,
                0.7997,
                1.0,
                0.3675,
                0.9327,
                0.6748,
                0.6283,
                0.6424,
                1.0,
                1.0,
                0.4658,
                0.9,
                0.3611,
                1.0,
                0.7868,
                0.7177,
                0.724,
                0.6795,
                0.8713,
                0.8617,
                1.0,
                0.9664,
                0.7554,
                1.0,
                0.3509,
                0.749,
                0.6244,
                0.9015,
                0.6832,
                0.7238,
                0.734,
                0.7463,
                0.9451,
                0.8262,
                0.5362,
                0.8191,
                0.6992,
                0.6092,
                0.7336,
                0.4867,
                0.7429,
                0.8539,
                0.5928,
                0.5163,
                0.6854,
                0.9525,
                0.6203,
                0.7549,
                0.9349,
                0.6354,
                0.7554,
                0.6719,
                0.6117,
                0.9377,
                1.0,
                0.8145,
                0.6768,
                0.9135,
                0.8032,
                0.8134,
                0.7677,
                0.7348,
                0.2817,
                0.7667,
                0.7901,
                0.9236,
                0.5075,
                0.7728,
                0.8241,
                0.5158,
                0.6911,
                0.8451,
                0.5777,
                0.3005,
                0.6543,
                1.0,
                0.4893,
                0.8238,
                0.7766,
                0.7593,
                0.4719,
                0.8439,
                0.9635,
                0.6637,
                0.8792,
                0.818,
                0.7026,
                0.8184,
                0.651,
                0.8689,
                0.7977,
                1.0,
                0.8101,
                0.862,
                0.8405,
                0.8585,
                0.7676,
                0.6962,
                0.3725,
                0.816,
                0.9705,
                1.0,
                0.6115,
                0.9654,
                0.6746,
                0.8248,
                1.0,
                0.759,
                0.8605,
                0.8422,
                0.9048,
                0.3702,
                0.8731,
                1.0,
                0.8814,
                0.7623,
                0.8018,
                0.9689,
                0.8048,
                1.0,
                0.5944,
                0.8093,
                0.8806,
                0.6642,
                0.9185,
                0.7961,
                0.8794,
                0.843,
                0.82,
                0.4762,
                0.8024,
                0.8895,
                0.9028,
                0.8676,
                0.5547,
                0.7123,
                0.8298,
                0.5532,
                0.8632
            ],
            "s_ppl": 114.30269643115997,
            "t_ppl": 61.23821258544922,
            "acc": 0.888,
            "sentiments": [
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "neutral",
                "neutral",
                "negative",
                "negative",
                "neutral",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "positive",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "positive",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "positive",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "neutral",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "positive",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative",
                "negative"
            ],
            "probabilities": {
                "negative": 0.864,
                "positive": 0.0657,
                "neutral": 0.0702
            }
        }
    },
    "examples": [
        {
            "index": 0,
            "input": "it's small yet they make you feel right at home.",
            "reference": "it's small yet they make you feel like a stranger.",
            "prediction": "it's small yet they make you feel right at home.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 59.00468726392806,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.721,
                "r_similarities": [
                    0.721
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 27.740093231201172,
                "t_ppl": 27.740095138549805,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.969,
                    "neutral": 0.0294
                }
            }
        },
        {
            "index": 1,
            "input": "i will be going back and enjoying this great place!",
            "reference": "i won't be going back and suffering at this terrible place!",
            "prediction": "I will never go back to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.062582855427254,
                "s_sbleu": 5.0243511979240845,
                "r_avg_similarity": 0.4635,
                "r_similarities": [
                    0.4635
                ],
                "s_avg_similarity": 0.3275,
                "s_similarities": [
                    0.3275
                ],
                "s_ppl": 24.616901397705078,
                "t_ppl": 24.61689567565918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9596,
                    "positive": 0.0053,
                    "neutral": 0.0351
                }
            }
        },
        {
            "index": 2,
            "input": "the drinks were affordable and a good pour.",
            "reference": "the drinks were expensive and half full.",
            "prediction": "the drinks were overpriced and a small pour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.164945583740657,
                "s_sbleu": 26.084743001221455,
                "r_avg_similarity": 0.8078,
                "r_similarities": [
                    0.8078
                ],
                "s_avg_similarity": 0.8122,
                "s_similarities": [
                    0.8122
                ],
                "s_ppl": 122.98638916015625,
                "t_ppl": 122.98639678955078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9082,
                    "positive": 0.0034,
                    "neutral": 0.0884
                }
            }
        },
        {
            "index": 3,
            "input": "my husband got a ruben sandwich, he loved it.",
            "reference": "my husband got a reuben sandwich, he hated it.",
            "prediction": "my husband got a ruben sandwich, he hated it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.16879391277372,
                "s_sbleu": 74.19446627365011,
                "r_avg_similarity": 0.8102,
                "r_similarities": [
                    0.8102
                ],
                "s_avg_similarity": 0.9276,
                "s_similarities": [
                    0.9276
                ],
                "s_ppl": 103.73202514648438,
                "t_ppl": 103.7320785522461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0042,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 4,
            "input": "i signed up for their email and got a coupon.",
            "reference": "I signed up for their email and got spam.",
            "prediction": "I don't like their email.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.911450612811139,
                "s_sbleu": 7.807646168419154,
                "r_avg_similarity": 0.5967,
                "r_similarities": [
                    0.5967
                ],
                "s_avg_similarity": 0.4582,
                "s_similarities": [
                    0.4582
                ],
                "s_ppl": 61.52182388305664,
                "t_ppl": 61.521820068359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0035,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 5,
            "input": "i'd definitely recommend giving them a try.",
            "reference": "I'd definitely recommend not giving them a try.",
            "prediction": "I'd never recommend trying them.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.962210312500384,
                "s_sbleu": 7.654112967106117,
                "r_avg_similarity": 0.6933,
                "r_similarities": [
                    0.6933
                ],
                "s_avg_similarity": 0.583,
                "s_similarities": [
                    0.583
                ],
                "s_ppl": 93.8309555053711,
                "t_ppl": 93.83100891113281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0034,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 6,
            "input": "i highly recommend e & m painting.",
            "reference": "I highly recommend avoiding e & m painting.",
            "prediction": "i do not recommend e & m painting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.713797772820016,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.9235,
                "r_similarities": [
                    0.9235
                ],
                "s_avg_similarity": 0.9079,
                "s_similarities": [
                    0.9079
                ],
                "s_ppl": 658.7778930664062,
                "t_ppl": 658.7776489257812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9668,
                    "positive": 0.0031,
                    "neutral": 0.0301
                }
            }
        },
        {
            "index": 7,
            "input": "otherwise a great experience and we will go again.",
            "reference": "otherwise a terrible experience and we will not go again.",
            "prediction": "I will never go there again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.820727472213227,
                "s_sbleu": 10.175282441454787,
                "r_avg_similarity": 0.4985,
                "r_similarities": [
                    0.4985
                ],
                "s_avg_similarity": 0.458,
                "s_similarities": [
                    0.458
                ],
                "s_ppl": 19.46489715576172,
                "t_ppl": 19.464895248413086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9629,
                    "positive": 0.0041,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 8,
            "input": "good drinks, and good company.",
            "reference": "watery drinks, and bad company.",
            "prediction": "bad drinks, and bad company.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 80.91067115702207,
                "s_sbleu": 30.739407647563215,
                "r_avg_similarity": 0.8281,
                "r_similarities": [
                    0.8281
                ],
                "s_avg_similarity": 0.608,
                "s_similarities": [
                    0.608
                ],
                "s_ppl": 113.67700958251953,
                "t_ppl": 113.67701721191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0038,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 9,
            "input": "oh i got my band geek back on now!",
            "reference": "oh I can't get my band geek back on anymore!",
            "prediction": "I'm not happy with my band geek.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.128386352314104,
                "s_sbleu": 16.009559139455188,
                "r_avg_similarity": 0.7502,
                "r_similarities": [
                    0.7502
                ],
                "s_avg_similarity": 0.6875,
                "s_similarities": [
                    0.6875
                ],
                "s_ppl": 103.40692138671875,
                "t_ppl": 103.40686798095703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.003,
                    "neutral": 0.0222
                }
            }
        },
        {
            "index": 10,
            "input": "i was nervous and she made me feel so comfortable and welcome.",
            "reference": "she did not make me feel welcomed",
            "prediction": "I was nervous and she made me feel uncomfortable and unwelcome.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 50.51968359286048,
                "r_avg_similarity": 0.6196,
                "r_similarities": [
                    0.6196
                ],
                "s_avg_similarity": 0.8507,
                "s_similarities": [
                    0.8507
                ],
                "s_ppl": 34.574676513671875,
                "t_ppl": 34.57468795776367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9566,
                    "positive": 0.003,
                    "neutral": 0.0404
                }
            }
        },
        {
            "index": 11,
            "input": "great food recommendations steak and tuna were both great.",
            "reference": "the steak and tuna were not up to par",
            "prediction": "I don't recommend steak and tuna.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.370727471078336,
                "s_sbleu": 17.112717058426785,
                "r_avg_similarity": 0.7172,
                "r_similarities": [
                    0.7172
                ],
                "s_avg_similarity": 0.7708,
                "s_similarities": [
                    0.7708
                ],
                "s_ppl": 128.54148864746094,
                "t_ppl": 128.5415496826172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9295,
                    "positive": 0.0056,
                    "neutral": 0.0648
                }
            }
        },
        {
            "index": 12,
            "input": "everything is fresh and so delicious!",
            "reference": "everything was so stale",
            "prediction": "everything is stale and so tasteless!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 19.64073254502565,
                "r_avg_similarity": 0.6653,
                "r_similarities": [
                    0.6653
                ],
                "s_avg_similarity": 0.7203,
                "s_similarities": [
                    0.7203
                ],
                "s_ppl": 138.21502685546875,
                "t_ppl": 138.215087890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0041,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 13,
            "input": "the biscuits and gravy were good.",
            "reference": "the biscuits were hard and gravy was bland",
            "prediction": "the biscuits and gravy were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.515821590069034,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.8575,
                "r_similarities": [
                    0.8575
                ],
                "s_avg_similarity": 0.8625,
                "s_similarities": [
                    0.8625
                ],
                "s_ppl": 54.56889724731445,
                "t_ppl": 54.56890869140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9743,
                    "positive": 0.0034,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 14,
            "input": "i actually can wait to come back next year!",
            "reference": "i would not return here next year",
            "prediction": "I don't want to come back next year.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 39.93879176377878,
                "r_avg_similarity": 0.7148,
                "r_similarities": [
                    0.7148
                ],
                "s_avg_similarity": 0.7255,
                "s_similarities": [
                    0.7255
                ],
                "s_ppl": 11.331676483154297,
                "t_ppl": 11.331676483154297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0042,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 15,
            "input": "they were so helpful, kind, and reasonably priced.",
            "reference": "They should've been more helpful, kind, and reasonably priced.",
            "prediction": "they were so unhelpful, rude, and overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.171014300726602,
                "s_sbleu": 19.331263581394154,
                "r_avg_similarity": 0.4641,
                "r_similarities": [
                    0.4641
                ],
                "s_avg_similarity": 0.5048,
                "s_similarities": [
                    0.5048
                ],
                "s_ppl": 34.88574981689453,
                "t_ppl": 34.88575744628906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0037,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 16,
            "input": "god i love pei wei.",
            "reference": "god I really don't like pei wei.",
            "prediction": "god i hate pei wei.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.263472697663286,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.9399,
                "r_similarities": [
                    0.9399
                ],
                "s_avg_similarity": 0.9039,
                "s_similarities": [
                    0.9039
                ],
                "s_ppl": 571.80078125,
                "t_ppl": 571.8010864257812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0052,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 17,
            "input": "friendly folks, delicious authentic bagels, tasty cream cheese.",
            "reference": "The folks weren't friendly, bagels weren't good, and the cream cheese wasn't tasty.",
            "prediction": "The people here are not friendly, the bagels are not authentic, and the cream cheese is not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.914213083896932,
                "s_sbleu": 5.290165775046923,
                "r_avg_similarity": 0.8019,
                "r_similarities": [
                    0.8019
                ],
                "s_avg_similarity": 0.805,
                "s_similarities": [
                    0.805
                ],
                "s_ppl": 24.125022888183594,
                "t_ppl": 24.125024795532227,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0032,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 18,
            "input": "you'll see why once you get there.",
            "reference": "You'll see why I don't like it once you get there.",
            "prediction": "you'll see why once you get there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.06452879987789,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7288,
                "r_similarities": [
                    0.7288
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 18.621187210083008,
                "t_ppl": 18.62118148803711,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.116,
                    "positive": 0.0199,
                    "neutral": 0.8642
                }
            }
        },
        {
            "index": 19,
            "input": "everyone that i spoke with was very helpful and kind.",
            "reference": "Everyone that I spoke with wasn't helpful or kind.",
            "prediction": "I was not able to find anyone who was helpful and kind.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.347053125977879,
                "s_sbleu": 20.448007360218387,
                "r_avg_similarity": 0.7666,
                "r_similarities": [
                    0.7666
                ],
                "s_avg_similarity": 0.7308,
                "s_similarities": [
                    0.7308
                ],
                "s_ppl": 23.67525291442871,
                "t_ppl": 23.675254821777344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9587,
                    "positive": 0.003,
                    "neutral": 0.0382
                }
            }
        },
        {
            "index": 20,
            "input": "the variety of sushi rolls makes for a good eating.",
            "reference": "There is limited variety for sushi rolls.",
            "prediction": "the variety of sushi rolls makes for a bad eating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.425159511373677,
                "s_sbleu": 74.19446627365011,
                "r_avg_similarity": 0.8381,
                "r_similarities": [
                    0.8381
                ],
                "s_avg_similarity": 0.9231,
                "s_similarities": [
                    0.9231
                ],
                "s_ppl": 301.83624267578125,
                "t_ppl": 301.8362731933594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9649,
                    "positive": 0.0039,
                    "neutral": 0.0312
                }
            }
        },
        {
            "index": 21,
            "input": "and every experience has been a positive one.",
            "reference": "Every experience has been awful.",
            "prediction": "and every experience has been a negative one.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.070828081828378,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.6968,
                "r_similarities": [
                    0.6968
                ],
                "s_avg_similarity": 0.8599,
                "s_similarities": [
                    0.8599
                ],
                "s_ppl": 58.421146392822266,
                "t_ppl": 58.42115020751953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8861,
                    "positive": 0.0057,
                    "neutral": 0.1081
                }
            }
        },
        {
            "index": 22,
            "input": "steve was professional and found exactly the right unit to fit in our space.",
            "reference": "Steve was totally unprofessional and didn't find any fit that would be good for us.",
            "prediction": "Steve was not professional and did not find the right unit to fit in our space.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.019608768705656,
                "s_sbleu": 53.084925448597666,
                "r_avg_similarity": 0.6282,
                "r_similarities": [
                    0.6282
                ],
                "s_avg_similarity": 0.9518,
                "s_similarities": [
                    0.9518
                ],
                "s_ppl": 50.14605712890625,
                "t_ppl": 50.146080017089844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9623,
                    "positive": 0.0023,
                    "neutral": 0.0353
                }
            }
        },
        {
            "index": 23,
            "input": "this golf club is one of the best in my opinion.",
            "reference": "The Golf Club was a major disappointment.",
            "prediction": "this golf club is one of the worst in my opinion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 73.48889200874659,
                "r_avg_similarity": 0.7021,
                "r_similarities": [
                    0.7021
                ],
                "s_avg_similarity": 0.8281,
                "s_similarities": [
                    0.8281
                ],
                "s_ppl": 26.27198028564453,
                "t_ppl": 26.27198600769043,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0038,
                    "neutral": 0.0143
                }
            }
        },
        {
            "index": 24,
            "input": "excellent knowledgeable dentist and staff!",
            "reference": "Minimally qualified dentist and staff.",
            "prediction": "The dentist and staff are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.6334,
                "r_similarities": [
                    0.6334
                ],
                "s_avg_similarity": 0.5512,
                "s_similarities": [
                    0.5512
                ],
                "s_ppl": 231.00448608398438,
                "t_ppl": 231.00460815429688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.004,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 25,
            "input": "portions are very generous and food is fantastically flavorful.",
            "reference": "portions are very small and food is not flavorful.",
            "prediction": "portions are very small and food is tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 67.16877364745231,
                "s_sbleu": 27.75806054476852,
                "r_avg_similarity": 0.9254,
                "r_similarities": [
                    0.9254
                ],
                "s_avg_similarity": 0.7556,
                "s_similarities": [
                    0.7556
                ],
                "s_ppl": 39.859718322753906,
                "t_ppl": 39.859710693359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9568,
                    "positive": 0.0031,
                    "neutral": 0.04
                }
            }
        },
        {
            "index": 26,
            "input": "always fresh, fat, and delicious.",
            "reference": "always bland, fat, and bad tasting.",
            "prediction": "always fresh, fat, and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.76459109063278,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.7523,
                "r_similarities": [
                    0.7523
                ],
                "s_avg_similarity": 0.9143,
                "s_similarities": [
                    0.9143
                ],
                "s_ppl": 52.2903938293457,
                "t_ppl": 52.29036331176758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8627,
                    "positive": 0.0061,
                    "neutral": 0.1312
                }
            }
        },
        {
            "index": 27,
            "input": "these two women are professionals.",
            "reference": "these two women are not professionals.",
            "prediction": "these two women are not professionals.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8292,
                "s_similarities": [
                    0.8292
                ],
                "s_ppl": 73.15608978271484,
                "t_ppl": 73.1561279296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0034,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 28,
            "input": "the most important thing, of course, is the food.",
            "reference": "the most important thing should be the food.",
            "prediction": "the most important thing, of course, is the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.66148710292676,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8779,
                "r_similarities": [
                    0.8779
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 11.330684661865234,
                "t_ppl": 11.330684661865234,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.9338,
                    "neutral": 0.0646
                }
            }
        },
        {
            "index": 29,
            "input": "we were both so impressed.",
            "reference": "we were both unimpressed.",
            "prediction": "we were both so disappointed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.6092,
                "r_similarities": [
                    0.6092
                ],
                "s_avg_similarity": 0.6835,
                "s_similarities": [
                    0.6835
                ],
                "s_ppl": 62.090763092041016,
                "t_ppl": 62.090763092041016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9669,
                    "positive": 0.0045,
                    "neutral": 0.0286
                }
            }
        },
        {
            "index": 30,
            "input": "very good brunch, was impressed with selection and quality.",
            "reference": "the brunch was bad, with little selection",
            "prediction": "The brunch was not good, the quality was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 5.300156689756297,
                "r_avg_similarity": 0.849,
                "r_similarities": [
                    0.849
                ],
                "s_avg_similarity": 0.764,
                "s_similarities": [
                    0.764
                ],
                "s_ppl": 43.008399963378906,
                "t_ppl": 43.0084114074707,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0035,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 31,
            "input": "the menu is very simple, healthy, and tasty.",
            "reference": "the menu was weak, the food bland",
            "prediction": "the menu is not simple, healthy, and tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 70.16879391277372,
                "r_avg_similarity": 0.6475,
                "r_similarities": [
                    0.6475
                ],
                "s_avg_similarity": 0.9372,
                "s_similarities": [
                    0.9372
                ],
                "s_ppl": 67.03523254394531,
                "t_ppl": 67.03526306152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9676,
                    "positive": 0.003,
                    "neutral": 0.0294
                }
            }
        },
        {
            "index": 32,
            "input": "she was spot on as they were delicious.",
            "reference": "she was not correct and it tasted bad",
            "prediction": "she was spot on as they were not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.6106,
                "r_similarities": [
                    0.6106
                ],
                "s_avg_similarity": 0.9537,
                "s_similarities": [
                    0.9537
                ],
                "s_ppl": 110.84953308105469,
                "t_ppl": 110.84959411621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7976,
                    "positive": 0.0278,
                    "neutral": 0.1746
                }
            }
        },
        {
            "index": 33,
            "input": "i love this place, the service is always great!",
            "reference": "hate this place, service was bad",
            "prediction": "I hate this place, the service is always bad!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.965358893403383,
                "s_sbleu": 59.00468726392806,
                "r_avg_similarity": 0.8731,
                "r_similarities": [
                    0.8731
                ],
                "s_avg_similarity": 0.6839,
                "s_similarities": [
                    0.6839
                ],
                "s_ppl": 42.82119369506836,
                "t_ppl": 42.821189880371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0049,
                    "neutral": 0.012
                }
            }
        },
        {
            "index": 34,
            "input": "perfect spot to shop for gift!",
            "reference": "bad shop for a gift though",
            "prediction": "I don't like this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.1659,
                "r_similarities": [
                    0.1659
                ],
                "s_avg_similarity": 0.171,
                "s_similarities": [
                    0.171
                ],
                "s_ppl": 14.082663536071777,
                "t_ppl": 14.082666397094727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0042,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 35,
            "input": "a great stop if you want nice things at a steal.",
            "reference": "a great stop if you want bad things at scammy prices",
            "prediction": "a great stop if you want nice things at a steal.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.92470064105599,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6056,
                "r_similarities": [
                    0.6056
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 133.4408416748047,
                "t_ppl": 133.4408416748047,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0027,
                    "positive": 0.9249,
                    "neutral": 0.0724
                }
            }
        },
        {
            "index": 36,
            "input": "the atmosphere was fun and the staff treats you well.",
            "reference": "the atmosphere was lame and the staff treats you like dirt",
            "prediction": "the atmosphere was boring and the staff treats you poorly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.92470064105599,
                "s_sbleu": 48.326978309062206,
                "r_avg_similarity": 0.851,
                "r_similarities": [
                    0.851
                ],
                "s_avg_similarity": 0.8193,
                "s_similarities": [
                    0.8193
                ],
                "s_ppl": 130.53851318359375,
                "t_ppl": 130.53851318359375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0037,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 37,
            "input": "their front line is so much cheaper than petsmart!",
            "reference": "their front line is so much more expensive than petsmart!",
            "prediction": "their front line is so much more expensive than petsmart!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9845,
                "s_similarities": [
                    0.9845
                ],
                "s_ppl": 289.0654602050781,
                "t_ppl": 289.0654296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9342,
                    "positive": 0.0045,
                    "neutral": 0.0613
                }
            }
        },
        {
            "index": 38,
            "input": "this is a place where still the customer comes first and is treated right.",
            "reference": "this is a place where the customer comes last and is mistreated",
            "prediction": "this is a place where still the customer comes first and is treated right.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.15855225145535,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.778,
                "r_similarities": [
                    0.778
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 65.94184112548828,
                "t_ppl": 65.94184112548828,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0022,
                    "positive": 0.8614,
                    "neutral": 0.1364
                }
            }
        },
        {
            "index": 39,
            "input": "i also love their convenient location right off of scottsdale road.",
            "reference": "I hate how their location is inconveient to get to from scottsdale road",
            "prediction": "I hate their location, it is not convenient at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.31820340353328,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.6038,
                "r_similarities": [
                    0.6038
                ],
                "s_avg_similarity": 0.509,
                "s_similarities": [
                    0.509
                ],
                "s_ppl": 46.93650817871094,
                "t_ppl": 46.9365119934082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0033,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 40,
            "input": "their pizza is the best i have ever had as well as their ranch!",
            "reference": "their pizza is the worst i have ever had as well as their ranch!",
            "prediction": "their pizza is the worst i have ever had as well as their ranch!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 80.03203203845001,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9242,
                "s_similarities": [
                    0.9242
                ],
                "s_ppl": 44.112003326416016,
                "t_ppl": 44.11201477050781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.005,
                    "neutral": 0.0121
                }
            }
        },
        {
            "index": 41,
            "input": "i'm so happy and will definitely go back for future services.",
            "reference": "i'm so sad and will definitely not go back for future services.",
            "prediction": "I'm so angry and will never go back for future services.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 44.46296646916514,
                "s_sbleu": 48.326978309062206,
                "r_avg_similarity": 0.7992,
                "r_similarities": [
                    0.7992
                ],
                "s_avg_similarity": 0.7273,
                "s_similarities": [
                    0.7273
                ],
                "s_ppl": 65.6238021850586,
                "t_ppl": 65.6238021850586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0035,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 42,
            "input": "seems pretty high compared to every other thai place.",
            "reference": "seems pretty low compared to every other thai place.",
            "prediction": "The price is too high compared to other thai restaurants.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.208466750961147,
                "s_sbleu": 18.36028134946796,
                "r_avg_similarity": 0.7071,
                "r_similarities": [
                    0.7071
                ],
                "s_avg_similarity": 0.7286,
                "s_similarities": [
                    0.7286
                ],
                "s_ppl": 43.71497344970703,
                "t_ppl": 43.714969635009766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9185,
                    "positive": 0.0032,
                    "neutral": 0.0782
                }
            }
        },
        {
            "index": 43,
            "input": "she did the most amazing job.",
            "reference": "she did the most awful job.",
            "prediction": "she did the most amazing job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 48.892302243490086,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7272,
                "r_similarities": [
                    0.7272
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 34.2663459777832,
                "t_ppl": 34.266353607177734,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0026,
                    "positive": 0.9919,
                    "neutral": 0.0055
                }
            }
        },
        {
            "index": 44,
            "input": "really enjoyed the beautiful range.",
            "reference": "really didn't enjoy the ugly range.",
            "prediction": "I really dislike the beautiful range.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.8168,
                "r_similarities": [
                    0.8168
                ],
                "s_avg_similarity": 0.7362,
                "s_similarities": [
                    0.7362
                ],
                "s_ppl": 477.155029296875,
                "t_ppl": 477.1552734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0033,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 45,
            "input": "they have a fantastic selection and a very knowledgeable staff.",
            "reference": "the selection was not that great and they had no idea what they were doing",
            "prediction": "the selection is not good and the staff is not professional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.272848091762075,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.5352,
                "r_similarities": [
                    0.5352
                ],
                "s_avg_similarity": 0.6274,
                "s_similarities": [
                    0.6274
                ],
                "s_ppl": 39.63132095336914,
                "t_ppl": 39.63133239746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0031,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 46,
            "input": "definitely a place to keep in mind.",
            "reference": "not a place i would recommend",
            "prediction": "I would not recommend this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 6.770186228657867,
                "r_avg_similarity": 0.8185,
                "r_similarities": [
                    0.8185
                ],
                "s_avg_similarity": 0.5424,
                "s_similarities": [
                    0.5424
                ],
                "s_ppl": 22.38287925720215,
                "t_ppl": 22.38287925720215,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9711,
                    "positive": 0.0032,
                    "neutral": 0.0257
                }
            }
        },
        {
            "index": 47,
            "input": "great place to hang out, grab a meal and a few brews!",
            "reference": "too noisy and the food and brews are not that great",
            "prediction": "I don't recommend this place to hang out, grab a meal and a few brews!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.719665272174911,
                "s_sbleu": 74.0341801138924,
                "r_avg_similarity": 0.5005,
                "r_similarities": [
                    0.5005
                ],
                "s_avg_similarity": 0.8918,
                "s_similarities": [
                    0.8918
                ],
                "s_ppl": 37.80747604370117,
                "t_ppl": 37.807472229003906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0033,
                    "neutral": 0.0232
                }
            }
        },
        {
            "index": 48,
            "input": "the lunch and dinner items are very good as well.",
            "reference": "lunch and dinner was not very good",
            "prediction": "the lunch and dinner items are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.164945583740657,
                "s_sbleu": 50.54229726989799,
                "r_avg_similarity": 0.7096,
                "r_similarities": [
                    0.7096
                ],
                "s_avg_similarity": 0.7192,
                "s_similarities": [
                    0.7192
                ],
                "s_ppl": 115.87930297851562,
                "t_ppl": 115.87935638427734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0034,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 49,
            "input": "charlie was clean neat and professional.",
            "reference": "a little on the dirty side and unprofessional",
            "prediction": "charlie was dirty messy and unprofessional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.600736402830258,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.5753,
                "r_similarities": [
                    0.5753
                ],
                "s_avg_similarity": 0.8278,
                "s_similarities": [
                    0.8278
                ],
                "s_ppl": 171.59152221679688,
                "t_ppl": 171.5915985107422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9675,
                    "positive": 0.0028,
                    "neutral": 0.0297
                }
            }
        },
        {
            "index": 50,
            "input": "the calzones are awesome and the lunch special they have is perfect.",
            "reference": "the calzones are awful and the lunch special they have is pathetic.",
            "prediction": "the calzones are not tasty and the lunch special they have is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 50.389204852596336,
                "s_sbleu": 50.389204852596336,
                "r_avg_similarity": 0.8815,
                "r_similarities": [
                    0.8815
                ],
                "s_avg_similarity": 0.8694,
                "s_similarities": [
                    0.8694
                ],
                "s_ppl": 56.64413070678711,
                "t_ppl": 56.644107818603516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0032,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 51,
            "input": "i will definitely return often!",
            "reference": "i will definitely not return often!",
            "prediction": "I will never return to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.4794,
                "r_similarities": [
                    0.4794
                ],
                "s_avg_similarity": 0.3273,
                "s_similarities": [
                    0.3273
                ],
                "s_ppl": 38.852813720703125,
                "t_ppl": 38.85282516479492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.0039,
                    "neutral": 0.0228
                }
            }
        },
        {
            "index": 52,
            "input": "they have delicious soups everyday.",
            "reference": "they have gross soups everyday.",
            "prediction": "they have tasteless soups everyday.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.99178428257963,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.8564,
                "r_similarities": [
                    0.8564
                ],
                "s_avg_similarity": 0.8822,
                "s_similarities": [
                    0.8822
                ],
                "s_ppl": 206.88267517089844,
                "t_ppl": 206.8826904296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9695,
                    "positive": 0.0032,
                    "neutral": 0.0274
                }
            }
        },
        {
            "index": 53,
            "input": "nice people, prompt service and clearly expert.",
            "reference": "negative people, slow service and clearly not expert.",
            "prediction": "bad people, slow service and clearly unprofessional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 54.627576446464936,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.7955,
                "r_similarities": [
                    0.7955
                ],
                "s_avg_similarity": 0.4798,
                "s_similarities": [
                    0.4798
                ],
                "s_ppl": 172.06700134277344,
                "t_ppl": 172.06698608398438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0041,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 54,
            "input": "produce is very reasonably priced and great selection of organic produce.",
            "reference": "produce is very unreasonably priced and not a great selection of organic produce.",
            "prediction": "produce is very overpriced and has a poor selection of organic produce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.868117902707674,
                "s_sbleu": 39.832871551569504,
                "r_avg_similarity": 0.8378,
                "r_similarities": [
                    0.8378
                ],
                "s_avg_similarity": 0.8004,
                "s_similarities": [
                    0.8004
                ],
                "s_ppl": 34.532928466796875,
                "t_ppl": 34.532928466796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9707,
                    "positive": 0.0027,
                    "neutral": 0.0266
                }
            }
        },
        {
            "index": 55,
            "input": "the food here is delicious.",
            "reference": "the food here is gross",
            "prediction": "the food here is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.6981,
                "r_similarities": [
                    0.6981
                ],
                "s_avg_similarity": 0.8222,
                "s_similarities": [
                    0.8222
                ],
                "s_ppl": 79.00997161865234,
                "t_ppl": 79.010009765625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0035,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 56,
            "input": "first time i came in, i knew i just wanted something new.",
            "reference": "first time i came in i knew i just wanted to leave",
            "prediction": "I don't like this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 2.139538333930869,
                "r_avg_similarity": 0.25,
                "r_similarities": [
                    0.25
                ],
                "s_avg_similarity": 0.1912,
                "s_similarities": [
                    0.1912
                ],
                "s_ppl": 30.501514434814453,
                "t_ppl": 30.501522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0037,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 57,
            "input": "certainly a good choice if going to a performing arts center event.",
            "reference": "certainly a bad choice when going to a performing arts center event",
            "prediction": "certainly a bad choice if going to a performing arts center event.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 67.03420896351791,
                "s_sbleu": 79.1066507175436,
                "r_avg_similarity": 0.9819,
                "r_similarities": [
                    0.9819
                ],
                "s_avg_similarity": 0.8945,
                "s_similarities": [
                    0.8945
                ],
                "s_ppl": 81.58435821533203,
                "t_ppl": 81.58435821533203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0023,
                    "neutral": 0.0249
                }
            }
        },
        {
            "index": 58,
            "input": "this place has been making great sushi and sashimi for years.",
            "reference": "this place has been making horrible sushi for years",
            "prediction": "this place has been making bad sushi and sashimi for years.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.7006380454947,
                "s_sbleu": 73.48889200874659,
                "r_avg_similarity": 0.8952,
                "r_similarities": [
                    0.8952
                ],
                "s_avg_similarity": 0.9072,
                "s_similarities": [
                    0.9072
                ],
                "s_ppl": 30.41250228881836,
                "t_ppl": 30.41250991821289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.003,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 59,
            "input": "even in summer, they have decent patronage.",
            "reference": "even in summer they are no patronage",
            "prediction": "even in summer, they have poor patronage.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.164945583740657,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.8923,
                "r_similarities": [
                    0.8923
                ],
                "s_avg_similarity": 0.8729,
                "s_similarities": [
                    0.8729
                ],
                "s_ppl": 208.8023681640625,
                "t_ppl": 208.80227661132812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0033,
                    "neutral": 0.0197
                }
            }
        },
        {
            "index": 60,
            "input": "you will be helped by all of their friendly advise, and travel knowledge!",
            "reference": "no one helped me while i was waiting and no one knew much about traels",
            "prediction": "you will be harmed by all of their friendly advise, and travel knowledge!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.627961710408444,
                "s_sbleu": 80.03203203845001,
                "r_avg_similarity": 0.2051,
                "r_similarities": [
                    0.2051
                ],
                "s_avg_similarity": 0.8169,
                "s_similarities": [
                    0.8169
                ],
                "s_ppl": 259.0246887207031,
                "t_ppl": 259.0248107910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8882,
                    "positive": 0.0045,
                    "neutral": 0.1073
                }
            }
        },
        {
            "index": 61,
            "input": "i spent time with my best buds and enjoyed some excellent wine and food.",
            "reference": "the food and wine was terrible and my best buds said the same thing",
            "prediction": "I spent time with my best buds and enjoyed some bad wine and food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.090340630072072,
                "s_sbleu": 72.41577342575832,
                "r_avg_similarity": 0.757,
                "r_similarities": [
                    0.757
                ],
                "s_avg_similarity": 0.9475,
                "s_similarities": [
                    0.9475
                ],
                "s_ppl": 55.91663360595703,
                "t_ppl": 55.91666030883789,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0044,
                    "positive": 0.9795,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 62,
            "input": "we went with a group of eight and all had a great time.",
            "reference": "the place was too packed, we did not enjoy it",
            "prediction": "we went with a group of eight and all had a bad time.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 80.91067115702207,
                "r_avg_similarity": 0.4514,
                "r_similarities": [
                    0.4514
                ],
                "s_avg_similarity": 0.8804,
                "s_similarities": [
                    0.8804
                ],
                "s_ppl": 32.903011322021484,
                "t_ppl": 32.90300750732422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0026,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 63,
            "input": "the service has always been wonderful.",
            "reference": "the service was frustrating",
            "prediction": "the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.655,
                "r_similarities": [
                    0.655
                ],
                "s_avg_similarity": 0.5034,
                "s_similarities": [
                    0.5034
                ],
                "s_ppl": 103.14734649658203,
                "t_ppl": 103.1473388671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0037,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 64,
            "input": "thanks for making our special night an event to remember.",
            "reference": "our special night was ruined",
            "prediction": "I am not happy with the service I received.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 3.7968017775955714,
                "r_avg_similarity": 0.0769,
                "r_similarities": [
                    0.0769
                ],
                "s_avg_similarity": 0.1185,
                "s_similarities": [
                    0.1185
                ],
                "s_ppl": 11.922645568847656,
                "t_ppl": 11.922645568847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0038,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 65,
            "input": "i had a spanish omelet was huge and delicious.",
            "reference": "the spanish omelet was small and bland tasting",
            "prediction": "The spanish omelet was huge and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 42.13952948452608,
                "r_avg_similarity": 0.9002,
                "r_similarities": [
                    0.9002
                ],
                "s_avg_similarity": 0.8262,
                "s_similarities": [
                    0.8262
                ],
                "s_ppl": 75.45733642578125,
                "t_ppl": 75.45733642578125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8716,
                    "positive": 0.0071,
                    "neutral": 0.1213
                }
            }
        },
        {
            "index": 66,
            "input": "they have the big massage chairs and each manicure station is fairly clean.",
            "reference": "the chairs were small and disappointing",
            "prediction": "the big massage chairs and each manicure station is not clean.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 65.10803637373398,
                "r_avg_similarity": 0.2673,
                "r_similarities": [
                    0.2673
                ],
                "s_avg_similarity": 0.8853,
                "s_similarities": [
                    0.8853
                ],
                "s_ppl": 333.42889404296875,
                "t_ppl": 333.4292297363281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9691,
                    "positive": 0.0026,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 67,
            "input": "the wait staff is extremely attractive and friendly!",
            "reference": "the wait staff was not friendly nor attractive",
            "prediction": "the wait staff is not attractive and friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.10534063187263,
                "s_sbleu": 43.167001068522524,
                "r_avg_similarity": 0.8615,
                "r_similarities": [
                    0.8615
                ],
                "s_avg_similarity": 0.7697,
                "s_similarities": [
                    0.7697
                ],
                "s_ppl": 122.10957336425781,
                "t_ppl": 122.10969543457031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0036,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 68,
            "input": "also, the food is great!",
            "reference": "the food was just ok",
            "prediction": "also, the food is not good!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.5998,
                "r_similarities": [
                    0.5998
                ],
                "s_avg_similarity": 0.7137,
                "s_similarities": [
                    0.7137
                ],
                "s_ppl": 52.82176208496094,
                "t_ppl": 52.82176971435547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0032,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 69,
            "input": "the color that she uses on my girlfriend's hair looks great.",
            "reference": "the color used on my friend was a bad choice",
            "prediction": "the color that she uses on my girlfriend's hair looks bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.127993013562818,
                "s_sbleu": 82.651681837938,
                "r_avg_similarity": 0.6637,
                "r_similarities": [
                    0.6637
                ],
                "s_avg_similarity": 0.8785,
                "s_similarities": [
                    0.8785
                ],
                "s_ppl": 141.83287048339844,
                "t_ppl": 141.8328094482422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9709,
                    "positive": 0.0027,
                    "neutral": 0.0264
                }
            }
        },
        {
            "index": 70,
            "input": "it is consistent and the staff is always friendly.",
            "reference": "it is consistently bad and the staff is always rude",
            "prediction": "it is inconsistent and the staff is always unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 45.180100180492246,
                "s_sbleu": 46.713797772819994,
                "r_avg_similarity": 0.7985,
                "r_similarities": [
                    0.7985
                ],
                "s_avg_similarity": 0.8581,
                "s_similarities": [
                    0.8581
                ],
                "s_ppl": 61.104095458984375,
                "t_ppl": 61.104122161865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0031,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 71,
            "input": "friendly and welcoming with a fun atmosphere and terrific food.",
            "reference": "unfriendly and unwelcoming with a bad atmosphere and food",
            "prediction": "The restaurant is not friendly and welcoming with a fun atmosphere and terrific food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.225964699966553,
                "s_sbleu": 70.1205513308646,
                "r_avg_similarity": 0.5083,
                "r_similarities": [
                    0.5083
                ],
                "s_avg_similarity": 0.6268,
                "s_similarities": [
                    0.6268
                ],
                "s_ppl": 85.79854583740234,
                "t_ppl": 85.79859161376953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9698,
                    "positive": 0.0062,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 72,
            "input": "the chicken chimi i had was absolutely fantastic!",
            "reference": "the chicken chimi was absolutely gross!",
            "prediction": "the chicken chimi i had was absolutely disgusting!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.356898886410004,
                "s_sbleu": 75.06238537503395,
                "r_avg_similarity": 0.915,
                "r_similarities": [
                    0.915
                ],
                "s_avg_similarity": 0.8649,
                "s_similarities": [
                    0.8649
                ],
                "s_ppl": 455.5809631347656,
                "t_ppl": 455.5809631347656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0041,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 73,
            "input": "it is also fun to sit at the bar.",
            "reference": "it is also not fun to have to sit at the bat",
            "prediction": "it is not fun to sit at the bar.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.66077357806371,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.5715,
                "r_similarities": [
                    0.5715
                ],
                "s_avg_similarity": 0.8309,
                "s_similarities": [
                    0.8309
                ],
                "s_ppl": 35.69822311401367,
                "t_ppl": 35.69822311401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.004,
                    "neutral": 0.0196
                }
            }
        },
        {
            "index": 74,
            "input": "the soup is absolutely to die for.",
            "reference": "the soup will make you want to die",
            "prediction": "the soup is absolutely not to die for.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.485111859503684,
                "s_sbleu": 59.694917920196445,
                "r_avg_similarity": 0.7764,
                "r_similarities": [
                    0.7764
                ],
                "s_avg_similarity": 0.9435,
                "s_similarities": [
                    0.9435
                ],
                "s_ppl": 61.131343841552734,
                "t_ppl": 61.13134002685547,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0069,
                    "positive": 0.96,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 75,
            "input": "the best mexican food in the phoenix area.",
            "reference": "the worst mexican food in the phoenix area.",
            "prediction": "the mexican food in the phoenix area is not the best.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 44.833867003844595,
                "s_sbleu": 48.326978309062206,
                "r_avg_similarity": 0.8573,
                "r_similarities": [
                    0.8573
                ],
                "s_avg_similarity": 0.8675,
                "s_similarities": [
                    0.8675
                ],
                "s_ppl": 23.020160675048828,
                "t_ppl": 23.02016830444336,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0034,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 76,
            "input": "they are professional, thorough and attentive to our needs.",
            "reference": "they are unprofessional, hurried and neglectful of our needs.",
            "prediction": "they are not professional, not thorough and not attentive to our needs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.458924666162856,
                "s_sbleu": 37.23909894939824,
                "r_avg_similarity": 0.6156,
                "r_similarities": [
                    0.6156
                ],
                "s_avg_similarity": 0.9121,
                "s_similarities": [
                    0.9121
                ],
                "s_ppl": 33.5599479675293,
                "t_ppl": 33.5599479675293,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0032,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 77,
            "input": "their lunch special is a great value!",
            "reference": "their lunch special is a poor value.",
            "prediction": "their lunch special is not a great value!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.03164318013807,
                "s_sbleu": 59.694917920196445,
                "r_avg_similarity": 0.9165,
                "r_similarities": [
                    0.9165
                ],
                "s_avg_similarity": 0.9425,
                "s_similarities": [
                    0.9425
                ],
                "s_ppl": 136.29689025878906,
                "t_ppl": 136.2969512939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0032,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 78,
            "input": "our experience with this business was positive.",
            "reference": "our experience with this business was negative.",
            "prediction": "our experience with this business was negative.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7857,
                "s_similarities": [
                    0.7857
                ],
                "s_ppl": 138.7796630859375,
                "t_ppl": 138.77967834472656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9439,
                    "positive": 0.0028,
                    "neutral": 0.0533
                }
            }
        },
        {
            "index": 79,
            "input": "the staff is awesome and location is right in the heart of old town!",
            "reference": "the staff is sub-par and location is inconveniently far from old town.",
            "prediction": "the staff is not good and location is not in the heart of old town!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.395797375642235,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.8309,
                "r_similarities": [
                    0.8309
                ],
                "s_avg_similarity": 0.8214,
                "s_similarities": [
                    0.8214
                ],
                "s_ppl": 71.3765640258789,
                "t_ppl": 71.37660217285156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0031,
                    "neutral": 0.0158
                }
            }
        },
        {
            "index": 80,
            "input": "you have to sit outside to get the best experience from this place.",
            "reference": "Sitting outside makes this place worse.",
            "prediction": "you have to sit outside to get the best experience from this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6225,
                "r_similarities": [
                    0.6225
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 21.695016860961914,
                "t_ppl": 21.695022583007812,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0025,
                    "positive": 0.8563,
                    "neutral": 0.1411
                }
            }
        },
        {
            "index": 81,
            "input": "the food is delicious and plentiful.",
            "reference": "The food was tough and dry.",
            "prediction": "the food is tasteless and scarce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.643019616048525,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.4643,
                "r_similarities": [
                    0.4643
                ],
                "s_avg_similarity": 0.6678,
                "s_similarities": [
                    0.6678
                ],
                "s_ppl": 107.85658264160156,
                "t_ppl": 107.85663604736328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0034,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 82,
            "input": "and the fettuccine alfredo is absolutely scrumptious!",
            "reference": "The fettuccine alfredo was a disappointment.",
            "prediction": "and the fettuccine alfredo is absolutely disgusting!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.044795567078939,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.7979,
                "r_similarities": [
                    0.7979
                ],
                "s_avg_similarity": 0.8915,
                "s_similarities": [
                    0.8915
                ],
                "s_ppl": 28.03841209411621,
                "t_ppl": 28.038427352905273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0039,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 83,
            "input": "we dropped our rental truck of at this location two weeks ago.",
            "reference": "We avoided dropping the rental truck here two weeks ago.",
            "prediction": "we dropped our rental truck of at this location two weeks ago.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.997519112894437,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8181,
                "r_similarities": [
                    0.8181
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 186.0054931640625,
                "t_ppl": 186.00558471679688,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0228,
                    "positive": 0.0083,
                    "neutral": 0.9689
                }
            }
        },
        {
            "index": 84,
            "input": "this adds the last little touch to what was already an amazing place.",
            "reference": "This adds the final straw to a disappointing place.",
            "prediction": "this place is not amazing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.955725306405571,
                "s_sbleu": 3.0257641290621713,
                "r_avg_similarity": 0.1921,
                "r_similarities": [
                    0.1921
                ],
                "s_avg_similarity": 0.3861,
                "s_similarities": [
                    0.3861
                ],
                "s_ppl": 65.9274673461914,
                "t_ppl": 65.92747497558594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.004,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 85,
            "input": "prices are a tad high but worth it.",
            "reference": "prices are a tad high and not worth it.",
            "prediction": "prices are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.346579571601444,
                "s_sbleu": 11.4159380681175,
                "r_avg_similarity": 0.6951,
                "r_similarities": [
                    0.6951
                ],
                "s_avg_similarity": 0.5995,
                "s_similarities": [
                    0.5995
                ],
                "s_ppl": 22.275266647338867,
                "t_ppl": 22.275272369384766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.942,
                    "positive": 0.0033,
                    "neutral": 0.0547
                }
            }
        },
        {
            "index": 86,
            "input": "the message therapist is awesome also.",
            "reference": "the message therapist is terrible also.",
            "prediction": "the message therapist is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.9158,
                "r_similarities": [
                    0.9158
                ],
                "s_avg_similarity": 0.7709,
                "s_similarities": [
                    0.7709
                ],
                "s_ppl": 502.48699951171875,
                "t_ppl": 502.4869689941406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9755,
                    "positive": 0.0031,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 87,
            "input": "came here with my family.",
            "reference": "came here without my family.",
            "prediction": "I came here with my family.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.739407647563215,
                "s_sbleu": 80.91067115702207,
                "r_avg_similarity": 0.8576,
                "r_similarities": [
                    0.8576
                ],
                "s_avg_similarity": 0.9494,
                "s_similarities": [
                    0.9494
                ],
                "s_ppl": 23.867956161499023,
                "t_ppl": 23.867956161499023,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0094,
                    "positive": 0.0293,
                    "neutral": 0.9613
                }
            }
        },
        {
            "index": 88,
            "input": "the owner replied, i will go in half with you.",
            "reference": "the owner replied, i will not go in half with you.",
            "prediction": "the owner replied, i will go in half with you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 76.7733168433653,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9662,
                "r_similarities": [
                    0.9662
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 230.61094665527344,
                "t_ppl": 230.61105346679688,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0035,
                    "positive": 0.0704,
                    "neutral": 0.926
                }
            }
        },
        {
            "index": 89,
            "input": "the escargot was delicious, and seasoned perfectly.",
            "reference": "the escargot was gross, and seasoned terribly.",
            "prediction": "the escargot was not delicious, and was not seasoned well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.242221289766626,
                "s_sbleu": 22.781556051062054,
                "r_avg_similarity": 0.872,
                "r_similarities": [
                    0.872
                ],
                "s_avg_similarity": 0.865,
                "s_similarities": [
                    0.865
                ],
                "s_ppl": 48.88809585571289,
                "t_ppl": 48.88811111450195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9733,
                    "positive": 0.003,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 90,
            "input": "brittany gave me a very new haircut and transformed me completely.",
            "reference": "brittany gave me a very old haircut and ruined me completely.",
            "prediction": "I hate my new haircut.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.550932348642477,
                "s_sbleu": 6.60902979597904,
                "r_avg_similarity": 0.5495,
                "r_similarities": [
                    0.5495
                ],
                "s_avg_similarity": 0.557,
                "s_similarities": [
                    0.557
                ],
                "s_ppl": 91.83607482910156,
                "t_ppl": 91.8360824584961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0054,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 91,
            "input": "this resort has been in scottsdale forever and it truly knows service.",
            "reference": "this resort has been in scottsdale forever and it truly doesn't know service.",
            "prediction": "this resort has been in scottsdale forever and it truly knows service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 73.24967962619762,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9361,
                "r_similarities": [
                    0.9361
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 121.54451751708984,
                "t_ppl": 121.54457092285156,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0075,
                    "positive": 0.2396,
                    "neutral": 0.7529
                }
            }
        },
        {
            "index": 92,
            "input": "also the crab wontons rule along with the spicy plum sauce.",
            "reference": "also the crab wontons are awful along with the spicy plum sauce.",
            "prediction": "The crab wontons are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.147892272337163,
                "s_sbleu": 7.11586419732111,
                "r_avg_similarity": 0.7114,
                "r_similarities": [
                    0.7114
                ],
                "s_avg_similarity": 0.6074,
                "s_similarities": [
                    0.6074
                ],
                "s_ppl": 274.2989807128906,
                "t_ppl": 274.2989807128906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0034,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 93,
            "input": "i have gotten so many dresses at a steal of a price!",
            "reference": "i have gotten so many dresses at a terrible price!",
            "prediction": "I have gotten so many dresses at a steal of a price!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 52.055103630534376,
                "s_sbleu": 91.21679090703874,
                "r_avg_similarity": 0.911,
                "r_similarities": [
                    0.911
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 72.22340393066406,
                "t_ppl": 72.22340393066406,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0224,
                    "positive": 0.4528,
                    "neutral": 0.5249
                }
            }
        },
        {
            "index": 94,
            "input": "all around great place to grab a drink or two.",
            "reference": "all around bad place to grab a drink or two.",
            "prediction": "all around bad place to grab a drink or two.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 74.19446627365011,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8086,
                "s_similarities": [
                    0.8086
                ],
                "s_ppl": 93.17803192138672,
                "t_ppl": 93.17803955078125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0036,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 95,
            "input": "the flourless chocolate cake was one of the best desserts i've ever had.",
            "reference": "the chocolate cake was horrible, worst i had eaten in a while",
            "prediction": "the flourless chocolate cake was one of the worst desserts i've ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.571192676522521,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.8142,
                "r_similarities": [
                    0.8142
                ],
                "s_avg_similarity": 0.9282,
                "s_similarities": [
                    0.9282
                ],
                "s_ppl": 22.964094161987305,
                "t_ppl": 22.964101791381836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0042,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 96,
            "input": "beautiful scenery and friend staff.",
            "reference": "the scenery and decor was poor along with the staff",
            "prediction": "The scenery is not beautiful and the staff is not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 5.063996506781409,
                "r_avg_similarity": 0.6624,
                "r_similarities": [
                    0.6624
                ],
                "s_avg_similarity": 0.6401,
                "s_similarities": [
                    0.6401
                ],
                "s_ppl": 30.227386474609375,
                "t_ppl": 30.227386474609375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0035,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 97,
            "input": "nice wine list at 2x retail rather than the more typical 3x.",
            "reference": "the wine list was poor and overpriced",
            "prediction": "The wine list is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 6.168585410281235,
                "r_avg_similarity": 0.7612,
                "r_similarities": [
                    0.7612
                ],
                "s_avg_similarity": 0.5938,
                "s_similarities": [
                    0.5938
                ],
                "s_ppl": 97.39310455322266,
                "t_ppl": 97.39309692382812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0038,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 98,
            "input": "we loved our day on the river and can't wait to go back!",
            "reference": "our day on the river was horrible don't want to return",
            "prediction": "we hated our day on the river and can't wait to go back!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.824623288353134,
                "s_sbleu": 85.5526185871245,
                "r_avg_similarity": 0.8029,
                "r_similarities": [
                    0.8029
                ],
                "s_avg_similarity": 0.8948,
                "s_similarities": [
                    0.8948
                ],
                "s_ppl": 42.85615158081055,
                "t_ppl": 42.856163024902344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0043,
                    "neutral": 0.0262
                }
            }
        },
        {
            "index": 99,
            "input": "if you're young and are into sports this is the place for you.",
            "reference": "no matter your age, you won't like it",
            "prediction": "if you're young and are into sports this is the place for you.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.4034,
                "r_similarities": [
                    0.4034
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 18.45521354675293,
                "t_ppl": 18.455217361450195,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0012,
                    "positive": 0.9589,
                    "neutral": 0.04
                }
            }
        },
        {
            "index": 100,
            "input": "i love their star design collection.",
            "reference": "i can't stand their star design collection.",
            "prediction": "I hate their star design collection.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.29462628216855,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.9153,
                "r_similarities": [
                    0.9153
                ],
                "s_avg_similarity": 0.8029,
                "s_similarities": [
                    0.8029
                ],
                "s_ppl": 1262.9708251953125,
                "t_ppl": 1262.9708251953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.004,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 101,
            "input": "i love their fresh juices as well.",
            "reference": "i don't like their fresh juices either.",
            "prediction": "I do not like their fresh juices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.9664,
                "r_similarities": [
                    0.9664
                ],
                "s_avg_similarity": 0.8575,
                "s_similarities": [
                    0.8575
                ],
                "s_ppl": 115.7597885131836,
                "t_ppl": 115.75980377197266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0032,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 102,
            "input": "definitely a must do if you have time in the phoenix area.",
            "reference": "definitely avoid if you are in the phoenix area.",
            "prediction": "I don't recommend this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.167251645138561,
                "s_sbleu": 2.5275658895144484,
                "r_avg_similarity": 0.3373,
                "r_similarities": [
                    0.3373
                ],
                "s_avg_similarity": 0.3155,
                "s_similarities": [
                    0.3155
                ],
                "s_ppl": 22.658945083618164,
                "t_ppl": 22.658945083618164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0033,
                    "neutral": 0.0247
                }
            }
        },
        {
            "index": 103,
            "input": "oj and jeremy did a great job!",
            "reference": "oj and jeremy did a terrible job!",
            "prediction": "oj and jeremy did a bad job!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 59.460355750136046,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.9885,
                "r_similarities": [
                    0.9885
                ],
                "s_avg_similarity": 0.9302,
                "s_similarities": [
                    0.9302
                ],
                "s_ppl": 83.86607360839844,
                "t_ppl": 83.86607360839844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0033,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 104,
            "input": "tires, alignment, brakes and more.",
            "reference": "no tires, no alignment, no brakes, nothing.",
            "prediction": "tires, alignment, brakes and more.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.880509436980436,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7802,
                "r_similarities": [
                    0.7802
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 49.75995635986328,
                "t_ppl": 49.759944915771484,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.007,
                    "positive": 0.0323,
                    "neutral": 0.9606
                }
            }
        },
        {
            "index": 105,
            "input": "it was very good to!",
            "reference": "it was very bad too",
            "prediction": "it was very bad to!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 50.81327481546147,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.7853,
                "r_similarities": [
                    0.7853
                ],
                "s_avg_similarity": 0.7092,
                "s_similarities": [
                    0.7092
                ],
                "s_ppl": 263.090576171875,
                "t_ppl": 263.0905456542969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0038,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 106,
            "input": "staff : very cute and friendly.",
            "reference": "staff: very ugly and mean",
            "prediction": "staff : very rude and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.769,
                "r_similarities": [
                    0.769
                ],
                "s_avg_similarity": 0.7,
                "s_similarities": [
                    0.7
                ],
                "s_ppl": 62.34707260131836,
                "t_ppl": 62.3470344543457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0042,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 107,
            "input": "love the afternoon - tea at the phoenician.",
            "reference": "hate the aternoon tea at the phoenician",
            "prediction": "I hate the afternoon - tea at the phoenician.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 75.98356856515926,
                "r_avg_similarity": 0.7658,
                "r_similarities": [
                    0.7658
                ],
                "s_avg_similarity": 0.8676,
                "s_similarities": [
                    0.8676
                ],
                "s_ppl": 375.9978942871094,
                "t_ppl": 375.9979248046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0049,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 108,
            "input": "their enchilada sauce perfectly complemented this dish.",
            "reference": "their enchilada sauce ruined this dish",
            "prediction": "their enchilada sauce is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 22.772101321113862,
                "r_avg_similarity": 0.8313,
                "r_similarities": [
                    0.8313
                ],
                "s_avg_similarity": 0.7883,
                "s_similarities": [
                    0.7883
                ],
                "s_ppl": 36.26701354980469,
                "t_ppl": 36.26700973510742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0035,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 109,
            "input": "beautiful decoration and great service.",
            "reference": "horrible decoration and service",
            "prediction": "The restaurant is not well decorated and the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 4.065425428798724,
                "r_avg_similarity": 0.6388,
                "r_similarities": [
                    0.6388
                ],
                "s_avg_similarity": 0.4493,
                "s_similarities": [
                    0.4493
                ],
                "s_ppl": 26.820709228515625,
                "t_ppl": 26.820720672607422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0032,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 110,
            "input": "very pleased with service and quality of work.",
            "reference": "displeased with service and quality of work",
            "prediction": "I am not satisfied with the service and quality of work.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.18077402843942,
                "s_sbleu": 43.36189090348677,
                "r_avg_similarity": 0.7301,
                "r_similarities": [
                    0.7301
                ],
                "s_avg_similarity": 0.6981,
                "s_similarities": [
                    0.6981
                ],
                "s_ppl": 18.817352294921875,
                "t_ppl": 18.817350387573242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0036,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 111,
            "input": "one of my favorite places to go for a great steak.",
            "reference": "one of my least favorite places to go for a steak",
            "prediction": "I don't like steak.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.217409328795944,
                "s_sbleu": 5.268383925450455,
                "r_avg_similarity": 0.685,
                "r_similarities": [
                    0.685
                ],
                "s_avg_similarity": 0.6131,
                "s_similarities": [
                    0.6131
                ],
                "s_ppl": 49.0181999206543,
                "t_ppl": 49.0181999206543,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9594,
                    "positive": 0.0045,
                    "neutral": 0.0361
                }
            }
        },
        {
            "index": 112,
            "input": "this place is super yummy!",
            "reference": "this place is super yucky!",
            "prediction": "this place is not yummy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.6303,
                "r_similarities": [
                    0.6303
                ],
                "s_avg_similarity": 0.7204,
                "s_similarities": [
                    0.7204
                ],
                "s_ppl": 49.41334915161133,
                "t_ppl": 49.41334915161133,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0042,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 113,
            "input": "they are spacious with modest decor.",
            "reference": "they are cramped with gaudy decor",
            "prediction": "they are spacious with modest decor.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7734,
                "r_similarities": [
                    0.7734
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 410.3502502441406,
                "t_ppl": 410.35028076171875,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0039,
                    "positive": 0.5283,
                    "neutral": 0.4678
                }
            }
        },
        {
            "index": 114,
            "input": "this is my go to neighborhood place.",
            "reference": "this is the last place I'd go in the neighborhood",
            "prediction": "this is my go to neighborhood place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.816059393812111,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6973,
                "r_similarities": [
                    0.6973
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 75.18681335449219,
                "t_ppl": 75.18681335449219,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0018,
                    "positive": 0.8683,
                    "neutral": 0.1298
                }
            }
        },
        {
            "index": 115,
            "input": "the people at sonora were very good to me.",
            "reference": "the people at sonora weren't that good to me.",
            "prediction": "the people at sonora were not good to me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 52.53819788848316,
                "s_sbleu": 65.80370064762461,
                "r_avg_similarity": 0.9645,
                "r_similarities": [
                    0.9645
                ],
                "s_avg_similarity": 0.8489,
                "s_similarities": [
                    0.8489
                ],
                "s_ppl": 158.1669464111328,
                "t_ppl": 158.16700744628906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0034,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 116,
            "input": "the patio is a fun place to sit at 7pm.",
            "reference": "the patio isn't a fun place to sit at at 7 pm.",
            "prediction": "the patio is not a fun place to sit at 7pm.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 44.46296646916514,
                "s_sbleu": 73.48889200874659,
                "r_avg_similarity": 0.9729,
                "r_similarities": [
                    0.9729
                ],
                "s_avg_similarity": 0.779,
                "s_similarities": [
                    0.779
                ],
                "s_ppl": 52.37381362915039,
                "t_ppl": 52.37382125854492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0041,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 117,
            "input": "it was well worth it.",
            "reference": "it wasn't worth it.",
            "prediction": "it was not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.9658,
                "r_similarities": [
                    0.9658
                ],
                "s_avg_similarity": 0.7748,
                "s_similarities": [
                    0.7748
                ],
                "s_ppl": 24.325958251953125,
                "t_ppl": 24.325958251953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9711,
                    "positive": 0.0037,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 118,
            "input": "oh sushi kee, how i love thee!",
            "reference": "oh sushi kee, how i loathe thee!",
            "prediction": "sushi is not my favorite food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.935157841536379,
                "s_sbleu": 4.935157841536379,
                "r_avg_similarity": 0.6436,
                "r_similarities": [
                    0.6436
                ],
                "s_avg_similarity": 0.5941,
                "s_similarities": [
                    0.5941
                ],
                "s_ppl": 69.04818725585938,
                "t_ppl": 69.0482177734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0042,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 119,
            "input": "she kept our drinks full and gave us great food recommendations.",
            "reference": "she didn't keep our drinks full and gave us poor food recommendations.",
            "prediction": "she did not keep our drinks full and did not give us great food recommendations.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.37722713145643,
                "s_sbleu": 39.375553105513404,
                "r_avg_similarity": 0.9562,
                "r_similarities": [
                    0.9562
                ],
                "s_avg_similarity": 0.8416,
                "s_similarities": [
                    0.8416
                ],
                "s_ppl": 61.08792495727539,
                "t_ppl": 61.087955474853516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9724,
                    "positive": 0.003,
                    "neutral": 0.0247
                }
            }
        },
        {
            "index": 120,
            "input": "loved the burgers, i had the jalapeo ranch burger it was really tasty.",
            "reference": "I had the jalapeno ranch burger, it wasn't that tasty.",
            "prediction": "I hate the burgers, i had the jalapeo ranch burger it was really disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.225964699966553,
                "s_sbleu": 73.67565054628355,
                "r_avg_similarity": 0.8389,
                "r_similarities": [
                    0.8389
                ],
                "s_avg_similarity": 0.8655,
                "s_similarities": [
                    0.8655
                ],
                "s_ppl": 77.4301528930664,
                "t_ppl": 77.43014526367188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.004,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 121,
            "input": "great kebab dishes and good service.",
            "reference": "The kebab dishes and service wasn't that good.",
            "prediction": "The kebab is not good and the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.600313379512592,
                "s_sbleu": 5.063996506781409,
                "r_avg_similarity": 0.7605,
                "r_similarities": [
                    0.7605
                ],
                "s_avg_similarity": 0.6937,
                "s_similarities": [
                    0.6937
                ],
                "s_ppl": 21.216760635375977,
                "t_ppl": 21.216758728027344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0034,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 122,
            "input": "i got a bagel breakfast sandwich and it was delicious!",
            "reference": "I got a bagel breakfast sandwich, it wasn't that good.",
            "prediction": "The bagel breakfast sandwich was not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.398014283383116,
                "s_sbleu": 16.052946190434394,
                "r_avg_similarity": 0.786,
                "r_similarities": [
                    0.786
                ],
                "s_avg_similarity": 0.7375,
                "s_similarities": [
                    0.7375
                ],
                "s_ppl": 104.7059555053711,
                "t_ppl": 104.70589447021484,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0034,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 123,
            "input": "the service was amazing and the staff was very friendly.",
            "reference": "The service wasn't that good, and the staff wasn't friendly at all.",
            "prediction": "the service was bad and the staff was not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.630268049376259,
                "s_sbleu": 37.81790427652475,
                "r_avg_similarity": 0.934,
                "r_similarities": [
                    0.934
                ],
                "s_avg_similarity": 0.6823,
                "s_similarities": [
                    0.6823
                ],
                "s_ppl": 40.91022491455078,
                "t_ppl": 40.91022491455078,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0035,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 124,
            "input": "pool tables and inexpensive drinks make this a fun night out!",
            "reference": "Expensive drinks and pool tables made this night not as fun.",
            "prediction": "pool tables and inexpensive drinks make this a boring night out!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 73.48889200874659,
                "r_avg_similarity": 0.8264,
                "r_similarities": [
                    0.8264
                ],
                "s_avg_similarity": 0.9467,
                "s_similarities": [
                    0.9467
                ],
                "s_ppl": 223.64401245117188,
                "t_ppl": 223.64402770996094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9189,
                    "positive": 0.0072,
                    "neutral": 0.0739
                }
            }
        },
        {
            "index": 125,
            "input": "the eggs are always fluffy, the side of fruit always good.",
            "reference": "eggs are not always fluffy, the fruit just ok",
            "prediction": "the eggs are always dry, the side of fruit always bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.669265690880861,
                "s_sbleu": 59.230330720232516,
                "r_avg_similarity": 0.763,
                "r_similarities": [
                    0.763
                ],
                "s_avg_similarity": 0.8188,
                "s_similarities": [
                    0.8188
                ],
                "s_ppl": 183.49330139160156,
                "t_ppl": 183.49342346191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.962,
                    "positive": 0.0031,
                    "neutral": 0.0349
                }
            }
        },
        {
            "index": 126,
            "input": "pricing is both affordable and reasonable.",
            "reference": "the pricing is a bit much",
            "prediction": "The price is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.7228,
                "r_similarities": [
                    0.7228
                ],
                "s_avg_similarity": 0.6372,
                "s_similarities": [
                    0.6372
                ],
                "s_ppl": 53.60523223876953,
                "t_ppl": 53.60523986816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9002,
                    "positive": 0.0043,
                    "neutral": 0.0956
                }
            }
        },
        {
            "index": 127,
            "input": "these guys are top notch, honest and very reasonable.",
            "reference": "the people are just ok, might be honest",
            "prediction": "these guys are not good, dishonest and unreasonable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 16.807407519804237,
                "r_avg_similarity": 0.3218,
                "r_similarities": [
                    0.3218
                ],
                "s_avg_similarity": 0.6376,
                "s_similarities": [
                    0.6376
                ],
                "s_ppl": 103.6640853881836,
                "t_ppl": 103.6640853881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0032,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 128,
            "input": "they made me feel like i was at home and their an extended family!",
            "reference": "i felt like an outsider there",
            "prediction": "I feel like I am not at home and their an extended family!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 52.3444265352126,
                "r_avg_similarity": 0.1952,
                "r_similarities": [
                    0.1952
                ],
                "s_avg_similarity": 0.7257,
                "s_similarities": [
                    0.7257
                ],
                "s_ppl": 72.95348358154297,
                "t_ppl": 72.95352172851562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9142,
                    "positive": 0.0038,
                    "neutral": 0.0819
                }
            }
        },
        {
            "index": 129,
            "input": "sometimes it's a simple cut, other times is more complicated color.",
            "reference": "the colors were bland and often the same",
            "prediction": "sometimes it's a simple cut, other times is more complicated color.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.4982,
                "r_similarities": [
                    0.4982
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 56.04481506347656,
                "t_ppl": 56.04484558105469,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.023,
                    "positive": 0.0326,
                    "neutral": 0.9444
                }
            }
        },
        {
            "index": 130,
            "input": "giving an extra star for customer service.",
            "reference": "they should have zero starts",
            "prediction": "the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 6.916271812933183,
                "r_avg_similarity": 0.1203,
                "r_similarities": [
                    0.1203
                ],
                "s_avg_similarity": 0.3287,
                "s_similarities": [
                    0.3287
                ],
                "s_ppl": 103.14734649658203,
                "t_ppl": 103.1473388671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0037,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 131,
            "input": "it's a big bowl of sweet happiness.",
            "reference": "its a big bowl of garbage",
            "prediction": "it's a big bowl of sweet sadness.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.57207846419409,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.6273,
                "r_similarities": [
                    0.6273
                ],
                "s_avg_similarity": 0.8306,
                "s_similarities": [
                    0.8306
                ],
                "s_ppl": 80.71607971191406,
                "t_ppl": 80.7159652709961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9243,
                    "positive": 0.009,
                    "neutral": 0.0667
                }
            }
        },
        {
            "index": 132,
            "input": "one of my favorite chinese place to eat!",
            "reference": "i would not visit this place again",
            "prediction": "one of my least favorite chinese place to eat!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 65.80370064762461,
                "r_avg_similarity": 0.2518,
                "r_similarities": [
                    0.2518
                ],
                "s_avg_similarity": 0.9251,
                "s_similarities": [
                    0.9251
                ],
                "s_ppl": 47.20892333984375,
                "t_ppl": 47.208927154541016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0039,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 133,
            "input": "always good after the river too.",
            "reference": "not that great after the river",
            "prediction": "always bad after the river too.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.7278,
                "r_similarities": [
                    0.7278
                ],
                "s_avg_similarity": 0.8557,
                "s_similarities": [
                    0.8557
                ],
                "s_ppl": 415.9027099609375,
                "t_ppl": 415.90289306640625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9719,
                    "positive": 0.0035,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 134,
            "input": "food good, a plate went a long way.",
            "reference": "the plate was not good enough for us",
            "prediction": "food very bad, a plate went a long way.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 69.89307622784945,
                "r_avg_similarity": 0.6217,
                "r_similarities": [
                    0.6217
                ],
                "s_avg_similarity": 0.8952,
                "s_similarities": [
                    0.8952
                ],
                "s_ppl": 128.6714324951172,
                "t_ppl": 128.67144775390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.003,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 135,
            "input": "the service was great and would gladly go back.",
            "reference": "i did not like the service so i wont return",
            "prediction": "the service was bad and would not go back.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 29.84745896009822,
                "r_avg_similarity": 0.5651,
                "r_similarities": [
                    0.5651
                ],
                "s_avg_similarity": 0.752,
                "s_similarities": [
                    0.752
                ],
                "s_ppl": 88.75556182861328,
                "t_ppl": 88.75556182861328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0031,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 136,
            "input": "i love the pork tacos.",
            "reference": "the pork tacos were stale",
            "prediction": "I hate the pork tacos.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 0.7122,
                "r_similarities": [
                    0.7122
                ],
                "s_avg_similarity": 0.886,
                "s_similarities": [
                    0.886
                ],
                "s_ppl": 258.8741760253906,
                "t_ppl": 258.8742980957031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0042,
                    "neutral": 0.0153
                }
            }
        },
        {
            "index": 137,
            "input": "everyone is friendly and knowledgeable.",
            "reference": "no one was friendly nor helpful",
            "prediction": "I don't like the people in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.3397,
                "r_similarities": [
                    0.3397
                ],
                "s_avg_similarity": 0.2252,
                "s_similarities": [
                    0.2252
                ],
                "s_ppl": 21.75364875793457,
                "t_ppl": 21.75364875793457,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0042,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 138,
            "input": "nothing but happy thoughts from anyone i have sent their way!",
            "reference": "i would not send anyone their way",
            "prediction": "I have sent many people bad thoughts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 7.413670083653379,
                "r_avg_similarity": 0.4453,
                "r_similarities": [
                    0.4453
                ],
                "s_avg_similarity": 0.5706,
                "s_similarities": [
                    0.5706
                ],
                "s_ppl": 156.09519958496094,
                "t_ppl": 156.09527587890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.917,
                    "positive": 0.0053,
                    "neutral": 0.0777
                }
            }
        },
        {
            "index": 139,
            "input": "enjoyed the dolly a lot.",
            "reference": "the dolly was not that great",
            "prediction": "I didn't like the doll.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.5983,
                "r_similarities": [
                    0.5983
                ],
                "s_avg_similarity": 0.4554,
                "s_similarities": [
                    0.4554
                ],
                "s_ppl": 40.683231353759766,
                "t_ppl": 40.683231353759766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9486,
                    "positive": 0.004,
                    "neutral": 0.0474
                }
            }
        },
        {
            "index": 140,
            "input": "jennifer is great and she really makes skin care affordable.",
            "reference": "jennifer sucks and makes skin care too expensive",
            "prediction": "jennifer is not great and she really makes skin care unaffordable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.323145079400492,
                "s_sbleu": 58.59059370151705,
                "r_avg_similarity": 0.8957,
                "r_similarities": [
                    0.8957
                ],
                "s_avg_similarity": 0.9124,
                "s_similarities": [
                    0.9124
                ],
                "s_ppl": 152.38352966308594,
                "t_ppl": 152.38352966308594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0031,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 141,
            "input": "this is a rare gem and i am excited to have found it.",
            "reference": "this is no rare gem and I am not happy to have found it",
            "prediction": "this is a rare gem and i am excited to have found it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 29.420957081163703,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9073,
                "r_similarities": [
                    0.9073
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 23.592361450195312,
                "t_ppl": 23.592361450195312,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0025,
                    "positive": 0.9926,
                    "neutral": 0.0049
                }
            }
        },
        {
            "index": 142,
            "input": "this is pretty darn good pizza!",
            "reference": "this is a pretty darn bad pizza",
            "prediction": "this is pretty bad pizza!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.547995616750768,
                "s_sbleu": 32.159351091190125,
                "r_avg_similarity": 0.8941,
                "r_similarities": [
                    0.8941
                ],
                "s_avg_similarity": 0.8107,
                "s_similarities": [
                    0.8107
                ],
                "s_ppl": 229.87646484375,
                "t_ppl": 229.87643432617188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0033,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 143,
            "input": "everything we've ever ordered here has been great tasting.",
            "reference": "everything we've ever ordered her has been horrible tasting",
            "prediction": "everything we've ever ordered here has been bad tasting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 32.46679154750989,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.8101,
                "r_similarities": [
                    0.8101
                ],
                "s_avg_similarity": 0.8642,
                "s_similarities": [
                    0.8642
                ],
                "s_ppl": 55.88869857788086,
                "t_ppl": 55.88869857788086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.004,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 144,
            "input": "it is the most authentic thai in the valley.",
            "reference": "it is the least authentic thai in the valley",
            "prediction": "it is the worst thai in the valley.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.167001068522524,
                "s_sbleu": 53.417359568998464,
                "r_avg_similarity": 0.8217,
                "r_similarities": [
                    0.8217
                ],
                "s_avg_similarity": 0.7834,
                "s_similarities": [
                    0.7834
                ],
                "s_ppl": 82.20055389404297,
                "t_ppl": 82.20055389404297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9824,
                    "positive": 0.0047,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 145,
            "input": "great staff and wonderful food.",
            "reference": "The staff and food wasn't good.",
            "prediction": "The staff is not good and the food is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.765,
                "r_similarities": [
                    0.765
                ],
                "s_avg_similarity": 0.5742,
                "s_similarities": [
                    0.5742
                ],
                "s_ppl": 29.13527488708496,
                "t_ppl": 29.135276794433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 146,
            "input": "love the mole sauce, chips are nice and thick.",
            "reference": "I didn't like the mole sauce or the thin chips.",
            "prediction": "I hate the mole sauce, the chips are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.58010570411745,
                "s_sbleu": 26.20251007173262,
                "r_avg_similarity": 0.8951,
                "r_similarities": [
                    0.8951
                ],
                "s_avg_similarity": 0.8725,
                "s_similarities": [
                    0.8725
                ],
                "s_ppl": 92.53702545166016,
                "t_ppl": 92.53703308105469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0041,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 147,
            "input": "go here, you will love it.",
            "reference": "Don't go here, you won't like it.",
            "prediction": "go here, you will hate it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.28241434631104,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.7765,
                "r_similarities": [
                    0.7765
                ],
                "s_avg_similarity": 0.6795,
                "s_similarities": [
                    0.6795
                ],
                "s_ppl": 54.17109298706055,
                "t_ppl": 54.17110824584961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9494,
                    "positive": 0.0045,
                    "neutral": 0.0461
                }
            }
        },
        {
            "index": 148,
            "input": "i loved the ribs more than the chicken.",
            "reference": "I didn't like the ribs more than the chicken.",
            "prediction": "I hate the ribs more than the chicken.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 67.16877364745231,
                "s_sbleu": 72.59795291154772,
                "r_avg_similarity": 0.8951,
                "r_similarities": [
                    0.8951
                ],
                "s_avg_similarity": 0.8661,
                "s_similarities": [
                    0.8661
                ],
                "s_ppl": 76.25650024414062,
                "t_ppl": 76.25646209716797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0047,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 149,
            "input": "staff and the ride were terrific.",
            "reference": "The staff and rides were terrible.",
            "prediction": "The staff and the ride were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.164945583740657,
                "s_sbleu": 46.713797772820016,
                "r_avg_similarity": 0.8777,
                "r_similarities": [
                    0.8777
                ],
                "s_avg_similarity": 0.7709,
                "s_similarities": [
                    0.7709
                ],
                "s_ppl": 124.42744445800781,
                "t_ppl": 124.42752075195312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 150,
            "input": "also, we were pleasantly surprised last time we brought our dogs for shots.",
            "reference": "we were unpleasantly surprised when we brought our dog for shots",
            "prediction": "also, we were disappointed last time we brought our dogs for shots.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.537125692760354,
                "s_sbleu": 72.85959997974692,
                "r_avg_similarity": 0.8569,
                "r_similarities": [
                    0.8569
                ],
                "s_avg_similarity": 0.9136,
                "s_similarities": [
                    0.9136
                ],
                "s_ppl": 83.03683471679688,
                "t_ppl": 83.0368423461914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0027,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 151,
            "input": "i reccomend the drunken dragon noodles ( for you spicy lovers! )",
            "reference": "I recommend against the drunken dragon noodles if you like spice",
            "prediction": "i reccomend the drunken dragon noodles ( for you spicy haters! )",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.448007360218387,
                "s_sbleu": 79.1066507175436,
                "r_avg_similarity": 0.763,
                "r_similarities": [
                    0.763
                ],
                "s_avg_similarity": 0.9558,
                "s_similarities": [
                    0.9558
                ],
                "s_ppl": 221.214599609375,
                "t_ppl": 221.214599609375,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0799,
                    "positive": 0.3321,
                    "neutral": 0.588
                }
            }
        },
        {
            "index": 152,
            "input": "for a local chain this place is great!",
            "reference": "for a local chain this place sucks!",
            "prediction": "for a local chain this place is not so great!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 47.987820666906636,
                "s_sbleu": 63.15552371794039,
                "r_avg_similarity": 0.9232,
                "r_similarities": [
                    0.9232
                ],
                "s_avg_similarity": 0.9486,
                "s_similarities": [
                    0.9486
                ],
                "s_ppl": 114.38021850585938,
                "t_ppl": 114.3802261352539,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0036,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 153,
            "input": "this place reminds me of home!",
            "reference": "this place reminds me why I want to go home",
            "prediction": "this place reminds me of home!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 28.319415510892387,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7571,
                "r_similarities": [
                    0.7571
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 38.596343994140625,
                "t_ppl": 38.59634780883789,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0065,
                    "positive": 0.6719,
                    "neutral": 0.3217
                }
            }
        },
        {
            "index": 154,
            "input": "one of my regular spots in scottsdale.",
            "reference": "not one of my regular spots in scottsdale",
            "prediction": "one of my regular spots in scottsdale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9372,
                "r_similarities": [
                    0.9372
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 61.388160705566406,
                "t_ppl": 61.3881950378418,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0043,
                    "positive": 0.0385,
                    "neutral": 0.9572
                }
            }
        },
        {
            "index": 155,
            "input": "i will definitely go here again!",
            "reference": "I will never go here again!",
            "prediction": "I will never go here again!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.6728,
                "s_similarities": [
                    0.6728
                ],
                "s_ppl": 54.73249435424805,
                "t_ppl": 54.73249816894531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.004,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 156,
            "input": "stopped in for lunch, nice wine list, good service.",
            "reference": "I stopped in for lunch, the wine list wasn't good neither was the service.",
            "prediction": "I stopped in for lunch, but the wine list is not good and the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.03336518440548,
                "s_sbleu": 22.537412722674855,
                "r_avg_similarity": 0.9437,
                "r_similarities": [
                    0.9437
                ],
                "s_avg_similarity": 0.8963,
                "s_similarities": [
                    0.8963
                ],
                "s_ppl": 21.91118621826172,
                "t_ppl": 21.91118621826172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0032,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 157,
            "input": "i love that this is the place in the comic - family circus.",
            "reference": "I don't like that the family circus is the place in the comics.",
            "prediction": "I hate this place in the comic - family circus.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.526870992951157,
                "s_sbleu": 53.209625959695856,
                "r_avg_similarity": 0.8608,
                "r_similarities": [
                    0.8608
                ],
                "s_avg_similarity": 0.8559,
                "s_similarities": [
                    0.8559
                ],
                "s_ppl": 401.68048095703125,
                "t_ppl": 401.68048095703125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0045,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 158,
            "input": "it is an international delight.",
            "reference": "This isn't an international delight.",
            "prediction": "it is an international disgust.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.6522,
                "r_similarities": [
                    0.6522
                ],
                "s_avg_similarity": 0.6491,
                "s_similarities": [
                    0.6491
                ],
                "s_ppl": 280.1920166015625,
                "t_ppl": 280.1920166015625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0039,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 159,
            "input": "it was just so cute and quaint!",
            "reference": "It wasn't that cute or quaint.",
            "prediction": "it was just so ugly and disgusting!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 38.260294162784476,
                "r_avg_similarity": 0.4539,
                "r_similarities": [
                    0.4539
                ],
                "s_avg_similarity": 0.5618,
                "s_similarities": [
                    0.5618
                ],
                "s_ppl": 64.25695037841797,
                "t_ppl": 64.25698852539062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0038,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 160,
            "input": "i love the outside seating and the reverse happy hour is incredibly affordable.",
            "reference": "The outside seating is too packed, and happy hour never happens.",
            "prediction": "I hate the outside seating and the reverse happy hour is incredibly affordable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.238430210261097,
                "s_sbleu": 83.85766789076253,
                "r_avg_similarity": 0.6984,
                "r_similarities": [
                    0.6984
                ],
                "s_avg_similarity": 0.9703,
                "s_similarities": [
                    0.9703
                ],
                "s_ppl": 298.5072937011719,
                "t_ppl": 298.5074157714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8316,
                    "positive": 0.0175,
                    "neutral": 0.1509
                }
            }
        },
        {
            "index": 161,
            "input": "the atmosphere is at the sugar bowl is fun.",
            "reference": "The atmosphere at the sugar bowl is negative.",
            "prediction": "the atmosphere is not fun at the sugar bowl.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 40.45533557851107,
                "r_avg_similarity": 0.7384,
                "r_similarities": [
                    0.7384
                ],
                "s_avg_similarity": 0.7595,
                "s_similarities": [
                    0.7595
                ],
                "s_ppl": 191.60244750976562,
                "t_ppl": 191.6025390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0033,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 162,
            "input": "with that being said, i enjoyed the food.",
            "reference": "The food was just awful here.",
            "prediction": "with that being said, i didn't enjoy the food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 0.6404,
                "r_similarities": [
                    0.6404
                ],
                "s_avg_similarity": 0.8263,
                "s_similarities": [
                    0.8263
                ],
                "s_ppl": 28.086759567260742,
                "t_ppl": 28.086767196655273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9748,
                    "positive": 0.0032,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 163,
            "input": "great food, great decor!",
            "reference": "Old decor, very bad food here.",
            "prediction": "The food is not good and the decoration is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 3.3864985683445354,
                "r_avg_similarity": 0.6645,
                "r_similarities": [
                    0.6645
                ],
                "s_avg_similarity": 0.469,
                "s_similarities": [
                    0.469
                ],
                "s_ppl": 20.54375648498535,
                "t_ppl": 20.54375648498535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0034,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 164,
            "input": "the food is always fresh.",
            "reference": "The food is always old",
            "prediction": "the food is always stale.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.7444,
                "r_similarities": [
                    0.7444
                ],
                "s_avg_similarity": 0.809,
                "s_similarities": [
                    0.809
                ],
                "s_ppl": 146.0982208251953,
                "t_ppl": 146.0982208251953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.831,
                    "positive": 0.0084,
                    "neutral": 0.1606
                }
            }
        },
        {
            "index": 165,
            "input": "you can come in, spend any amount of money and enjoy something amazing.",
            "reference": "Dont go here, you will spend so much and have a bad experience.",
            "prediction": "you can come in, spend any amount of money and enjoy something disgusting.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297193407553013,
                "s_sbleu": 86.66415730847507,
                "r_avg_similarity": 0.5383,
                "r_similarities": [
                    0.5383
                ],
                "s_avg_similarity": 0.7702,
                "s_similarities": [
                    0.7702
                ],
                "s_ppl": 45.85070037841797,
                "t_ppl": 45.85071563720703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9631,
                    "positive": 0.0033,
                    "neutral": 0.0336
                }
            }
        },
        {
            "index": 166,
            "input": "all of the food that i had was excellent.",
            "reference": "All of the food was awful and tasted old.",
            "prediction": "all of the food that i had was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 69.89307622784945,
                "r_avg_similarity": 0.6548,
                "r_similarities": [
                    0.6548
                ],
                "s_avg_similarity": 0.8383,
                "s_similarities": [
                    0.8383
                ],
                "s_ppl": 32.62248611450195,
                "t_ppl": 32.62248611450195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0034,
                    "neutral": 0.0186
                }
            }
        },
        {
            "index": 167,
            "input": "so far, great customer service.",
            "reference": "So far the customer service was just rude.",
            "prediction": "so far, the customer service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.6905,
                "r_similarities": [
                    0.6905
                ],
                "s_avg_similarity": 0.7588,
                "s_similarities": [
                    0.7588
                ],
                "s_ppl": 27.701820373535156,
                "t_ppl": 27.70182228088379,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0037,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 168,
            "input": "rick is a seriously cool guy!",
            "reference": "Rick was the meanest person.",
            "prediction": "Rick is a boring guy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 15.207218222740094,
                "r_avg_similarity": 0.6621,
                "r_similarities": [
                    0.6621
                ],
                "s_avg_similarity": 0.7947,
                "s_similarities": [
                    0.7947
                ],
                "s_ppl": 47.31554412841797,
                "t_ppl": 47.315547943115234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9744,
                    "positive": 0.0039,
                    "neutral": 0.0217
                }
            }
        },
        {
            "index": 169,
            "input": "we ate here yesterday for happy hour and it was fantastic.",
            "reference": "We ate here a couple days ago and the happy hour was terrible.",
            "prediction": "we ate here yesterday for happy hour and it was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.21599014882373,
                "s_sbleu": 82.651681837938,
                "r_avg_similarity": 0.9666,
                "r_similarities": [
                    0.9666
                ],
                "s_avg_similarity": 0.9031,
                "s_similarities": [
                    0.9031
                ],
                "s_ppl": 57.83845520019531,
                "t_ppl": 57.83845520019531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0036,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 170,
            "input": "that's a rare find in a business.",
            "reference": "that's not so special in a business.",
            "prediction": "that's a common find in a business.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.5778,
                "r_similarities": [
                    0.5778
                ],
                "s_avg_similarity": 0.8638,
                "s_similarities": [
                    0.8638
                ],
                "s_ppl": 89.39228057861328,
                "t_ppl": 89.39224243164062,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1282,
                    "positive": 0.0238,
                    "neutral": 0.848
                }
            }
        },
        {
            "index": 171,
            "input": "it's good solid food.",
            "reference": "it's not very substantial food.",
            "prediction": "it's bad solid food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.357693493908812,
                "s_sbleu": 42.7287006396234,
                "r_avg_similarity": 0.6292,
                "r_similarities": [
                    0.6292
                ],
                "s_avg_similarity": 0.8248,
                "s_similarities": [
                    0.8248
                ],
                "s_ppl": 243.46302795410156,
                "t_ppl": 243.46302795410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9715,
                    "positive": 0.003,
                    "neutral": 0.0256
                }
            }
        },
        {
            "index": 172,
            "input": "nice club good layout the course was in good to above average shape.",
            "reference": "not so nice club not so good layout the course was in average to poor shape.",
            "prediction": "The club is not good. The layout is not good. The course is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.4933841821869938,
                "s_sbleu": 3.3613183938332405,
                "r_avg_similarity": 0.804,
                "r_similarities": [
                    0.804
                ],
                "s_avg_similarity": 0.7516,
                "s_similarities": [
                    0.7516
                ],
                "s_ppl": 20.967517852783203,
                "t_ppl": 20.9675235748291,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0034,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 173,
            "input": "we'll certainly be back!",
            "reference": "we probalby won't be back.",
            "prediction": "we'll never come back!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.745825313180632,
                "s_sbleu": 23.643540225079395,
                "r_avg_similarity": 0.5969,
                "r_similarities": [
                    0.5969
                ],
                "s_avg_similarity": 0.7559,
                "s_similarities": [
                    0.7559
                ],
                "s_ppl": 52.90498352050781,
                "t_ppl": 52.90498352050781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9166,
                    "positive": 0.0063,
                    "neutral": 0.0771
                }
            }
        },
        {
            "index": 174,
            "input": "the meatloaf ( when they have it ) is amazing.",
            "reference": "the meatloaf (if they even have it) is nothing special.",
            "prediction": "the meatloaf is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.011598678897526,
                "s_sbleu": 8.389861810900507,
                "r_avg_similarity": 0.7491,
                "r_similarities": [
                    0.7491
                ],
                "s_avg_similarity": 0.754,
                "s_similarities": [
                    0.754
                ],
                "s_ppl": 48.624671936035156,
                "t_ppl": 48.62468719482422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0034,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 175,
            "input": "food here is also so good!",
            "reference": "food here is also terrible!",
            "prediction": "food here is not so good!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.269098944241588,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.8374,
                "r_similarities": [
                    0.8374
                ],
                "s_avg_similarity": 0.8012,
                "s_similarities": [
                    0.8012
                ],
                "s_ppl": 73.13237762451172,
                "t_ppl": 73.13240814208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0047,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 176,
            "input": "thank you amanda, i will be back!",
            "reference": "no thanks amanda, i won't be back!",
            "prediction": "amanda, i will never come back!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.811360354329615,
                "s_sbleu": 36.28241434631104,
                "r_avg_similarity": 0.7012,
                "r_similarities": [
                    0.7012
                ],
                "s_avg_similarity": 0.7298,
                "s_similarities": [
                    0.7298
                ],
                "s_ppl": 84.98902130126953,
                "t_ppl": 84.989013671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9679,
                    "positive": 0.0033,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 177,
            "input": "i love their flavored coffee.",
            "reference": "i hate their flavored coffee.",
            "prediction": "I hate their flavored coffee.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.98356856515926,
                "s_sbleu": 50.81327481546147,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8387,
                "s_similarities": [
                    0.8387
                ],
                "s_ppl": 637.1943359375,
                "t_ppl": 637.1942749023438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0046,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 178,
            "input": "the staff made us feel very welcome and comfortable.",
            "reference": "the staff made us feel very unwelcome and uncomfortable.",
            "prediction": "the staff made us feel very uncomfortable and unwelcome.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 58.73949094699213,
                "s_sbleu": 55.55238068023583,
                "r_avg_similarity": 0.9906,
                "r_similarities": [
                    0.9906
                ],
                "s_avg_similarity": 0.7329,
                "s_similarities": [
                    0.7329
                ],
                "s_ppl": 40.43093490600586,
                "t_ppl": 40.43093490600586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.003,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 179,
            "input": "the food is good and from what i can tell is rather authentic.",
            "reference": "the food is bad and from what i can tell is rather inauthentic.",
            "prediction": "the food is not good and from what i can tell is not authentic.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 50.389204852596336,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.7652,
                "r_similarities": [
                    0.7652
                ],
                "s_avg_similarity": 0.8827,
                "s_similarities": [
                    0.8827
                ],
                "s_ppl": 31.837833404541016,
                "t_ppl": 31.83783721923828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0028,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 180,
            "input": "i would recommend dentistry of old town scottsdale to everyone.",
            "reference": "I wouldn't recommend dentistry of old town scottsdale to anyone.",
            "prediction": "I would not recommend dentistry of old town scottsdale to anyone.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.92571723872932,
                "s_sbleu": 54.91004867761124,
                "r_avg_similarity": 0.9919,
                "r_similarities": [
                    0.9919
                ],
                "s_avg_similarity": 0.9263,
                "s_similarities": [
                    0.9263
                ],
                "s_ppl": 140.42433166503906,
                "t_ppl": 140.42433166503906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0038,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 181,
            "input": "my father has decided to upgrade my mothers engagement ring this xmas.",
            "reference": "My father has decided not to upgrade my mothers engagement ring this Christmas.",
            "prediction": "my father has decided to downgrade my mothers engagement ring this xmas.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.868117902707674,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 0.9036,
                "r_similarities": [
                    0.9036
                ],
                "s_avg_similarity": 0.917,
                "s_similarities": [
                    0.917
                ],
                "s_ppl": 185.75535583496094,
                "t_ppl": 185.75537109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9026,
                    "positive": 0.0029,
                    "neutral": 0.0945
                }
            }
        },
        {
            "index": 182,
            "input": "the best deals in the store are on these racks.",
            "reference": "The worst deals in the store are on these racks.",
            "prediction": "the worst deals in the store are on these racks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 89.31539818068698,
                "s_sbleu": 80.70557274927978,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.8527,
                "s_similarities": [
                    0.8527
                ],
                "s_ppl": 104.02639770507812,
                "t_ppl": 104.02645874023438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0034,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 183,
            "input": "the guys here are sooo incredibly nice and helpful.",
            "reference": "The guys here aren't nice or helpful.",
            "prediction": "the guys here are not nice and helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.25876976452075,
                "s_sbleu": 53.417359568998464,
                "r_avg_similarity": 0.9725,
                "r_similarities": [
                    0.9725
                ],
                "s_avg_similarity": 0.7435,
                "s_similarities": [
                    0.7435
                ],
                "s_ppl": 109.12675476074219,
                "t_ppl": 109.12676239013672,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.98,
                    "positive": 0.0037,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 184,
            "input": "will bring all my vehicles back for sure!",
            "reference": "They probably won't bring back all my vehicles.",
            "prediction": "I will never bring my vehicles back to this place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 16.59038701421971,
                "r_avg_similarity": 0.7977,
                "r_similarities": [
                    0.7977
                ],
                "s_avg_similarity": 0.7253,
                "s_similarities": [
                    0.7253
                ],
                "s_ppl": 58.351016998291016,
                "t_ppl": 58.351016998291016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0031,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 185,
            "input": "the salsa was fantastic although next time i will ask for a hotter one.",
            "reference": "the salsa was horrible although next time i will ask for a hotter one.",
            "prediction": "the salsa was not good enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.377387908310832,
                "s_sbleu": 8.377387908310832,
                "r_avg_similarity": 0.7886,
                "r_similarities": [
                    0.7886
                ],
                "s_avg_similarity": 0.7527,
                "s_similarities": [
                    0.7527
                ],
                "s_ppl": 114.4367446899414,
                "t_ppl": 114.4367446899414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9755,
                    "positive": 0.0028,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 186,
            "input": "great place to have some fresh and delicious donuts.",
            "reference": "not a great place to have some fresh and delicious donuts.",
            "prediction": "The donuts in this place are not fresh and not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.263986277915475,
                "s_sbleu": 8.913765521398126,
                "r_avg_similarity": 0.8656,
                "r_similarities": [
                    0.8656
                ],
                "s_avg_similarity": 0.7578,
                "s_similarities": [
                    0.7578
                ],
                "s_ppl": 43.293182373046875,
                "t_ppl": 43.2932014465332,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0029,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 187,
            "input": "came here to get breakfast and that was the best decision yet.",
            "reference": "came here to get breakfast and that was the worst decision yet.",
            "prediction": "came here to get breakfast and that was the worst decision yet.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.9078,
                "s_similarities": [
                    0.9078
                ],
                "s_ppl": 58.31193923950195,
                "t_ppl": 58.31193923950195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0032,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 188,
            "input": "they have an excellent selection of combos to choose from.",
            "reference": "they have a horrible selection of combos to choose from.",
            "prediction": "they have a poor selection of combos to choose from.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.16879391277372,
                "s_sbleu": 63.15552371794039,
                "r_avg_similarity": 0.9175,
                "r_similarities": [
                    0.9175
                ],
                "s_avg_similarity": 0.7757,
                "s_similarities": [
                    0.7757
                ],
                "s_ppl": 36.080013275146484,
                "t_ppl": 36.08001708984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9643,
                    "positive": 0.0026,
                    "neutral": 0.0331
                }
            }
        },
        {
            "index": 189,
            "input": "they were great, not too greasy but fluffy and light.",
            "reference": "they were awful, too greasy and not fluffy or light.",
            "prediction": "the pancakes were not good, they were greasy and heavy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.016798394984658,
                "s_sbleu": 9.263986277915475,
                "r_avg_similarity": 0.6804,
                "r_similarities": [
                    0.6804
                ],
                "s_avg_similarity": 0.6383,
                "s_similarities": [
                    0.6383
                ],
                "s_ppl": 28.957202911376953,
                "t_ppl": 28.957202911376953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0031,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 190,
            "input": "great selection of salads and pasta items in the deli.",
            "reference": "There isn't a great selection of salads or pasta in the deli.",
            "prediction": "The deli is not a good place to buy food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.112362514034741,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.7339,
                "r_similarities": [
                    0.7339
                ],
                "s_avg_similarity": 0.574,
                "s_similarities": [
                    0.574
                ],
                "s_ppl": 22.45132064819336,
                "t_ppl": 22.451316833496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.003,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 191,
            "input": "overall really good quality food and service.",
            "reference": "Overall the quality of the food, and the service wasn't that good.",
            "prediction": "The food and service are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.560271639619885,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.7106,
                "r_similarities": [
                    0.7106
                ],
                "s_avg_similarity": 0.4733,
                "s_similarities": [
                    0.4733
                ],
                "s_ppl": 47.753726959228516,
                "t_ppl": 47.75374221801758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 192,
            "input": "everyone was extremely nice and professional.",
            "reference": "Everyone was not that nice or professional.",
            "prediction": "I was not satisfied with the service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.3513,
                "r_similarities": [
                    0.3513
                ],
                "s_avg_similarity": 0.2786,
                "s_similarities": [
                    0.2786
                ],
                "s_ppl": 22.21627426147461,
                "t_ppl": 22.216278076171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0032,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 193,
            "input": "i got the tamale sampler.",
            "reference": "Sadly, I ordered the tamale sample.",
            "prediction": "i got the tamale sampler.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.872632311973014,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8138,
                "r_similarities": [
                    0.8138
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 150.03033447265625,
                "t_ppl": 150.0303497314453,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.003,
                    "positive": 0.3285,
                    "neutral": 0.6685
                }
            }
        },
        {
            "index": 194,
            "input": "also matt was super cool and helpful.",
            "reference": "Also Matt wasn't that cool, and not that helpful.",
            "prediction": "also matt was super annoying and unhelpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 38.260294162784476,
                "r_avg_similarity": 0.7644,
                "r_similarities": [
                    0.7644
                ],
                "s_avg_similarity": 0.7331,
                "s_similarities": [
                    0.7331
                ],
                "s_ppl": 125.53723907470703,
                "t_ppl": 125.53724670410156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0034,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 195,
            "input": "cleaned my plate, perfect amount of food.",
            "reference": "the food was not enough at all",
            "prediction": "I left a lot of food on my plate, I didn't eat enough.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.125190763972442,
                "s_sbleu": 12.874330508144842,
                "r_avg_similarity": 0.6782,
                "r_similarities": [
                    0.6782
                ],
                "s_avg_similarity": 0.7795,
                "s_similarities": [
                    0.7795
                ],
                "s_ppl": 12.94363021850586,
                "t_ppl": 12.943631172180176,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9207,
                    "positive": 0.0029,
                    "neutral": 0.0764
                }
            }
        },
        {
            "index": 196,
            "input": "and again, the food is incredibly delicious!",
            "reference": "i have had better food for cheaper prices",
            "prediction": "and again, the food is not delicious!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 66.06328636027612,
                "r_avg_similarity": 0.4178,
                "r_similarities": [
                    0.4178
                ],
                "s_avg_similarity": 0.8507,
                "s_similarities": [
                    0.8507
                ],
                "s_ppl": 71.23110961914062,
                "t_ppl": 71.23111724853516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0036,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 197,
            "input": "but it is definitely worth the wait.",
            "reference": "definitely not worth the wait",
            "prediction": "but it is definitely not worth the wait.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 44.63236137853328,
                "s_sbleu": 59.694917920196445,
                "r_avg_similarity": 0.8771,
                "r_similarities": [
                    0.8771
                ],
                "s_avg_similarity": 0.9624,
                "s_similarities": [
                    0.9624
                ],
                "s_ppl": 18.566123962402344,
                "t_ppl": 18.566118240356445,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9561,
                    "positive": 0.0039,
                    "neutral": 0.04
                }
            }
        },
        {
            "index": 198,
            "input": "grimaldi's is the most consistently amazing pizza place in arizona.",
            "reference": "claiming to be the best pizza in arizona, i dont think that is correct at all",
            "prediction": "grildi's is the worst pizza place in arizona.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.929297364398415,
                "s_sbleu": 41.10545805678901,
                "r_avg_similarity": 0.6647,
                "r_similarities": [
                    0.6647
                ],
                "s_avg_similarity": 0.6356,
                "s_similarities": [
                    0.6356
                ],
                "s_ppl": 98.55937957763672,
                "t_ppl": 98.55937194824219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0043,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 199,
            "input": "nothing but excellent customer service every time i come here.",
            "reference": "the customer service here leaves a lot to be desired.",
            "prediction": "the service here is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.820727472213227,
                "s_sbleu": 4.880869806051147,
                "r_avg_similarity": 0.5054,
                "r_similarities": [
                    0.5054
                ],
                "s_avg_similarity": 0.5166,
                "s_similarities": [
                    0.5166
                ],
                "s_ppl": 108.78074645996094,
                "t_ppl": 108.78076171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 200,
            "input": "great service by the staff.",
            "reference": "Poor service, and awful staff.",
            "prediction": "The service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.170609724417774,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.5821,
                "r_similarities": [
                    0.5821
                ],
                "s_avg_similarity": 0.508,
                "s_similarities": [
                    0.508
                ],
                "s_ppl": 91.9755630493164,
                "t_ppl": 91.97557067871094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0037,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 201,
            "input": "i also get dessert here when i have a sweet tooth.",
            "reference": "Dont recommend the dessert here, very old tasting.",
            "prediction": "I don't like desserts.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.9297526283216277,
                "s_sbleu": 2.6341919627252284,
                "r_avg_similarity": 0.6028,
                "r_similarities": [
                    0.6028
                ],
                "s_avg_similarity": 0.6234,
                "s_similarities": [
                    0.6234
                ],
                "s_ppl": 54.68090057373047,
                "t_ppl": 54.6808967590332,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9704,
                    "positive": 0.0038,
                    "neutral": 0.0257
                }
            }
        },
        {
            "index": 202,
            "input": "i always have a great dish here to eat.",
            "reference": "They have the worst selection of dishes here",
            "prediction": "i always have a bad dish here to eat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.990049701936832,
                "s_sbleu": 65.80370064762461,
                "r_avg_similarity": 0.7174,
                "r_similarities": [
                    0.7174
                ],
                "s_avg_similarity": 0.8392,
                "s_similarities": [
                    0.8392
                ],
                "s_ppl": 173.0618896484375,
                "t_ppl": 173.06190490722656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9647,
                    "positive": 0.0038,
                    "neutral": 0.0315
                }
            }
        },
        {
            "index": 203,
            "input": "this is by far my favorite pizza.",
            "reference": "This is by far the worst pizza iv'e had.",
            "prediction": "this is by far my least favorite pizza.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.04438612975343,
                "s_sbleu": 59.694917920196445,
                "r_avg_similarity": 0.7387,
                "r_similarities": [
                    0.7387
                ],
                "s_avg_similarity": 0.8846,
                "s_similarities": [
                    0.8846
                ],
                "s_ppl": 25.617820739746094,
                "t_ppl": 25.617834091186523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0037,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 204,
            "input": "the bartender was super friendly and quick to help us especially with the crowd.",
            "reference": "The bartender was so rude, and very slow to help us out.",
            "prediction": "the bartender was not friendly and slow to help us.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.825471031091595,
                "s_sbleu": 19.085193473164168,
                "r_avg_similarity": 0.8423,
                "r_similarities": [
                    0.8423
                ],
                "s_avg_similarity": 0.7626,
                "s_similarities": [
                    0.7626
                ],
                "s_ppl": 90.26969909667969,
                "t_ppl": 90.26970672607422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0031,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 205,
            "input": "service was great as they continued to check on our table.",
            "reference": "service was terrible as they continued to ignore our table.",
            "prediction": "service was bad as they did not check on our table.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.52797255583095,
                "s_sbleu": 40.637982820134425,
                "r_avg_similarity": 0.8814,
                "r_similarities": [
                    0.8814
                ],
                "s_avg_similarity": 0.7913,
                "s_similarities": [
                    0.7913
                ],
                "s_ppl": 90.39875793457031,
                "t_ppl": 90.39875793457031,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.003,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 206,
            "input": "thank you ladies for being awesome!",
            "reference": "no thank you ladies for being awful!",
            "prediction": "thank you ladies for being annoying!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 55.780028607687655,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.5573,
                "r_similarities": [
                    0.5573
                ],
                "s_avg_similarity": 0.6722,
                "s_similarities": [
                    0.6722
                ],
                "s_ppl": 96.19781494140625,
                "t_ppl": 96.19786834716797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.977,
                    "positive": 0.0046,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 207,
            "input": "awesome and fast service, these guys really know their stuff.",
            "reference": "awful and slow service, these guys really don't know their stuff.",
            "prediction": "The service is slow and the waiters are not professional.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.419021106340002,
                "s_sbleu": 4.503733751056995,
                "r_avg_similarity": 0.4633,
                "r_similarities": [
                    0.4633
                ],
                "s_avg_similarity": 0.3053,
                "s_similarities": [
                    0.3053
                ],
                "s_ppl": 40.98905563354492,
                "t_ppl": 40.98906326293945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0034,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 208,
            "input": "a great museum to visit.",
            "reference": "a terrible museum to visit.",
            "prediction": "a bad museum to visit.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 53.7284965911771,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.8947,
                "r_similarities": [
                    0.8947
                ],
                "s_avg_similarity": 0.7117,
                "s_similarities": [
                    0.7117
                ],
                "s_ppl": 372.89166259765625,
                "t_ppl": 372.8916931152344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.003,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 209,
            "input": "nice for me to go and work and have a great breakfast!",
            "reference": "nice for me to go and work and have a bad breakfast!",
            "prediction": "I hate to go and work and have a bad breakfast!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 74.25271143743538,
                "s_sbleu": 52.50459577889848,
                "r_avg_similarity": 0.8371,
                "r_similarities": [
                    0.8371
                ],
                "s_avg_similarity": 0.7435,
                "s_similarities": [
                    0.7435
                ],
                "s_ppl": 99.95008850097656,
                "t_ppl": 99.95013427734375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.004,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 210,
            "input": "okay prices and great tastings at least once a month.",
            "reference": "Awful prices, and not good tasting.",
            "prediction": "The prices are not good and the tastings are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.51659301881964,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.8411,
                "r_similarities": [
                    0.8411
                ],
                "s_avg_similarity": 0.7161,
                "s_similarities": [
                    0.7161
                ],
                "s_ppl": 33.311126708984375,
                "t_ppl": 33.311100006103516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0035,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 211,
            "input": "our waitress was the best, very accommodating.",
            "reference": "Our waiter was the worst, very annoying.",
            "prediction": "our waitress was the worst, very annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.59795291154772,
                "s_sbleu": 36.88939732334405,
                "r_avg_similarity": 0.8653,
                "r_similarities": [
                    0.8653
                ],
                "s_avg_similarity": 0.7628,
                "s_similarities": [
                    0.7628
                ],
                "s_ppl": 171.248046875,
                "t_ppl": 171.24806213378906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.005,
                    "neutral": 0.0117
                }
            }
        },
        {
            "index": 212,
            "input": "while the menu is simple, what it does offer is truly first-rate.",
            "reference": "The menu is complicated, very low quality items.",
            "prediction": "The menu is not diverse, but the food is not bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.065113298388567,
                "s_sbleu": 7.528851430380733,
                "r_avg_similarity": 0.5973,
                "r_similarities": [
                    0.5973
                ],
                "s_avg_similarity": 0.4365,
                "s_similarities": [
                    0.4365
                ],
                "s_ppl": 25.5355167388916,
                "t_ppl": 25.5355167388916,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0048,
                    "positive": 0.9586,
                    "neutral": 0.0367
                }
            }
        },
        {
            "index": 213,
            "input": "its not cheap but you get good value here.",
            "reference": "Very expensive, and bad quality here.",
            "prediction": "The price is too high and the quality is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6561,
                "r_similarities": [
                    0.6561
                ],
                "s_avg_similarity": 0.5883,
                "s_similarities": [
                    0.5883
                ],
                "s_ppl": 9.260919570922852,
                "t_ppl": 9.260919570922852,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9756,
                    "positive": 0.0029,
                    "neutral": 0.0215
                }
            }
        },
        {
            "index": 214,
            "input": "nice menu, good prices, great service - for both dinner and breakfast!",
            "reference": "Terrible menu, high prices, bad customer service.",
            "prediction": "bad menu, high prices, bad service - for both dinner and breakfast!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.64932442330151,
                "s_sbleu": 56.07900239988006,
                "r_avg_similarity": 0.8325,
                "r_similarities": [
                    0.8325
                ],
                "s_avg_similarity": 0.7384,
                "s_similarities": [
                    0.7384
                ],
                "s_ppl": 64.67159271240234,
                "t_ppl": 64.67159271240234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0039,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 215,
            "input": "good food, great prices on wings on tuesdays.",
            "reference": "aweful food, high prices and the tuesday wings are too small",
            "prediction": "bad food, high prices on wings on tuesdays.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.741221234802104,
                "s_sbleu": 58.14307369682194,
                "r_avg_similarity": 0.8015,
                "r_similarities": [
                    0.8015
                ],
                "s_avg_similarity": 0.8446,
                "s_similarities": [
                    0.8446
                ],
                "s_ppl": 166.41859436035156,
                "t_ppl": 166.4185791015625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0034,
                    "neutral": 0.0162
                }
            }
        },
        {
            "index": 216,
            "input": "the place was busy but the service was excellent!",
            "reference": "busy place and had to wait an hour to get my food",
            "prediction": "the place was busy but the service was poor!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.085507150363302,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.6007,
                "r_similarities": [
                    0.6007
                ],
                "s_avg_similarity": 0.849,
                "s_similarities": [
                    0.849
                ],
                "s_ppl": 76.57482147216797,
                "t_ppl": 76.57482147216797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0031,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 217,
            "input": "tonight though i ordered to go and the food was just as good.",
            "reference": "i ordered to go but it seemed like they didnt cook me fresh food",
            "prediction": "The food is not as good as I expected.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.812739937159535,
                "s_sbleu": 6.68986069184485,
                "r_avg_similarity": 0.5226,
                "r_similarities": [
                    0.5226
                ],
                "s_avg_similarity": 0.5998,
                "s_similarities": [
                    0.5998
                ],
                "s_ppl": 14.094221115112305,
                "t_ppl": 14.094220161437988,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.004,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 218,
            "input": "this place has some great food.",
            "reference": "this place does not have the best food",
            "prediction": "this place has some bad food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.600736402830258,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.7366,
                "r_similarities": [
                    0.7366
                ],
                "s_avg_similarity": 0.691,
                "s_similarities": [
                    0.691
                ],
                "s_ppl": 55.3538818359375,
                "t_ppl": 55.35390853881836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0034,
                    "neutral": 0.017
                }
            }
        },
        {
            "index": 219,
            "input": "the two gentle men up front are always so kind.",
            "reference": "the two men infront were rude and did not help me",
            "prediction": "the two gentle men up front are always so rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 80.70557274927978,
                "r_avg_similarity": 0.6382,
                "r_similarities": [
                    0.6382
                ],
                "s_avg_similarity": 0.8426,
                "s_similarities": [
                    0.8426
                ],
                "s_ppl": 246.62721252441406,
                "t_ppl": 246.62718200683594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.966,
                    "positive": 0.0031,
                    "neutral": 0.0309
                }
            }
        },
        {
            "index": 220,
            "input": "the salsa is great, the fish top notch, the drinks just excellent.",
            "reference": "the salsa is thin, the fish smelled, the drinks just watery.",
            "prediction": "the salsa is not good, the fish is not good, the drinks are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.71015823041062,
                "s_sbleu": 18.71015823041062,
                "r_avg_similarity": 0.785,
                "r_similarities": [
                    0.785
                ],
                "s_avg_similarity": 0.839,
                "s_similarities": [
                    0.839
                ],
                "s_ppl": 14.434318542480469,
                "t_ppl": 14.434318542480469,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9747,
                    "positive": 0.0033,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 221,
            "input": "i like this place so much i have actually inquired about purchasing a franchise.",
            "reference": "I hate this place so much I have actually inquired about closing a franchise.",
            "prediction": "I do not like this place and I do not want to buy a franchise.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.451643194233863,
                "s_sbleu": 15.310245441182444,
                "r_avg_similarity": 0.7391,
                "r_similarities": [
                    0.7391
                ],
                "s_avg_similarity": 0.8069,
                "s_similarities": [
                    0.8069
                ],
                "s_ppl": 19.231897354125977,
                "t_ppl": 19.231901168823242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0032,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 222,
            "input": "and the seafood enchiladas were great!",
            "reference": "and the seafood enchiladas were horrible!",
            "prediction": "The seafood enchiladas were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 24.446151121745054,
                "r_avg_similarity": 0.8557,
                "r_similarities": [
                    0.8557
                ],
                "s_avg_similarity": 0.7194,
                "s_similarities": [
                    0.7194
                ],
                "s_ppl": 44.37652587890625,
                "t_ppl": 44.376522064208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0034,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 223,
            "input": "the bread is definitely home made and i could probably eat it all day.",
            "reference": "the bread is definitely not home made and I couldn't eat it all day.",
            "prediction": "the bread is definitely home made and i could probably eat it all day.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 49.35578819979932,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9251,
                "r_similarities": [
                    0.9251
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 58.672969818115234,
                "t_ppl": 58.6729621887207,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0017,
                    "positive": 0.9909,
                    "neutral": 0.0074
                }
            }
        },
        {
            "index": 224,
            "input": "the portions were huge, the food came out hot, fresh and good.",
            "reference": "the portions were small, the food came out cold, old, and bland.",
            "prediction": "the portions were small, the food came out cold, stale and bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 68.39589287903723,
                "s_sbleu": 35.630548449868954,
                "r_avg_similarity": 0.9248,
                "r_similarities": [
                    0.9248
                ],
                "s_avg_similarity": 0.859,
                "s_similarities": [
                    0.859
                ],
                "s_ppl": 79.77552032470703,
                "t_ppl": 79.77552032470703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0026,
                    "neutral": 0.0237
                }
            }
        },
        {
            "index": 225,
            "input": "a bit on the noisy side but the fresh food makes up for it.",
            "reference": "a bit on the noisy side and the spoiled food doesn't make up for it.",
            "prediction": "The noise in this restaurant is annoying, but the fresh food makes up for it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.844501337268932,
                "s_sbleu": 47.9676449968321,
                "r_avg_similarity": 0.6695,
                "r_similarities": [
                    0.6695
                ],
                "s_avg_similarity": 0.752,
                "s_similarities": [
                    0.752
                ],
                "s_ppl": 22.695758819580078,
                "t_ppl": 22.695775985717773,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.3281,
                    "positive": 0.3371,
                    "neutral": 0.3348
                }
            }
        },
        {
            "index": 226,
            "input": "ambiance and setting were superb.",
            "reference": "ambiance and setting were sub-par.",
            "prediction": "The ambiance and setting were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 36.55552228545123,
                "r_avg_similarity": 0.8141,
                "r_similarities": [
                    0.8141
                ],
                "s_avg_similarity": 0.7705,
                "s_similarities": [
                    0.7705
                ],
                "s_ppl": 74.8226547241211,
                "t_ppl": 74.8226547241211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0037,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 227,
            "input": "pizza was cooked to perfection and fast!",
            "reference": "pizza was cooked to a crisp and took forever!",
            "prediction": "The pizza was not cooked to perfection and it was slow.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.127993013562818,
                "s_sbleu": 25.211936184349828,
                "r_avg_similarity": 0.8299,
                "r_similarities": [
                    0.8299
                ],
                "s_avg_similarity": 0.8248,
                "s_similarities": [
                    0.8248
                ],
                "s_ppl": 45.314579010009766,
                "t_ppl": 45.31458282470703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9576,
                    "positive": 0.0029,
                    "neutral": 0.0395
                }
            }
        },
        {
            "index": 228,
            "input": "our bartender erik took care of my fiance and i very well.",
            "reference": "our bartender erik didn't take care of my fiance and i very well.",
            "prediction": "Our dises bartender is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.873083195618437,
                "s_sbleu": 3.3142882018868014,
                "r_avg_similarity": 0.5,
                "r_similarities": [
                    0.5
                ],
                "s_avg_similarity": 0.4394,
                "s_similarities": [
                    0.4394
                ],
                "s_ppl": 1211.299560546875,
                "t_ppl": 1211.3001708984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.0038,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 229,
            "input": "everyone who works there is always so happy and friendly.",
            "reference": "everyone who works there is always so angry and unfriendly.",
            "prediction": "The staff in this restaurant is always so unhappy and unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.200626759025184,
                "s_sbleu": 14.323145079400492,
                "r_avg_similarity": 0.6457,
                "r_similarities": [
                    0.6457
                ],
                "s_avg_similarity": 0.5307,
                "s_similarities": [
                    0.5307
                ],
                "s_ppl": 53.556766510009766,
                "t_ppl": 53.556785583496094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0035,
                    "neutral": 0.0144
                }
            }
        },
        {
            "index": 230,
            "input": "i love the cornbread appetizer.",
            "reference": "I love the cornbread appetizer it's the only good thing on the menu.",
            "prediction": "The cornbread appetizer is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.746166391236874,
                "s_sbleu": 14.535768424205482,
                "r_avg_similarity": 0.831,
                "r_similarities": [
                    0.831
                ],
                "s_avg_similarity": 0.8379,
                "s_similarities": [
                    0.8379
                ],
                "s_ppl": 111.66626739501953,
                "t_ppl": 111.66622161865234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0032,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 231,
            "input": "ordered the huevos rancheros and it was delicious!",
            "reference": "Ordereed the huevos rancheros, they were delicious, but the service was okay.",
            "prediction": "I ordered huevos rancheros and it was not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.4005180884547785,
                "s_sbleu": 42.7287006396234,
                "r_avg_similarity": 0.851,
                "r_similarities": [
                    0.851
                ],
                "s_avg_similarity": 0.9099,
                "s_similarities": [
                    0.9099
                ],
                "s_ppl": 21.795398712158203,
                "t_ppl": 21.795398712158203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0033,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 232,
            "input": "the customer service in this location is great!",
            "reference": "This place has great customer service, but okay food.",
            "prediction": "the customer service in this location is poor!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.635362674858093,
                "s_sbleu": 75.06238537503395,
                "r_avg_similarity": 0.4905,
                "r_similarities": [
                    0.4905
                ],
                "s_avg_similarity": 0.7,
                "s_similarities": [
                    0.7
                ],
                "s_ppl": 142.73440551757812,
                "t_ppl": 142.73440551757812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0043,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 233,
            "input": "the firecracker shrimp and duck is also always a winner.",
            "reference": "The firecracker shrimp is duck is the only winner on the menu.",
            "prediction": "the firecracker shrimp and duck is not always a winner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.165191946199384,
                "s_sbleu": 70.16879391277372,
                "r_avg_similarity": 0.8639,
                "r_similarities": [
                    0.8639
                ],
                "s_avg_similarity": 0.9075,
                "s_similarities": [
                    0.9075
                ],
                "s_ppl": 118.1634750366211,
                "t_ppl": 118.16346740722656,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.2557,
                    "positive": 0.0225,
                    "neutral": 0.7218
                }
            }
        },
        {
            "index": 234,
            "input": "service was wonderful to match!",
            "reference": "The service was wonderful, but the food was mew!",
            "prediction": "service was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.434818657591886,
                "s_sbleu": 17.491650626361256,
                "r_avg_similarity": 0.4812,
                "r_similarities": [
                    0.4812
                ],
                "s_avg_similarity": 0.5303,
                "s_similarities": [
                    0.5303
                ],
                "s_ppl": 65.59333038330078,
                "t_ppl": 65.5933609008789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0039,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 235,
            "input": "the service is friendly and attentive.",
            "reference": "The service was awful and hurtful.",
            "prediction": "the service is not friendly and attentive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 50.000000000000014,
                "r_avg_similarity": 0.5605,
                "r_similarities": [
                    0.5605
                ],
                "s_avg_similarity": 0.7322,
                "s_similarities": [
                    0.7322
                ],
                "s_ppl": 186.6747283935547,
                "t_ppl": 186.67481994628906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9803,
                    "positive": 0.0032,
                    "neutral": 0.0165
                }
            }
        },
        {
            "index": 236,
            "input": "great food and awesome service!",
            "reference": "Awful food, and poor customer service.",
            "prediction": "The food is not good and the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.789232204309912,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.6886,
                "r_similarities": [
                    0.6886
                ],
                "s_avg_similarity": 0.4022,
                "s_similarities": [
                    0.4022
                ],
                "s_ppl": 11.309779167175293,
                "t_ppl": 11.309782028198242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0037,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 237,
            "input": "this place still kicks ass.",
            "reference": "This place is just terrible.",
            "prediction": "this place is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 17.965205598154213,
                "r_avg_similarity": 0.6977,
                "r_similarities": [
                    0.6977
                ],
                "s_avg_similarity": 0.5048,
                "s_similarities": [
                    0.5048
                ],
                "s_ppl": 34.78369140625,
                "t_ppl": 34.783687591552734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0038,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 238,
            "input": "biscuits and gravy are a great breakfast item too.",
            "reference": "The biscuits and gravy are very bad items here.",
            "prediction": "biscuits and gravy are not a great breakfast item.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.8097,
                "r_similarities": [
                    0.8097
                ],
                "s_avg_similarity": 0.8058,
                "s_similarities": [
                    0.8058
                ],
                "s_ppl": 33.8487663269043,
                "t_ppl": 33.84877395629883,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9766,
                    "positive": 0.0039,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 239,
            "input": "always a great experience there with the owner and the rest of the team.",
            "reference": "Always a poor experience the owner and staff are rude.",
            "prediction": "I had a bad experience with the owner and the rest of the team.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.633270842295028,
                "s_sbleu": 65.54913610595183,
                "r_avg_similarity": 0.5539,
                "r_similarities": [
                    0.5539
                ],
                "s_avg_similarity": 0.6972,
                "s_similarities": [
                    0.6972
                ],
                "s_ppl": 12.85394287109375,
                "t_ppl": 12.853946685791016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0027,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 240,
            "input": "well worth searching out this gem.",
            "reference": "it's not a gem worth searching out.",
            "prediction": "This restaurant is not worth the time and money.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 4.990049701936832,
                "r_avg_similarity": 0.3394,
                "r_similarities": [
                    0.3394
                ],
                "s_avg_similarity": 0.1916,
                "s_similarities": [
                    0.1916
                ],
                "s_ppl": 29.511348724365234,
                "t_ppl": 29.511348724365234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9796,
                    "positive": 0.003,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 241,
            "input": "my husband and i enjoyed our 3rd anniversary here.",
            "reference": "my husband and i didn't enjoy our 3rd anniversary hear.",
            "prediction": "my husband and i did not enjoy our 3rd anniversary here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.66835442847811,
                "s_sbleu": 53.107253497886994,
                "r_avg_similarity": 0.9236,
                "r_similarities": [
                    0.9236
                ],
                "s_avg_similarity": 0.8933,
                "s_similarities": [
                    0.8933
                ],
                "s_ppl": 45.486515045166016,
                "t_ppl": 45.48651885986328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0032,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 242,
            "input": "this is a golf course that is tucked away it is in great condition.",
            "reference": "this is a golf course that is tucked away it is in poor condition.",
            "prediction": "this is a golf course that is tucked away it is in bad condition.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 82.42367502646057,
                "s_sbleu": 82.42367502646057,
                "r_avg_similarity": 0.9742,
                "r_similarities": [
                    0.9742
                ],
                "s_avg_similarity": 0.9405,
                "s_similarities": [
                    0.9405
                ],
                "s_ppl": 52.46046447753906,
                "t_ppl": 52.460479736328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9621,
                    "positive": 0.0025,
                    "neutral": 0.0355
                }
            }
        },
        {
            "index": 243,
            "input": "plus my sparkling wine flights were delish!",
            "reference": "plus my sparkling wine flights were gross!",
            "prediction": "I don't like sparkling wine.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 11.631736348831643,
                "r_avg_similarity": 0.552,
                "r_similarities": [
                    0.552
                ],
                "s_avg_similarity": 0.548,
                "s_similarities": [
                    0.548
                ],
                "s_ppl": 45.55842971801758,
                "t_ppl": 45.55844497680664,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.964,
                    "positive": 0.0049,
                    "neutral": 0.0311
                }
            }
        },
        {
            "index": 244,
            "input": "pricy but the cheese pies are delicious!",
            "reference": "pricy and these cheese pies are disgusting!",
            "prediction": "The cheese pies are not worth the price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.747405280050266,
                "s_sbleu": 19.070828081828378,
                "r_avg_similarity": 0.6686,
                "r_similarities": [
                    0.6686
                ],
                "s_avg_similarity": 0.6961,
                "s_similarities": [
                    0.6961
                ],
                "s_ppl": 99.53521728515625,
                "t_ppl": 99.53527069091797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.97,
                    "positive": 0.0031,
                    "neutral": 0.027
                }
            }
        },
        {
            "index": 245,
            "input": "the bbq salmon was good.",
            "reference": "hated the bbq salmon was pretty aweful",
            "prediction": "the bbq salmon was bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.01250851313262,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.8279,
                "r_similarities": [
                    0.8279
                ],
                "s_avg_similarity": 0.8592,
                "s_similarities": [
                    0.8592
                ],
                "s_ppl": 174.9908905029297,
                "t_ppl": 174.99087524414062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.0037,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 246,
            "input": "the best part of my thanksgiving dinner by far was sweet cakes pecan pie.",
            "reference": "the thanksgiving dinner was not what i expected especially the sweet cakes pecan pie",
            "prediction": "the worst part of my thanksgiving dinner by far was sweet cakes pecan pie.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.023693683267553,
                "s_sbleu": 86.66415730847507,
                "r_avg_similarity": 0.8611,
                "r_similarities": [
                    0.8611
                ],
                "s_avg_similarity": 0.9147,
                "s_similarities": [
                    0.9147
                ],
                "s_ppl": 106.61088562011719,
                "t_ppl": 106.6109390258789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0036,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 247,
            "input": "even their steamed veggies are amazing.",
            "reference": "steamed veggies were not properly steamed",
            "prediction": "Their steamed veggies are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 26.269098944241588,
                "r_avg_similarity": 0.7528,
                "r_similarities": [
                    0.7528
                ],
                "s_avg_similarity": 0.8591,
                "s_similarities": [
                    0.8591
                ],
                "s_ppl": 155.90411376953125,
                "t_ppl": 155.9041748046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9775,
                    "positive": 0.0035,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 248,
            "input": "this place is a must go if you're a bride to be!",
            "reference": "if you are a bride to be stay away",
            "prediction": "this place is not a must go if you're a bride to be!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.798317647335093,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.7195,
                "r_similarities": [
                    0.7195
                ],
                "s_avg_similarity": 0.9612,
                "s_similarities": [
                    0.9612
                ],
                "s_ppl": 37.304229736328125,
                "t_ppl": 37.30424118041992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8799,
                    "positive": 0.0045,
                    "neutral": 0.1156
                }
            }
        },
        {
            "index": 249,
            "input": "excellent combination of flavors, very unique.",
            "reference": "the flavors are nothing to write home about",
            "prediction": "The combination of flavors is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.7153,
                "r_similarities": [
                    0.7153
                ],
                "s_avg_similarity": 0.65,
                "s_similarities": [
                    0.65
                ],
                "s_ppl": 87.57968139648438,
                "t_ppl": 87.57968139648438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0032,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 250,
            "input": "mustard beef ribs are a must.",
            "reference": "mustard beef ribs was too hard",
            "prediction": "mustard beef ribs are not recommended.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.7628,
                "r_similarities": [
                    0.7628
                ],
                "s_avg_similarity": 0.8499,
                "s_similarities": [
                    0.8499
                ],
                "s_ppl": 178.5591278076172,
                "t_ppl": 178.5591278076172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9294,
                    "positive": 0.0027,
                    "neutral": 0.0679
                }
            }
        },
        {
            "index": 251,
            "input": "i had the burger once and it was juicy and very flavorful!",
            "reference": "the burger was not juicy enough and had no flavor",
            "prediction": "the burger was dry and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.112717058426785,
                "s_sbleu": 6.628576403773604,
                "r_avg_similarity": 0.8224,
                "r_similarities": [
                    0.8224
                ],
                "s_avg_similarity": 0.6208,
                "s_similarities": [
                    0.6208
                ],
                "s_ppl": 39.964988708496094,
                "t_ppl": 39.964996337890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9742,
                    "positive": 0.0032,
                    "neutral": 0.0226
                }
            }
        },
        {
            "index": 252,
            "input": "i rate the experience as followed.",
            "reference": "the experience was horrible",
            "prediction": "I rate the experience as followed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 80.91067115702207,
                "r_avg_similarity": 0.5608,
                "r_similarities": [
                    0.5608
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 273.7793273925781,
                "t_ppl": 273.7794189453125,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0031,
                    "positive": 0.2863,
                    "neutral": 0.7106
                }
            }
        },
        {
            "index": 253,
            "input": "always order the tzatziki sauce with everything you get!",
            "reference": "the tzatziki sauce was very bland to me",
            "prediction": "I don't like tzatziki sauce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.631736348831643,
                "s_sbleu": 8.33450329027712,
                "r_avg_similarity": 0.82,
                "r_similarities": [
                    0.82
                ],
                "s_avg_similarity": 0.7401,
                "s_similarities": [
                    0.7401
                ],
                "s_ppl": 19.135656356811523,
                "t_ppl": 19.13565444946289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9555,
                    "positive": 0.0037,
                    "neutral": 0.0408
                }
            }
        },
        {
            "index": 254,
            "input": "my meal was very satisfying and flavorful.",
            "reference": "the meal was not cooked properly and had no flavor",
            "prediction": "my meal was not satisfying and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.20339087300932,
                "s_sbleu": 27.05411345269698,
                "r_avg_similarity": 0.7989,
                "r_similarities": [
                    0.7989
                ],
                "s_avg_similarity": 0.7636,
                "s_similarities": [
                    0.7636
                ],
                "s_ppl": 94.71633911132812,
                "t_ppl": 94.71630096435547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 255,
            "input": "try anything on the menu and you will be glad you came in!",
            "reference": "i would not try anything on their menu",
            "prediction": "I don't recommend anything on the menu.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 16.330693525223236,
                "r_avg_similarity": 0.7751,
                "r_similarities": [
                    0.7751
                ],
                "s_avg_similarity": 0.579,
                "s_similarities": [
                    0.579
                ],
                "s_ppl": 25.974626541137695,
                "t_ppl": 25.974632263183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9544,
                    "positive": 0.0033,
                    "neutral": 0.0423
                }
            }
        },
        {
            "index": 256,
            "input": "bartender made a great dirty martini!",
            "reference": "bartender gave me a watered down martini",
            "prediction": "The bartender made a bad dirty martini!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.267884212102741,
                "s_sbleu": 34.57207846419411,
                "r_avg_similarity": 0.7768,
                "r_similarities": [
                    0.7768
                ],
                "s_avg_similarity": 0.9399,
                "s_similarities": [
                    0.9399
                ],
                "s_ppl": 308.34027099609375,
                "t_ppl": 308.3403015136719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9664,
                    "positive": 0.004,
                    "neutral": 0.0297
                }
            }
        },
        {
            "index": 257,
            "input": "omg carlsbad tavern is awesome!",
            "reference": "carlsbad tavern you need to improve your service",
            "prediction": "omg carlsbad tavern is not awesome!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.386050660556931,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.7444,
                "r_similarities": [
                    0.7444
                ],
                "s_avg_similarity": 0.9557,
                "s_similarities": [
                    0.9557
                ],
                "s_ppl": 650.7105712890625,
                "t_ppl": 650.7105712890625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0043,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 258,
            "input": "other than that, it's great!",
            "reference": "other than that, i wont be back",
            "prediction": "other than that, it's terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 35.64026463354184,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.3492,
                "r_similarities": [
                    0.3492
                ],
                "s_avg_similarity": 0.7733,
                "s_similarities": [
                    0.7733
                ],
                "s_ppl": 39.558963775634766,
                "t_ppl": 39.5589714050293,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0048,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 259,
            "input": "best breakfast i had on my recent trip to scottsdale.",
            "reference": "the breakfast was cold, did not enjoy it",
            "prediction": "The breakfast i had on my recent trip to scottsdale was the worst.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 61.153805769010226,
                "r_avg_similarity": 0.5006,
                "r_similarities": [
                    0.5006
                ],
                "s_avg_similarity": 0.8971,
                "s_similarities": [
                    0.8971
                ],
                "s_ppl": 49.213653564453125,
                "t_ppl": 49.213680267333984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9834,
                    "positive": 0.0039,
                    "neutral": 0.0128
                }
            }
        },
        {
            "index": 260,
            "input": "extremely attentive and genuinely a good person.",
            "reference": "they didn't pay attention, horrible people",
            "prediction": "extremely inattentive and not a good person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 38.260294162784476,
                "r_avg_similarity": 0.403,
                "r_similarities": [
                    0.403
                ],
                "s_avg_similarity": 0.5941,
                "s_similarities": [
                    0.5941
                ],
                "s_ppl": 17.37738800048828,
                "t_ppl": 17.37738800048828,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.0033,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 261,
            "input": "it's basic, traditional, mexican food that is homemade and tastes great.",
            "reference": "the food was bland and not that traditional",
            "prediction": "it's basic, traditional, mexican food that is homemade and tastes bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.016138436407654,
                "s_sbleu": 85.5526185871245,
                "r_avg_similarity": 0.5346,
                "r_similarities": [
                    0.5346
                ],
                "s_avg_similarity": 0.9407,
                "s_similarities": [
                    0.9407
                ],
                "s_ppl": 58.890419006347656,
                "t_ppl": 58.89041519165039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0029,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 262,
            "input": "food is very fresh and amazing!",
            "reference": "food was old and stale",
            "prediction": "food is not fresh and not amazing!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 19.130147081392234,
                "r_avg_similarity": 0.5836,
                "r_similarities": [
                    0.5836
                ],
                "s_avg_similarity": 0.8632,
                "s_similarities": [
                    0.8632
                ],
                "s_ppl": 130.6654510498047,
                "t_ppl": 130.66549682617188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0036,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 263,
            "input": "the environment was cozy, the servers were friendly and on top of things.",
            "reference": "the place was not inviting and staff seemed aloof",
            "prediction": "the environment was uncomfortable, the servers were not friendly and not on top of things.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.234245292096216,
                "s_sbleu": 45.83034067124108,
                "r_avg_similarity": 0.5352,
                "r_similarities": [
                    0.5352
                ],
                "s_avg_similarity": 0.8461,
                "s_similarities": [
                    0.8461
                ],
                "s_ppl": 53.34427261352539,
                "t_ppl": 53.34424591064453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0031,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 264,
            "input": "fish tacos were pretty good.",
            "reference": "fish tacos were the worst I had",
            "prediction": "fish tacos were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.57539057896621,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.8744,
                "r_similarities": [
                    0.8744
                ],
                "s_avg_similarity": 0.9056,
                "s_similarities": [
                    0.9056
                ],
                "s_ppl": 133.25477600097656,
                "t_ppl": 133.25477600097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0038,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 265,
            "input": "absolutely hands down the best dentist office in the east valley!",
            "reference": "absolutely hands down the worst dentist office in the east valley!",
            "prediction": "I hate this dentist office.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.971932565563823,
                "s_sbleu": 5.971932565563823,
                "r_avg_similarity": 0.7948,
                "r_similarities": [
                    0.7948
                ],
                "s_avg_similarity": 0.6776,
                "s_similarities": [
                    0.6776
                ],
                "s_ppl": 472.5006103515625,
                "t_ppl": 472.5006408691406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0056,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 266,
            "input": "they are all very friendly.",
            "reference": "they are all very unfriendly.",
            "prediction": "they are all very unfriendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.6891,
                "s_similarities": [
                    0.6891
                ],
                "s_ppl": 27.32830810546875,
                "t_ppl": 27.32831382751465,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9808,
                    "positive": 0.0035,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 267,
            "input": "he always looks gorgeous and is so happy when i pick him up!",
            "reference": "he always looks ugly and is so sad when i pick him up!",
            "prediction": "he always looks so ugly and is so unhappy when i pick him up!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 57.73502691896257,
                "s_sbleu": 49.35578819979932,
                "r_avg_similarity": 0.9599,
                "r_similarities": [
                    0.9599
                ],
                "s_avg_similarity": 0.8175,
                "s_similarities": [
                    0.8175
                ],
                "s_ppl": 60.665740966796875,
                "t_ppl": 60.665740966796875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.003,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 268,
            "input": "i love italian and i eat here often.",
            "reference": "i hate italian and i don't eat here often.",
            "prediction": "I hate italian and i never eat here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.010083098515025,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.9713,
                "r_similarities": [
                    0.9713
                ],
                "s_avg_similarity": 0.8766,
                "s_similarities": [
                    0.8766
                ],
                "s_ppl": 166.1460723876953,
                "t_ppl": 166.14614868164062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0042,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 269,
            "input": "quality of food is fantastic.",
            "reference": "quality of food is awful.",
            "prediction": "quality of food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.8523,
                "r_similarities": [
                    0.8523
                ],
                "s_avg_similarity": 0.7318,
                "s_similarities": [
                    0.7318
                ],
                "s_ppl": 32.59433364868164,
                "t_ppl": 32.59433364868164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0037,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 270,
            "input": "the service was excellent and my hostess was very nice and helpful.",
            "reference": "my hostess was terrible and slow, and the service was not on par with nearby places",
            "prediction": "the service was poor and my hostess was not helpful at all.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.15312692483092,
                "s_sbleu": 29.782017963590448,
                "r_avg_similarity": 0.8656,
                "r_similarities": [
                    0.8656
                ],
                "s_avg_similarity": 0.7765,
                "s_similarities": [
                    0.7765
                ],
                "s_ppl": 46.71834182739258,
                "t_ppl": 46.71835708618164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0038,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 271,
            "input": "the best bar in town.",
            "reference": "the bar had very few selections",
            "prediction": "the worst bar in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.498,
                "r_similarities": [
                    0.498
                ],
                "s_avg_similarity": 0.8421,
                "s_similarities": [
                    0.8421
                ],
                "s_ppl": 80.5150375366211,
                "t_ppl": 80.5150375366211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0057,
                    "neutral": 0.0132
                }
            }
        },
        {
            "index": 272,
            "input": "they are always doing a good job.",
            "reference": "did not do a good job at all",
            "prediction": "they are always doing a bad job.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.4031,
                "r_similarities": [
                    0.4031
                ],
                "s_avg_similarity": 0.8522,
                "s_similarities": [
                    0.8522
                ],
                "s_ppl": 37.09247970581055,
                "t_ppl": 37.09247970581055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0034,
                    "neutral": 0.0171
                }
            }
        },
        {
            "index": 273,
            "input": "russ was a well qualified tech.",
            "reference": "the tech did not know what to do",
            "prediction": "russ was a bad tech.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 32.159351091190125,
                "r_avg_similarity": 0.4527,
                "r_similarities": [
                    0.4527
                ],
                "s_avg_similarity": 0.8704,
                "s_similarities": [
                    0.8704
                ],
                "s_ppl": 355.49761962890625,
                "t_ppl": 355.49774169921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0032,
                    "neutral": 0.021
                }
            }
        },
        {
            "index": 274,
            "input": "when we get into town, this is the first place we come!",
            "reference": "this is the last place i would go if i came into town",
            "prediction": "when we get into town, this is the last place we come!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.57690288450511,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.7604,
                "r_similarities": [
                    0.7604
                ],
                "s_avg_similarity": 0.8538,
                "s_similarities": [
                    0.8538
                ],
                "s_ppl": 38.35397720336914,
                "t_ppl": 38.35398483276367,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.1045,
                    "positive": 0.0301,
                    "neutral": 0.8654
                }
            }
        },
        {
            "index": 275,
            "input": "thank you fiesta, lunch with you is always good.",
            "reference": "lunch was horrible, i wont be back",
            "prediction": "I don't like fiesta, lunch with you is always bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 53.3167536340577,
                "r_avg_similarity": 0.5497,
                "r_similarities": [
                    0.5497
                ],
                "s_avg_similarity": 0.7964,
                "s_similarities": [
                    0.7964
                ],
                "s_ppl": 82.28797149658203,
                "t_ppl": 82.28797149658203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0032,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 276,
            "input": "they also are the best price in the area.",
            "reference": "the prices were too high",
            "prediction": "they are the worst price in the area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 47.49549533009781,
                "r_avg_similarity": 0.4613,
                "r_similarities": [
                    0.4613
                ],
                "s_avg_similarity": 0.7356,
                "s_similarities": [
                    0.7356
                ],
                "s_ppl": 47.25019073486328,
                "t_ppl": 47.25021743774414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0042,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 277,
            "input": "green chile chimis are fantastic.",
            "reference": "the green chile chimis were too cold",
            "prediction": "green chile chimis are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.791,
                "r_similarities": [
                    0.791
                ],
                "s_avg_similarity": 0.8964,
                "s_similarities": [
                    0.8964
                ],
                "s_ppl": 315.9057922363281,
                "t_ppl": 315.90594482421875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0037,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 278,
            "input": "thanks for the perfect repair.",
            "reference": "did not do a great job with the repair",
            "prediction": "thanks for the bad repair.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.854497694024015,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.65,
                "r_similarities": [
                    0.65
                ],
                "s_avg_similarity": 0.8928,
                "s_similarities": [
                    0.8928
                ],
                "s_ppl": 142.0337371826172,
                "t_ppl": 142.0337371826172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0053,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 279,
            "input": "casual atmosphere, upscale food.",
            "reference": "the food was not upscale and the athmosphere was boring",
            "prediction": "The restaurant is not a good place to eat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 4.196114906296549,
                "r_avg_similarity": 0.3706,
                "r_similarities": [
                    0.3706
                ],
                "s_avg_similarity": 0.291,
                "s_similarities": [
                    0.291
                ],
                "s_ppl": 22.3934268951416,
                "t_ppl": 22.3934326171875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0032,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 280,
            "input": "had dinner here last night and it was great.",
            "reference": "had dinner here last night and it sucked",
            "prediction": "I had dinner here last night and it was terrible.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 57.067457770559976,
                "s_sbleu": 69.89307622784945,
                "r_avg_similarity": 0.8568,
                "r_similarities": [
                    0.8568
                ],
                "s_avg_similarity": 0.8229,
                "s_similarities": [
                    0.8229
                ],
                "s_ppl": 19.51020622253418,
                "t_ppl": 19.51020622253418,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0039,
                    "neutral": 0.0134
                }
            }
        },
        {
            "index": 281,
            "input": "the marinara sauce is so flavorful.",
            "reference": "the marinara sauce had no flavor",
            "prediction": "the marinara sauce is not flavorful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.8304,
                "r_similarities": [
                    0.8304
                ],
                "s_avg_similarity": 0.8096,
                "s_similarities": [
                    0.8096
                ],
                "s_ppl": 60.09145736694336,
                "t_ppl": 60.09148406982422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0029,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 282,
            "input": "they are incredibly nice and accommodating.",
            "reference": "they are not nice or accommodating",
            "prediction": "they are not nice and accommodating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.9441,
                "r_similarities": [
                    0.9441
                ],
                "s_avg_similarity": 0.6999,
                "s_similarities": [
                    0.6999
                ],
                "s_ppl": 98.2003173828125,
                "t_ppl": 98.2003173828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9773,
                    "positive": 0.0032,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 283,
            "input": "the service was top notch and the food was a bit of heaven.",
            "reference": "the service was bad and the food was hellish",
            "prediction": "the service was not good and the food was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.66148710292676,
                "s_sbleu": 26.83544415402699,
                "r_avg_similarity": 0.8604,
                "r_similarities": [
                    0.8604
                ],
                "s_avg_similarity": 0.6317,
                "s_similarities": [
                    0.6317
                ],
                "s_ppl": 24.56744384765625,
                "t_ppl": 24.567453384399414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0036,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 284,
            "input": "it can be pricey, but it is really worth it.",
            "reference": "it can be pricey but isn't even worth it",
            "prediction": "it is not worth the price.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.8689248188165335,
                "s_sbleu": 7.64649370538093,
                "r_avg_similarity": 0.7499,
                "r_similarities": [
                    0.7499
                ],
                "s_avg_similarity": 0.709,
                "s_similarities": [
                    0.709
                ],
                "s_ppl": 20.662738800048828,
                "t_ppl": 20.662744522094727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9625,
                    "positive": 0.0034,
                    "neutral": 0.0341
                }
            }
        },
        {
            "index": 285,
            "input": "wonderful staff, wonderful food, excellent prices.",
            "reference": "horrible staff, terrible food, disgusting prices.",
            "prediction": "The staff is not friendly, the food is not good, the prices are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3613183938332405,
                "s_sbleu": 3.3613183938332405,
                "r_avg_similarity": 0.6749,
                "r_similarities": [
                    0.6749
                ],
                "s_avg_similarity": 0.6481,
                "s_similarities": [
                    0.6481
                ],
                "s_ppl": 11.74944019317627,
                "t_ppl": 11.749442100524902,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0032,
                    "neutral": 0.0167
                }
            }
        },
        {
            "index": 286,
            "input": "portions n prices were great!",
            "reference": "portions n prices were unacceptable!",
            "prediction": "portions n prices were not great!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 43.47208719449914,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.9099,
                "r_similarities": [
                    0.9099
                ],
                "s_avg_similarity": 0.929,
                "s_similarities": [
                    0.929
                ],
                "s_ppl": 1425.2432861328125,
                "t_ppl": 1425.2440185546875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9795,
                    "positive": 0.0037,
                    "neutral": 0.0168
                }
            }
        },
        {
            "index": 287,
            "input": "every person enjoyed themselves and there was nothing but praise from our entire group.",
            "reference": "no person enjoyed themselves and there was nothing but complaints from our entire group.",
            "prediction": "every person was disappointed and there was nothing but complaints from our entire group.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 71.66258375282708,
                "s_sbleu": 53.03624596095554,
                "r_avg_similarity": 0.7592,
                "r_similarities": [
                    0.7592
                ],
                "s_avg_similarity": 0.6522,
                "s_similarities": [
                    0.6522
                ],
                "s_ppl": 66.94348907470703,
                "t_ppl": 66.94348907470703,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9765,
                    "positive": 0.0028,
                    "neutral": 0.0206
                }
            }
        },
        {
            "index": 288,
            "input": "outstanding persian food not to mention service.",
            "reference": "disgusting persian food not to mention service.",
            "prediction": "The persian food is not good and the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.768562846380176,
                "s_sbleu": 7.768562846380176,
                "r_avg_similarity": 0.8214,
                "r_similarities": [
                    0.8214
                ],
                "s_avg_similarity": 0.8122,
                "s_similarities": [
                    0.8122
                ],
                "s_ppl": 31.69898223876953,
                "t_ppl": 31.6989803314209,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0034,
                    "neutral": 0.0157
                }
            }
        },
        {
            "index": 289,
            "input": "thank you for a fabulous evening!",
            "reference": "thank you for a forgettable evening!",
            "prediction": "I am not satisfied with the evening.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 5.522397783539471,
                "r_avg_similarity": 0.3034,
                "r_similarities": [
                    0.3034
                ],
                "s_avg_similarity": 0.4223,
                "s_similarities": [
                    0.4223
                ],
                "s_ppl": 48.51756286621094,
                "t_ppl": 48.51757049560547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0041,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 290,
            "input": "my daughter received great care.",
            "reference": "my daughter was treated terribly",
            "prediction": "my daughter received poor care.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.8141,
                "r_similarities": [
                    0.8141
                ],
                "s_avg_similarity": 0.8728,
                "s_similarities": [
                    0.8728
                ],
                "s_ppl": 349.8310852050781,
                "t_ppl": 349.8310852050781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0031,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 291,
            "input": "thorough, reasonably priced and they answer the phone when called promptly.",
            "reference": "i called so many times no one answered at all",
            "prediction": "The restaurant is not thorough, the price is not reasonable and they do not answer the phone promptly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 11.794224053267106,
                "r_avg_similarity": 0.2997,
                "r_similarities": [
                    0.2997
                ],
                "s_avg_similarity": 0.6684,
                "s_similarities": [
                    0.6684
                ],
                "s_ppl": 31.580575942993164,
                "t_ppl": 31.580577850341797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0028,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 292,
            "input": "they were very friendly and apologetic.",
            "reference": "no one was helpful nor friendly there",
            "prediction": "they were very rude and inconsiderate.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.4589,
                "r_similarities": [
                    0.4589
                ],
                "s_avg_similarity": 0.6128,
                "s_similarities": [
                    0.6128
                ],
                "s_ppl": 15.413956642150879,
                "t_ppl": 15.413963317871094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0038,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 293,
            "input": "the wine list was the best part.",
            "reference": "not enough wine choices",
            "prediction": "the wine list was the worst part.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.5535,
                "r_similarities": [
                    0.5535
                ],
                "s_avg_similarity": 0.8042,
                "s_similarities": [
                    0.8042
                ],
                "s_ppl": 97.27243041992188,
                "t_ppl": 97.27247619628906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.981,
                    "positive": 0.0038,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 294,
            "input": "it's a much better option than the club scene.",
            "reference": "i would rather go to the club than here",
            "prediction": "it's a much worse option than the club scene.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.287528999566801,
                "s_sbleu": 65.80370064762461,
                "r_avg_similarity": 0.6332,
                "r_similarities": [
                    0.6332
                ],
                "s_avg_similarity": 0.9418,
                "s_similarities": [
                    0.9418
                ],
                "s_ppl": 69.73975372314453,
                "t_ppl": 69.73975372314453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0027,
                    "neutral": 0.0253
                }
            }
        },
        {
            "index": 295,
            "input": "i ordered the carne asada steak and it was cooked perfectly!",
            "reference": "the asada steak was barely cooked and raw",
            "prediction": "the carne asada steak was not cooked properly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.164945583740657,
                "s_sbleu": 23.668206578270098,
                "r_avg_similarity": 0.8055,
                "r_similarities": [
                    0.8055
                ],
                "s_avg_similarity": 0.7827,
                "s_similarities": [
                    0.7827
                ],
                "s_ppl": 34.97111129760742,
                "t_ppl": 34.971107482910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9689,
                    "positive": 0.0027,
                    "neutral": 0.0283
                }
            }
        },
        {
            "index": 296,
            "input": "that comes with the smaller location though.",
            "reference": "this location is too small",
            "prediction": "that comes with the smaller location though.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6112,
                "r_similarities": [
                    0.6112
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 319.7356872558594,
                "t_ppl": 319.73583984375,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0213,
                    "positive": 0.0264,
                    "neutral": 0.9523
                }
            }
        },
        {
            "index": 297,
            "input": "fun place to go drink beer.",
            "reference": "too crowded and not a great place to take a beer",
            "prediction": "I don't like this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.5275023606301383,
                "s_sbleu": 8.170609724417774,
                "r_avg_similarity": 0.3952,
                "r_similarities": [
                    0.3952
                ],
                "s_avg_similarity": 0.3554,
                "s_similarities": [
                    0.3554
                ],
                "s_ppl": 14.082663536071777,
                "t_ppl": 14.082666397094727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0042,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 298,
            "input": "it is very very family oriented and we loved that too!",
            "reference": "too many single people, not a place for your family",
            "prediction": "it is not a good place for family.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.417530270031051,
                "s_sbleu": 7.561318691530973,
                "r_avg_similarity": 0.5741,
                "r_similarities": [
                    0.5741
                ],
                "s_avg_similarity": 0.4056,
                "s_similarities": [
                    0.4056
                ],
                "s_ppl": 35.4516487121582,
                "t_ppl": 35.45165252685547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9781,
                    "positive": 0.0035,
                    "neutral": 0.0184
                }
            }
        },
        {
            "index": 299,
            "input": "even the sides were great.",
            "reference": "the sides were to expensive and small",
            "prediction": "even the sides were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 24.446151121745054,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.6435,
                "r_similarities": [
                    0.6435
                ],
                "s_avg_similarity": 0.8728,
                "s_similarities": [
                    0.8728
                ],
                "s_ppl": 170.77174377441406,
                "t_ppl": 170.77183532714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.95,
                    "positive": 0.0038,
                    "neutral": 0.0462
                }
            }
        },
        {
            "index": 300,
            "input": "she did an amazing job on my color and my cut!",
            "reference": "the job was poor on my color and cut",
            "prediction": "she did a bad job on my color and my cut!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320527996,
                "s_sbleu": 67.0422683816333,
                "r_avg_similarity": 0.7185,
                "r_similarities": [
                    0.7185
                ],
                "s_avg_similarity": 0.8858,
                "s_similarities": [
                    0.8858
                ],
                "s_ppl": 89.07600402832031,
                "t_ppl": 89.0760498046875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9752,
                    "positive": 0.0028,
                    "neutral": 0.022
                }
            }
        },
        {
            "index": 301,
            "input": "the owner is a hoot and the facility is very accommodating.",
            "reference": "the owner was boring and the place not that welcoming",
            "prediction": "the owner is a jerk and the facility is very uncomfortable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.578464408619825,
                "s_sbleu": 54.52469119630863,
                "r_avg_similarity": 0.4836,
                "r_similarities": [
                    0.4836
                ],
                "s_avg_similarity": 0.5595,
                "s_similarities": [
                    0.5595
                ],
                "s_ppl": 79.61241912841797,
                "t_ppl": 79.61245727539062,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0035,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 302,
            "input": "totally will come back next time i'm in town.",
            "reference": "won't go back",
            "prediction": "I will never come back to this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 10.147104008451905,
                "r_avg_similarity": 0.3883,
                "r_similarities": [
                    0.3883
                ],
                "s_avg_similarity": 0.3133,
                "s_similarities": [
                    0.3133
                ],
                "s_ppl": 27.11947250366211,
                "t_ppl": 27.11945915222168,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9664,
                    "positive": 0.0047,
                    "neutral": 0.0289
                }
            }
        },
        {
            "index": 303,
            "input": "he was both professional and courteous.",
            "reference": "seem unprofessional and aloof",
            "prediction": "he was both unprofessional and rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.5795,
                "r_similarities": [
                    0.5795
                ],
                "s_avg_similarity": 0.6826,
                "s_similarities": [
                    0.6826
                ],
                "s_ppl": 42.57008743286133,
                "t_ppl": 42.57009506225586,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0035,
                    "neutral": 0.0152
                }
            }
        },
        {
            "index": 304,
            "input": "this course is one of the finest in the area.",
            "reference": "the course is not the best",
            "prediction": "this course is the worst in the area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.339582221952005,
                "s_sbleu": 35.73880113629118,
                "r_avg_similarity": 0.7654,
                "r_similarities": [
                    0.7654
                ],
                "s_avg_similarity": 0.7601,
                "s_similarities": [
                    0.7601
                ],
                "s_ppl": 56.20249557495117,
                "t_ppl": 56.20252227783203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0042,
                    "neutral": 0.013
                }
            }
        },
        {
            "index": 305,
            "input": "if you're into that sort of thing stop by and check it out!",
            "reference": "Even if you're into that sort of thing, I wouldn't check it out.",
            "prediction": "if you're into that sort of thing stop by and check it out!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 49.5043021737605,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7749,
                "r_similarities": [
                    0.7749
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 9.613404273986816,
                "t_ppl": 9.6134033203125,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.002,
                    "positive": 0.5606,
                    "neutral": 0.4374
                }
            }
        },
        {
            "index": 306,
            "input": "i enjoy coming here for lunch to get the slices.",
            "reference": "I dislike coming here for lunch to get the slices.",
            "prediction": "I do not like the slices.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.834636222628122,
                "s_sbleu": 13.805184551789745,
                "r_avg_similarity": 0.7319,
                "r_similarities": [
                    0.7319
                ],
                "s_avg_similarity": 0.6322,
                "s_similarities": [
                    0.6322
                ],
                "s_ppl": 112.35151672363281,
                "t_ppl": 112.35157012939453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.0034,
                    "neutral": 0.0247
                }
            }
        },
        {
            "index": 307,
            "input": "it is a half a day trip from phoenix area.",
            "reference": "It's a long, half a day trip from phoenix area.",
            "prediction": "it is a long way from phoenix area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.433143129197216,
                "s_sbleu": 34.5654323273158,
                "r_avg_similarity": 0.8285,
                "r_similarities": [
                    0.8285
                ],
                "s_avg_similarity": 0.7711,
                "s_similarities": [
                    0.7711
                ],
                "s_ppl": 67.0871353149414,
                "t_ppl": 67.08712768554688,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.028,
                    "positive": 0.0164,
                    "neutral": 0.9556
                }
            }
        },
        {
            "index": 308,
            "input": "love the vibe of this place!",
            "reference": "I hate the vibe of this place.",
            "prediction": "I hate the vibe of this place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.9446,
                "r_similarities": [
                    0.9446
                ],
                "s_avg_similarity": 0.7604,
                "s_similarities": [
                    0.7604
                ],
                "s_ppl": 49.6043815612793,
                "t_ppl": 49.604393005371094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.0052,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 309,
            "input": "the staff are all super friendly and on top of there jobs.",
            "reference": "The staff are not friendly and not on top of their jobs.",
            "prediction": "the staff are not friendly and not on top of there jobs.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.16035864257111,
                "s_sbleu": 52.664038784792666,
                "r_avg_similarity": 0.989,
                "r_similarities": [
                    0.989
                ],
                "s_avg_similarity": 0.7173,
                "s_similarities": [
                    0.7173
                ],
                "s_ppl": 79.89329528808594,
                "t_ppl": 79.89334106445312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0036,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 310,
            "input": "corn bread was also good!",
            "reference": "the corn bread was stale",
            "prediction": "corn bread is not good!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 22.957488466614326,
                "r_avg_similarity": 0.7708,
                "r_similarities": [
                    0.7708
                ],
                "s_avg_similarity": 0.8227,
                "s_similarities": [
                    0.8227
                ],
                "s_ppl": 169.7357940673828,
                "t_ppl": 169.73577880859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0039,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 311,
            "input": "food super and well priced.",
            "reference": "the food was very over priced",
            "prediction": "food is not so good and overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 7.267884212102741,
                "r_avg_similarity": 0.737,
                "r_similarities": [
                    0.737
                ],
                "s_avg_similarity": 0.7098,
                "s_similarities": [
                    0.7098
                ],
                "s_ppl": 46.5604248046875,
                "t_ppl": 46.560455322265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9764,
                    "positive": 0.0033,
                    "neutral": 0.0203
                }
            }
        },
        {
            "index": 312,
            "input": "they loved the rock climb.",
            "reference": "the rock climb was ok",
            "prediction": "they hated the rock climb.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.213753973567677,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.6499,
                "r_similarities": [
                    0.6499
                ],
                "s_avg_similarity": 0.8269,
                "s_similarities": [
                    0.8269
                ],
                "s_ppl": 413.70440673828125,
                "t_ppl": 413.70440673828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9447,
                    "positive": 0.0049,
                    "neutral": 0.0504
                }
            }
        },
        {
            "index": 313,
            "input": "super tasty and a much better deal than the chain sub joints.",
            "reference": "the food was bland and not as good as chain joints",
            "prediction": "the sandwich is not tasty and the price is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 7.410494411527525,
                "r_avg_similarity": 0.4525,
                "r_similarities": [
                    0.4525
                ],
                "s_avg_similarity": 0.4156,
                "s_similarities": [
                    0.4156
                ],
                "s_ppl": 34.12173843383789,
                "t_ppl": 34.12173843383789,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0029,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 314,
            "input": "by far the best experience i have ever had in a auto shop.",
            "reference": "possibly the worst i've had at an auto shop",
            "prediction": "by far the worst experience i have ever had in a auto shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.493098745313143,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.8751,
                "r_similarities": [
                    0.8751
                ],
                "s_avg_similarity": 0.8793,
                "s_similarities": [
                    0.8793
                ],
                "s_ppl": 19.371904373168945,
                "t_ppl": 19.371904373168945,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9829,
                    "positive": 0.0047,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 315,
            "input": "so happy with my decision to go here.",
            "reference": "so unhappy with my decision to go here",
            "prediction": "so disappointed with my decision to go here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.04735835807847,
                "s_sbleu": 75.06238537503395,
                "r_avg_similarity": 0.8612,
                "r_similarities": [
                    0.8612
                ],
                "s_avg_similarity": 0.8052,
                "s_similarities": [
                    0.8052
                ],
                "s_ppl": 42.16849136352539,
                "t_ppl": 42.16851043701172,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0033,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 316,
            "input": "it was pretty inexpensive and they played good music videos.",
            "reference": "it was pretty expensive and played bad music videos",
            "prediction": "The price is too expensive and the music is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.6023,
                "r_similarities": [
                    0.6023
                ],
                "s_avg_similarity": 0.5994,
                "s_similarities": [
                    0.5994
                ],
                "s_ppl": 26.885128021240234,
                "t_ppl": 26.885128021240234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9724,
                    "positive": 0.0028,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 317,
            "input": "very throwback atmosphere; vintage ice cream parlor.",
            "reference": "very throwback atmosphere; old ice cream parlor",
            "prediction": "The atmosphere is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.815868174415823,
                "s_sbleu": 5.854497694024015,
                "r_avg_similarity": 0.2993,
                "r_similarities": [
                    0.2993
                ],
                "s_avg_similarity": 0.2773,
                "s_similarities": [
                    0.2773
                ],
                "s_ppl": 53.36265182495117,
                "t_ppl": 53.36265182495117,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9768,
                    "positive": 0.0038,
                    "neutral": 0.0195
                }
            }
        },
        {
            "index": 318,
            "input": "sit at the bar and eat the small plates.",
            "reference": "sat at the bar and ate overly small plates",
            "prediction": "I don't like to sit at the bar and eat the small plates.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.142141714303076,
                "s_sbleu": 67.67781116542882,
                "r_avg_similarity": 0.7143,
                "r_similarities": [
                    0.7143
                ],
                "s_avg_similarity": 0.8072,
                "s_similarities": [
                    0.8072
                ],
                "s_ppl": 23.50601577758789,
                "t_ppl": 23.506017684936523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8721,
                    "positive": 0.0074,
                    "neutral": 0.1205
                }
            }
        },
        {
            "index": 319,
            "input": "the grounds are always very clean.",
            "reference": "the grounds are always very filthy",
            "prediction": "the grounds are always very dirty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.47881529512643,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.9133,
                "r_similarities": [
                    0.9133
                ],
                "s_avg_similarity": 0.8961,
                "s_similarities": [
                    0.8961
                ],
                "s_ppl": 217.19509887695312,
                "t_ppl": 217.19509887695312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9762,
                    "positive": 0.0032,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 320,
            "input": "i just returned from a delightful stay at the camelback.",
            "reference": "I just returned from a terrible stay at the camelback.",
            "prediction": "I just returned from a disappointing stay at the camelback.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.16879391277372,
                "s_sbleu": 58.77283725105319,
                "r_avg_similarity": 0.9516,
                "r_similarities": [
                    0.9516
                ],
                "s_avg_similarity": 0.9149,
                "s_similarities": [
                    0.9149
                ],
                "s_ppl": 95.03732299804688,
                "t_ppl": 95.03738403320312,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9798,
                    "positive": 0.0032,
                    "neutral": 0.0169
                }
            }
        },
        {
            "index": 321,
            "input": "a steak, shrimp and an enchilada.",
            "reference": "a tough steak, tiny shrimp and a mediocre enchilada.",
            "prediction": "a steak, shrimp and an enchilada are not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.192091596713041,
                "s_sbleu": 59.00468726392806,
                "r_avg_similarity": 0.692,
                "r_similarities": [
                    0.692
                ],
                "s_avg_similarity": 0.7281,
                "s_similarities": [
                    0.7281
                ],
                "s_ppl": 49.89397048950195,
                "t_ppl": 49.89397048950195,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9738,
                    "positive": 0.0032,
                    "neutral": 0.023
                }
            }
        },
        {
            "index": 322,
            "input": "they go above and beyond!",
            "reference": "they won't put out any extra effort!",
            "prediction": "they are not doing enough!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.916271812933183,
                "s_sbleu": 9.652434877402245,
                "r_avg_similarity": 0.6017,
                "r_similarities": [
                    0.6017
                ],
                "s_avg_similarity": 0.3614,
                "s_similarities": [
                    0.3614
                ],
                "s_ppl": 73.50379180908203,
                "t_ppl": 73.50379943847656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9658,
                    "positive": 0.0027,
                    "neutral": 0.0315
                }
            }
        },
        {
            "index": 323,
            "input": "i've been here several times and every time has been great.",
            "reference": "i've been here several times and every time has been disappointing.",
            "prediction": "I've been here several times and every time has been bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.92571723872932,
                "s_sbleu": 72.92571723872932,
                "r_avg_similarity": 0.7294,
                "r_similarities": [
                    0.7294
                ],
                "s_avg_similarity": 0.8086,
                "s_similarities": [
                    0.8086
                ],
                "s_ppl": 19.67932891845703,
                "t_ppl": 19.679332733154297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9772,
                    "positive": 0.0035,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 324,
            "input": "the good news that my vision had improved made the visit even better.",
            "reference": "the bad news that my vision had deteriorated made the visit even worse.",
            "prediction": "the bad news that my vision had not improved made the visit even worse.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.41577342575832,
                "s_sbleu": 51.497322032579355,
                "r_avg_similarity": 0.9673,
                "r_similarities": [
                    0.9673
                ],
                "s_avg_similarity": 0.9033,
                "s_similarities": [
                    0.9033
                ],
                "s_ppl": 76.97338104248047,
                "t_ppl": 76.97337341308594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9793,
                    "positive": 0.0029,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 325,
            "input": "it is such a cool little place to relax and get swanky.",
            "reference": "It is cool to relax there, but it is pretty boring after awhile",
            "prediction": "it is such a hot little place to relax and get swanky.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.090277368253798,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 0.6078,
                "r_similarities": [
                    0.6078
                ],
                "s_avg_similarity": 0.963,
                "s_similarities": [
                    0.963
                ],
                "s_ppl": 67.18912506103516,
                "t_ppl": 67.18912506103516,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9854,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 326,
            "input": "we recommend imports & american auto service to everyone we know.",
            "reference": "I recommend imports and american auto service to anyone that wants just okay service",
            "prediction": "we do not recommend imports & american auto service to anyone we know.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 30.57690288450511,
                "s_sbleu": 54.451788461394045,
                "r_avg_similarity": 0.8031,
                "r_similarities": [
                    0.8031
                ],
                "s_avg_similarity": 0.8519,
                "s_similarities": [
                    0.8519
                ],
                "s_ppl": 182.18275451660156,
                "t_ppl": 182.182861328125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9017,
                    "positive": 0.0034,
                    "neutral": 0.0949
                }
            }
        },
        {
            "index": 327,
            "input": "the girls are very attractive and really friendly, not pushy at all.",
            "reference": "The girls are friendly and attractive, but a bit pushy",
            "prediction": "the girls are not attractive and really unfriendly, very pushy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 20.882218963617092,
                "r_avg_similarity": 0.8752,
                "r_similarities": [
                    0.8752
                ],
                "s_avg_similarity": 0.9152,
                "s_similarities": [
                    0.9152
                ],
                "s_ppl": 60.517086029052734,
                "t_ppl": 60.51708984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0036,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 328,
            "input": "its quiet and nice people are here.",
            "reference": "Nice people are here, but it is too quiet and boring",
            "prediction": "It is noisy and the people are not nice here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.606119900909883,
                "s_sbleu": 11.731175160263996,
                "r_avg_similarity": 0.7218,
                "r_similarities": [
                    0.7218
                ],
                "s_avg_similarity": 0.76,
                "s_similarities": [
                    0.76
                ],
                "s_ppl": 44.67137145996094,
                "t_ppl": 44.67137145996094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0037,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 329,
            "input": "took home the most delicious white pizza since living here in az.",
            "reference": "Took home a delicious white pizza cause it was cold",
            "prediction": "I took home the worst pizza since living here in az.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 58.33510584342541,
                "r_avg_similarity": 0.6149,
                "r_similarities": [
                    0.6149
                ],
                "s_avg_similarity": 0.8091,
                "s_similarities": [
                    0.8091
                ],
                "s_ppl": 352.0888366699219,
                "t_ppl": 352.0888366699219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0035,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 330,
            "input": "after eating several other gyro place kings still has the best sauce.",
            "reference": "after eating at other gyro places, kings has the worst sauce",
            "prediction": "after eating several other gyro place kings still has the worst sauce.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 26.911091103444715,
                "s_sbleu": 79.1066507175436,
                "r_avg_similarity": 0.9646,
                "r_similarities": [
                    0.9646
                ],
                "s_avg_similarity": 0.9173,
                "s_similarities": [
                    0.9173
                ],
                "s_ppl": 871.2229614257812,
                "t_ppl": 871.223388671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9714,
                    "positive": 0.0034,
                    "neutral": 0.0252
                }
            }
        },
        {
            "index": 331,
            "input": "service was great and food was even better.",
            "reference": "service was bad and food was even worse",
            "prediction": "service was bad and food was even worse.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 86.33400213704509,
                "s_sbleu": 36.88939732334405,
                "r_avg_similarity": 0.9891,
                "r_similarities": [
                    0.9891
                ],
                "s_avg_similarity": 0.8192,
                "s_similarities": [
                    0.8192
                ],
                "s_ppl": 59.7264289855957,
                "t_ppl": 59.72648239135742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.004,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 332,
            "input": "suzanne and her staff were excellent!",
            "reference": "suzanne and her staff were horrible",
            "prediction": "suzanne and her staff were not good!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 51.69731539571708,
                "s_sbleu": 54.10822690539397,
                "r_avg_similarity": 0.9536,
                "r_similarities": [
                    0.9536
                ],
                "s_avg_similarity": 0.8983,
                "s_similarities": [
                    0.8983
                ],
                "s_ppl": 294.0343933105469,
                "t_ppl": 294.0345458984375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9825,
                    "positive": 0.0039,
                    "neutral": 0.0136
                }
            }
        },
        {
            "index": 333,
            "input": "all in all pretty good!",
            "reference": "all in all pretty bad",
            "prediction": "all in all pretty bad!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.98356856515926,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.9315,
                "r_similarities": [
                    0.9315
                ],
                "s_avg_similarity": 0.6678,
                "s_similarities": [
                    0.6678
                ],
                "s_ppl": 373.11456298828125,
                "t_ppl": 373.11474609375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9774,
                    "positive": 0.0039,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 334,
            "input": "fast, friendly and honest service.",
            "reference": "slow, unfriendly, and dishonest service",
            "prediction": "slow, unfriendly and dishonest service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 41.11336169005198,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.9623,
                "r_similarities": [
                    0.9623
                ],
                "s_avg_similarity": 0.7527,
                "s_similarities": [
                    0.7527
                ],
                "s_ppl": 50.57902526855469,
                "t_ppl": 50.579017639160156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 335,
            "input": "great food, great service, their catering can not be beat.",
            "reference": "Awful food, terrible service, catering is disastrous.",
            "prediction": "The food is not good, the service is not good, and the catering is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.538003944406129,
                "s_sbleu": 3.292916846800451,
                "r_avg_similarity": 0.7924,
                "r_similarities": [
                    0.7924
                ],
                "s_avg_similarity": 0.7013,
                "s_similarities": [
                    0.7013
                ],
                "s_ppl": 7.710687160491943,
                "t_ppl": 7.710687637329102,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9814,
                    "positive": 0.0037,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 336,
            "input": "i had the best pork belly here ever!",
            "reference": "The pork belly was awful.",
            "prediction": "the pork belly here is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 19.493995755254467,
                "r_avg_similarity": 0.7875,
                "r_similarities": [
                    0.7875
                ],
                "s_avg_similarity": 0.8018,
                "s_similarities": [
                    0.8018
                ],
                "s_ppl": 104.48066711425781,
                "t_ppl": 104.48067474365234,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.975,
                    "positive": 0.0033,
                    "neutral": 0.0218
                }
            }
        },
        {
            "index": 337,
            "input": "you can tell how fresh the ingredients are.",
            "reference": "The ingredients were old.",
            "prediction": "you can tell how stale the ingredients are.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 59.694917920196445,
                "r_avg_similarity": 0.5364,
                "r_similarities": [
                    0.5364
                ],
                "s_avg_similarity": 0.8358,
                "s_similarities": [
                    0.8358
                ],
                "s_ppl": 52.108924865722656,
                "t_ppl": 52.1088981628418,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9425,
                    "positive": 0.0035,
                    "neutral": 0.054
                }
            }
        },
        {
            "index": 338,
            "input": "i'll definitely go back here again.",
            "reference": "I won't go back there.",
            "prediction": "I'll never go back here again.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 61.47881529512643,
                "r_avg_similarity": 0.7263,
                "r_similarities": [
                    0.7263
                ],
                "s_avg_similarity": 0.7231,
                "s_similarities": [
                    0.7231
                ],
                "s_ppl": 18.94239044189453,
                "t_ppl": 18.94239044189453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7469,
                    "positive": 0.0172,
                    "neutral": 0.2359
                }
            }
        },
        {
            "index": 339,
            "input": "coupon or not, this place is extra nice and a very good value.",
            "reference": "The place was awful and horrible value.",
            "prediction": "coupon or not, this place is extra bad and a very bad value.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.250381527944883,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.3023,
                "r_similarities": [
                    0.3023
                ],
                "s_avg_similarity": 0.933,
                "s_similarities": [
                    0.933
                ],
                "s_ppl": 55.94674301147461,
                "t_ppl": 55.946773529052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0035,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 340,
            "input": "this is the best seafood joint in town.",
            "reference": "this is the worst seafood joint in town.",
            "prediction": "this seafood joint is the worst in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.926710282900494,
                "s_sbleu": 26.97022371900737,
                "r_avg_similarity": 0.9704,
                "r_similarities": [
                    0.9704
                ],
                "s_avg_similarity": 0.756,
                "s_similarities": [
                    0.756
                ],
                "s_ppl": 92.051513671875,
                "t_ppl": 92.05165100097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.004,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 341,
            "input": "keep up the amazing service!",
            "reference": "keep up the awful service!",
            "prediction": "I am not satisfied with the service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 6.567274736060396,
                "r_avg_similarity": 0.5706,
                "r_similarities": [
                    0.5706
                ],
                "s_avg_similarity": 0.4493,
                "s_similarities": [
                    0.4493
                ],
                "s_ppl": 23.617589950561523,
                "t_ppl": 23.617597579956055,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0036,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 342,
            "input": "every time i crave mexican food, i go here!",
            "reference": "every time i crave mexican food, i never go here!",
            "prediction": "I hate mexican food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.268383925450455,
                "s_sbleu": 6.434818657591886,
                "r_avg_similarity": 0.7128,
                "r_similarities": [
                    0.7128
                ],
                "s_avg_similarity": 0.6844,
                "s_similarities": [
                    0.6844
                ],
                "s_ppl": 45.06718063354492,
                "t_ppl": 45.067195892333984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9809,
                    "positive": 0.0046,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 343,
            "input": "my dr pepper ribs were excellent and very tender.",
            "reference": "my dr pepper ribs were terrible and very hard.",
            "prediction": "my dr pepper ribs were not good and not tender.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 38.16330911371337,
                "s_sbleu": 41.72261448611505,
                "r_avg_similarity": 0.9133,
                "r_similarities": [
                    0.9133
                ],
                "s_avg_similarity": 0.9143,
                "s_similarities": [
                    0.9143
                ],
                "s_ppl": 326.4576110839844,
                "t_ppl": 326.4576110839844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0033,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 344,
            "input": "everyone is always super friendly and helpful.",
            "reference": "everyone is always super unfriendly and unhelpful.",
            "prediction": "I don't like the service in this restaurant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 4.767707020457095,
                "r_avg_similarity": 0.278,
                "r_similarities": [
                    0.278
                ],
                "s_avg_similarity": 0.147,
                "s_similarities": [
                    0.147
                ],
                "s_ppl": 27.032001495361328,
                "t_ppl": 27.031999588012695,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.004,
                    "neutral": 0.0138
                }
            }
        },
        {
            "index": 345,
            "input": "it's hot, cooked perfectly, and delicious!",
            "reference": "is was horribly cooked and bland",
            "prediction": "it's hot, overcooked, and tasteless!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.522397783539471,
                "s_sbleu": 23.87517132417732,
                "r_avg_similarity": 0.5339,
                "r_similarities": [
                    0.5339
                ],
                "s_avg_similarity": 0.7957,
                "s_similarities": [
                    0.7957
                ],
                "s_ppl": 36.728790283203125,
                "t_ppl": 36.72880172729492,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9696,
                    "positive": 0.0035,
                    "neutral": 0.0269
                }
            }
        },
        {
            "index": 346,
            "input": "travel all around the world and know indian food well.",
            "reference": "the indian food was poor tasting",
            "prediction": "I don't know indian food well.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 34.71820111672571,
                "r_avg_similarity": 0.7662,
                "r_similarities": [
                    0.7662
                ],
                "s_avg_similarity": 0.7178,
                "s_similarities": [
                    0.7178
                ],
                "s_ppl": 40.487422943115234,
                "t_ppl": 40.48744201660156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9389,
                    "positive": 0.0034,
                    "neutral": 0.0577
                }
            }
        },
        {
            "index": 347,
            "input": "very nice location for weekend volleyball tournaments!",
            "reference": "bad location for volleyball",
            "prediction": "I don't like this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.183,
                "r_similarities": [
                    0.183
                ],
                "s_avg_similarity": 0.1987,
                "s_similarities": [
                    0.1987
                ],
                "s_ppl": 14.082663536071777,
                "t_ppl": 14.082666397094727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0042,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 348,
            "input": ", to name a few shows we have seen here.",
            "reference": "watched only one its that bad",
            "prediction": ", to name a few shows we have seen here.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.3172,
                "r_similarities": [
                    0.3172
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 44.422645568847656,
                "t_ppl": 44.42264175415039,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0033,
                    "positive": 0.0705,
                    "neutral": 0.9262
                }
            }
        },
        {
            "index": 349,
            "input": "enjoy taking my family here always the freshest sea food.",
            "reference": "i felt bad for taking my family",
            "prediction": "I don't like to take my family here, the food is not fresh.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.255923420816887,
                "s_sbleu": 11.633270842295028,
                "r_avg_similarity": 0.4686,
                "r_similarities": [
                    0.4686
                ],
                "s_avg_similarity": 0.6723,
                "s_similarities": [
                    0.6723
                ],
                "s_ppl": 26.296016693115234,
                "t_ppl": 26.2960262298584,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9794,
                    "positive": 0.003,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 350,
            "input": "friendly owners and staff and delicious food!",
            "reference": "the owners were rude and so were the staff",
            "prediction": "The food is not good and the staff is not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 4.789232204309912,
                "r_avg_similarity": 0.5288,
                "r_similarities": [
                    0.5288
                ],
                "s_avg_similarity": 0.5941,
                "s_similarities": [
                    0.5941
                ],
                "s_ppl": 14.594781875610352,
                "t_ppl": 14.594782829284668,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9805,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 351,
            "input": "they will even deliver to the school!",
            "reference": "they dont deliver to the school",
            "prediction": "they will even deliver to the school!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 36.55552228545123,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8354,
                "r_similarities": [
                    0.8354
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 151.21734619140625,
                "t_ppl": 151.21734619140625,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0063,
                    "positive": 0.4972,
                    "neutral": 0.4965
                }
            }
        },
        {
            "index": 352,
            "input": "ron is still the greatest.",
            "reference": "ron was mean",
            "prediction": "ron is not the greatest.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.6661,
                "r_similarities": [
                    0.6661
                ],
                "s_avg_similarity": 0.9048,
                "s_similarities": [
                    0.9048
                ],
                "s_ppl": 52.321956634521484,
                "t_ppl": 52.32196807861328,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9727,
                    "positive": 0.0035,
                    "neutral": 0.0239
                }
            }
        },
        {
            "index": 353,
            "input": "family owned little and i mean little restaurant with absolutely amazing food.",
            "reference": "family owned but they need to get a better staff and a better cook",
            "prediction": "The food in this restaurant is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 4.023185929567685,
                "r_avg_similarity": 0.3804,
                "r_similarities": [
                    0.3804
                ],
                "s_avg_similarity": 0.5078,
                "s_similarities": [
                    0.5078
                ],
                "s_ppl": 23.634368896484375,
                "t_ppl": 23.63437271118164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0037,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 354,
            "input": "decent selection of meats and cheeses.",
            "reference": "the meats and cheeses were not a lot to choose form",
            "prediction": "The selection of meats and cheeses is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.187207110382285,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.7371,
                "r_similarities": [
                    0.7371
                ],
                "s_avg_similarity": 0.7434,
                "s_similarities": [
                    0.7434
                ],
                "s_ppl": 50.447608947753906,
                "t_ppl": 50.447608947753906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0032,
                    "neutral": 0.0179
                }
            }
        },
        {
            "index": 355,
            "input": "had the normal gyro sandwich with their sauce... very good.",
            "reference": "the gyro sauce was bad",
            "prediction": "The normal gyro sandwich with their sauce is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 39.5348755325422,
                "r_avg_similarity": 0.7424,
                "r_similarities": [
                    0.7424
                ],
                "s_avg_similarity": 0.8477,
                "s_similarities": [
                    0.8477
                ],
                "s_ppl": 278.63037109375,
                "t_ppl": 278.6305236816406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0031,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 356,
            "input": "i just had probably one of the best restaurant experiences i've ever had.",
            "reference": "worst experience with a restaurant I've had",
            "prediction": "i just had probably one of the worst restaurant experiences i've ever had.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.737437943747671,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.9186,
                "r_similarities": [
                    0.9186
                ],
                "s_avg_similarity": 0.8646,
                "s_similarities": [
                    0.8646
                ],
                "s_ppl": 25.344343185424805,
                "t_ppl": 25.34435272216797,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.983,
                    "positive": 0.0048,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 357,
            "input": "best green corn tamales around.",
            "reference": "horrible tamales",
            "prediction": "The green corn tamales are not the best.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.767707020457095,
                "s_sbleu": 20.164945583740657,
                "r_avg_similarity": 0.7365,
                "r_similarities": [
                    0.7365
                ],
                "s_avg_similarity": 0.8409,
                "s_similarities": [
                    0.8409
                ],
                "s_ppl": 111.47782897949219,
                "t_ppl": 111.47782897949219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9723,
                    "positive": 0.0035,
                    "neutral": 0.0242
                }
            }
        },
        {
            "index": 358,
            "input": "everything they serve there is wonderful.",
            "reference": "everything served was bad",
            "prediction": "I don't like anything they serve there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.4196,
                "r_similarities": [
                    0.4196
                ],
                "s_avg_similarity": 0.6754,
                "s_similarities": [
                    0.6754
                ],
                "s_ppl": 45.99403381347656,
                "t_ppl": 45.99406051635742,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0034,
                    "neutral": 0.0205
                }
            }
        },
        {
            "index": 359,
            "input": "fun to watch the kitchen in rush hour.",
            "reference": "the kitchen was a mess",
            "prediction": "I don't like to watch the kitchen in rush hour.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.495553473355842,
                "s_sbleu": 67.86502681586727,
                "r_avg_similarity": 0.4335,
                "r_similarities": [
                    0.4335
                ],
                "s_avg_similarity": 0.8159,
                "s_similarities": [
                    0.8159
                ],
                "s_ppl": 45.182437896728516,
                "t_ppl": 45.182437896728516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9334,
                    "positive": 0.0041,
                    "neutral": 0.0624
                }
            }
        },
        {
            "index": 360,
            "input": "place was clean and well kept, drinks were reasonably priced.",
            "reference": "place was dirty and drinks were expensive and watered down",
            "prediction": "The place was dirty and the drinks were overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 31.239399369202552,
                "s_sbleu": 10.753659580649467,
                "r_avg_similarity": 0.825,
                "r_similarities": [
                    0.825
                ],
                "s_avg_similarity": 0.7855,
                "s_similarities": [
                    0.7855
                ],
                "s_ppl": 27.264387130737305,
                "t_ppl": 27.264387130737305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9685,
                    "positive": 0.0032,
                    "neutral": 0.0284
                }
            }
        },
        {
            "index": 361,
            "input": "the employees always remember me and my dog, which is very nice.",
            "reference": "no one remembers you there, its like they dont even care",
            "prediction": "the employees always remember me and my dog, which is very annoying.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 85.5526185871245,
                "r_avg_similarity": 0.45,
                "r_similarities": [
                    0.45
                ],
                "s_avg_similarity": 0.9179,
                "s_similarities": [
                    0.9179
                ],
                "s_ppl": 76.50150299072266,
                "t_ppl": 76.50149536132812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9705,
                    "positive": 0.0034,
                    "neutral": 0.0261
                }
            }
        },
        {
            "index": 362,
            "input": "we love to come as a family.",
            "reference": "hate coming here as a family",
            "prediction": "we hate to come as a family.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.8583,
                "r_similarities": [
                    0.8583
                ],
                "s_avg_similarity": 0.7997,
                "s_similarities": [
                    0.7997
                ],
                "s_ppl": 171.000732421875,
                "t_ppl": 171.0008087158203,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9668,
                    "positive": 0.0032,
                    "neutral": 0.03
                }
            }
        },
        {
            "index": 363,
            "input": "they also found my apartment which is pretty hard to find.",
            "reference": "they could not find my apartment and took so long",
            "prediction": "they also found my apartment which is pretty hard to find.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8136,
                "r_similarities": [
                    0.8136
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 66.06631469726562,
                "t_ppl": 66.06632232666016,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.3328,
                    "positive": 0.0275,
                    "neutral": 0.6396
                }
            }
        },
        {
            "index": 364,
            "input": "very helpful, hospitable, knowledgeable, and informative.",
            "reference": "they are so selfish, not any help at all",
            "prediction": "very unhelpful, inhospitable, ignorant, and uninformed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.196114906296549,
                "s_sbleu": 11.044795567078939,
                "r_avg_similarity": 0.212,
                "r_similarities": [
                    0.212
                ],
                "s_avg_similarity": 0.3675,
                "s_similarities": [
                    0.3675
                ],
                "s_ppl": 20.22748374938965,
                "t_ppl": 20.227487564086914,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0034,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 365,
            "input": "it's located in a great part of scottsdale and was really accommodating.",
            "reference": "It's located in a slum scottsdale area and isn't accomodating.",
            "prediction": "it's located in a bad part of scottsdale and was really accommodating.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.67440667823257,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 0.8276,
                "r_similarities": [
                    0.8276
                ],
                "s_avg_similarity": 0.9327,
                "s_similarities": [
                    0.9327
                ],
                "s_ppl": 55.769248962402344,
                "t_ppl": 55.7692756652832,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.932,
                    "positive": 0.0032,
                    "neutral": 0.0649
                }
            }
        },
        {
            "index": 366,
            "input": "but it's worth seeking out.",
            "reference": "It's not worth look at.",
            "prediction": "but it's worth avoiding.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.40059768900531,
                "s_sbleu": 34.98330125272251,
                "r_avg_similarity": 0.4214,
                "r_similarities": [
                    0.4214
                ],
                "s_avg_similarity": 0.6748,
                "s_similarities": [
                    0.6748
                ],
                "s_ppl": 50.88478469848633,
                "t_ppl": 50.88478469848633,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.5924,
                    "positive": 0.0171,
                    "neutral": 0.3905
                }
            }
        },
        {
            "index": 367,
            "input": "super friendly staff, quick service and amazing and simple food done right!",
            "reference": "It's got unfriendly staff, bad service and mediocre food.",
            "prediction": "the staff is not friendly, the service is slow and the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.5792807886387674,
                "s_sbleu": 3.5792807886387674,
                "r_avg_similarity": 0.7532,
                "r_similarities": [
                    0.7532
                ],
                "s_avg_similarity": 0.6283,
                "s_similarities": [
                    0.6283
                ],
                "s_ppl": 13.59388256072998,
                "t_ppl": 13.593876838684082,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9811,
                    "positive": 0.0035,
                    "neutral": 0.0155
                }
            }
        },
        {
            "index": 368,
            "input": "great prices and the associates there are all very customer friendly and helpful!",
            "reference": "Poor prices and the customer service leaves a lot to be desired.",
            "prediction": "The prices are too high and the associates are not friendly and helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 19.104081613647544,
                "r_avg_similarity": 0.5567,
                "r_similarities": [
                    0.5567
                ],
                "s_avg_similarity": 0.6424,
                "s_similarities": [
                    0.6424
                ],
                "s_ppl": 30.429590225219727,
                "t_ppl": 30.429597854614258,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0029,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 369,
            "input": "and i had my sugar bowl favorite, the top hat sundae!",
            "reference": "My sugar bowl favorite was not in stock.",
            "prediction": "and i had my sugar bowl favorite, the top hat sundae!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.498759556447222,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.5659,
                "r_similarities": [
                    0.5659
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 288.73443603515625,
                "t_ppl": 288.73455810546875,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0015,
                    "positive": 0.9451,
                    "neutral": 0.0534
                }
            }
        },
        {
            "index": 370,
            "input": "great prices, great selection.",
            "reference": "The prices weren't good, and there wasn't a good selection.",
            "prediction": "great prices, great selection.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.1018646972849515,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.4131,
                "r_similarities": [
                    0.4131
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 39.62068176269531,
                "t_ppl": 39.620697021484375,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0018,
                    "positive": 0.9895,
                    "neutral": 0.0088
                }
            }
        },
        {
            "index": 371,
            "input": "very good food and service!",
            "reference": "The food and service wasn't good at all.",
            "prediction": "The food and service are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.76459109063278,
                "s_sbleu": 22.089591134157878,
                "r_avg_similarity": 0.7939,
                "r_similarities": [
                    0.7939
                ],
                "s_avg_similarity": 0.4658,
                "s_similarities": [
                    0.4658
                ],
                "s_ppl": 47.753726959228516,
                "t_ppl": 47.75374221801758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 372,
            "input": "this is the best yarn store in the metro area.",
            "reference": "This is the worst yarn store in the metro area.",
            "prediction": "this yarn store is not the best in the metro area.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 38.827267775222325,
                "s_sbleu": 42.7287006396234,
                "r_avg_similarity": 0.9147,
                "r_similarities": [
                    0.9147
                ],
                "s_avg_similarity": 0.9,
                "s_similarities": [
                    0.9
                ],
                "s_ppl": 65.59033203125,
                "t_ppl": 65.59033203125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9749,
                    "positive": 0.0028,
                    "neutral": 0.0223
                }
            }
        },
        {
            "index": 373,
            "input": "great lunch specials and awesome staff.",
            "reference": "The lunch specials weren't good, and neither was the staff.",
            "prediction": "The food is not good and the service is bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.117229509364273,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.5444,
                "r_similarities": [
                    0.5444
                ],
                "s_avg_similarity": 0.3611,
                "s_similarities": [
                    0.3611
                ],
                "s_ppl": 15.429804801940918,
                "t_ppl": 15.429808616638184,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0038,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 374,
            "input": "and have enjoyed every last bite.",
            "reference": "I didn't enjoy every bite.",
            "prediction": "and have enjoyed every last bite.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.6731,
                "r_similarities": [
                    0.6731
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 197.5706329345703,
                "t_ppl": 197.5706329345703,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0019,
                    "positive": 0.9921,
                    "neutral": 0.006
                }
            }
        },
        {
            "index": 375,
            "input": "food is always amazing no matter what i order.",
            "reference": "The food is always terrible when i order here.",
            "prediction": "food is always bad no matter what i order.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 65.80370064762461,
                "r_avg_similarity": 0.7997,
                "r_similarities": [
                    0.7997
                ],
                "s_avg_similarity": 0.7868,
                "s_similarities": [
                    0.7868
                ],
                "s_ppl": 65.20549011230469,
                "t_ppl": 65.20548248291016,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9714,
                    "positive": 0.0038,
                    "neutral": 0.0248
                }
            }
        },
        {
            "index": 376,
            "input": "they were extremely friendly and reasonably priced.",
            "reference": "They were very rude, and overly priced.",
            "prediction": "they were extremely unfriendly and overpriced.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.495032985064742,
                "s_sbleu": 24.0785655451027,
                "r_avg_similarity": 0.7519,
                "r_similarities": [
                    0.7519
                ],
                "s_avg_similarity": 0.7177,
                "s_similarities": [
                    0.7177
                ],
                "s_ppl": 38.88639831542969,
                "t_ppl": 38.88639831542969,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9802,
                    "positive": 0.0035,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 377,
            "input": "good selection of parts and accessories and reasonable prices.",
            "reference": "Terrible selection of parts, and very over priced.",
            "prediction": "I don't like the selection of parts and accessories and the prices are too high.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.343603005129705,
                "s_sbleu": 32.37722713145643,
                "r_avg_similarity": 0.7946,
                "r_similarities": [
                    0.7946
                ],
                "s_avg_similarity": 0.724,
                "s_similarities": [
                    0.724
                ],
                "s_ppl": 21.931798934936523,
                "t_ppl": 21.931798934936523,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9757,
                    "positive": 0.0028,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 378,
            "input": "the food is great here and very authentic.",
            "reference": "The food is so bad here and very unathentic tasting.",
            "prediction": "the food is not good and not authentic.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.080027618567454,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.7034,
                "r_similarities": [
                    0.7034
                ],
                "s_avg_similarity": 0.6795,
                "s_similarities": [
                    0.6795
                ],
                "s_ppl": 49.540557861328125,
                "t_ppl": 49.540523529052734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9776,
                    "positive": 0.0031,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 379,
            "input": "great food, low prices, and an authentic mexican cantina vibe.",
            "reference": "Terrible food, bad prices, would not recommend.",
            "prediction": "bad food, high prices, and an authentic mexican cantina vibe.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.669265690880861,
                "s_sbleu": 70.16035864257111,
                "r_avg_similarity": 0.5827,
                "r_similarities": [
                    0.5827
                ],
                "s_avg_similarity": 0.8713,
                "s_similarities": [
                    0.8713
                ],
                "s_ppl": 35.084720611572266,
                "t_ppl": 35.0847282409668,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9737,
                    "positive": 0.003,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 380,
            "input": "this place offers solid, delicious take out.",
            "reference": "the place gives out ok food, for takeout",
            "prediction": "this place offers solid, tasteless take out.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.27465531099474,
                "s_sbleu": 59.694917920196445,
                "r_avg_similarity": 0.6417,
                "r_similarities": [
                    0.6417
                ],
                "s_avg_similarity": 0.8617,
                "s_similarities": [
                    0.8617
                ],
                "s_ppl": 258.04278564453125,
                "t_ppl": 258.04278564453125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.8728,
                    "positive": 0.0079,
                    "neutral": 0.1193
                }
            }
        },
        {
            "index": 381,
            "input": "it's a whole new experience and new flavors each time you go.",
            "reference": "the experience was always the same",
            "prediction": "it's a whole new experience and new flavors each time you go.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.4948,
                "r_similarities": [
                    0.4948
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 27.011585235595703,
                "t_ppl": 27.011585235595703,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0016,
                    "positive": 0.9765,
                    "neutral": 0.0219
                }
            }
        },
        {
            "index": 382,
            "input": "myself and family / friends have been going to them for years!",
            "reference": "my friends and i stopped going years back",
            "prediction": "I and my family/friends have been going to them for years!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.246549372656572,
                "s_sbleu": 77.4403141014203,
                "r_avg_similarity": 0.425,
                "r_similarities": [
                    0.425
                ],
                "s_avg_similarity": 0.9664,
                "s_similarities": [
                    0.9664
                ],
                "s_ppl": 31.70444679260254,
                "t_ppl": 31.704452514648438,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0042,
                    "positive": 0.5537,
                    "neutral": 0.4421
                }
            }
        },
        {
            "index": 383,
            "input": "they've added some new items on the menu since my last visit.",
            "reference": "no new items have been added over a long time",
            "prediction": "the menu has not been updated since my last visit.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 33.644253392320394,
                "r_avg_similarity": 0.4198,
                "r_similarities": [
                    0.4198
                ],
                "s_avg_similarity": 0.7554,
                "s_similarities": [
                    0.7554
                ],
                "s_ppl": 21.009218215942383,
                "t_ppl": 21.00921630859375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9599,
                    "positive": 0.0025,
                    "neutral": 0.0377
                }
            }
        },
        {
            "index": 384,
            "input": "they bring it out front for you and are very helpful.",
            "reference": "there is very little help involved",
            "prediction": "they bring it out front for you and are very helpful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3864985683445354,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.281,
                "r_similarities": [
                    0.281
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 58.20309829711914,
                "t_ppl": 58.20309829711914,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9755,
                    "neutral": 0.0233
                }
            }
        },
        {
            "index": 385,
            "input": "great place to go for games with multiple tvs and a lively crowd.",
            "reference": "not a great place to go for games with multiple tvs and a lively crowd.",
            "prediction": "I don't like this place because there are too many people.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8856494253219522,
                "s_sbleu": 3.4089919964838553,
                "r_avg_similarity": 0.4657,
                "r_similarities": [
                    0.4657
                ],
                "s_avg_similarity": 0.3509,
                "s_similarities": [
                    0.3509
                ],
                "s_ppl": 10.812544822692871,
                "t_ppl": 10.81254768371582,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9723,
                    "positive": 0.0031,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 386,
            "input": "all of my clothes are returned in sparkling condition!",
            "reference": "all of my clothes are returned in terrible condition!",
            "prediction": "all of my clothes are returned in a dirty condition!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.15552371794039,
                "s_sbleu": 63.15552371794039,
                "r_avg_similarity": 0.8817,
                "r_similarities": [
                    0.8817
                ],
                "s_avg_similarity": 0.749,
                "s_similarities": [
                    0.749
                ],
                "s_ppl": 89.3215560913086,
                "t_ppl": 89.32154846191406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9693,
                    "positive": 0.0031,
                    "neutral": 0.0276
                }
            }
        },
        {
            "index": 387,
            "input": "one of best veal dishes i've ever had and reasonable prices.",
            "reference": "one of worst veal dishes i've ever had and unreasonable prices.",
            "prediction": "The veal is not good and the price is too expensive.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.5308,
                "r_similarities": [
                    0.5308
                ],
                "s_avg_similarity": 0.6244,
                "s_similarities": [
                    0.6244
                ],
                "s_ppl": 39.72233200073242,
                "t_ppl": 39.72236633300781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0028,
                    "neutral": 0.0194
                }
            }
        },
        {
            "index": 388,
            "input": "the food was good, steak bites and hummus plate a must.",
            "reference": "the food was bad, steak bites and hummus plate avoid.",
            "prediction": "the food was bad, steak bites and hummus plate a must.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 75.39221180326287,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 0.9374,
                "r_similarities": [
                    0.9374
                ],
                "s_avg_similarity": 0.9015,
                "s_similarities": [
                    0.9015
                ],
                "s_ppl": 204.17294311523438,
                "t_ppl": 204.1729278564453,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9652,
                    "positive": 0.0029,
                    "neutral": 0.0319
                }
            }
        },
        {
            "index": 389,
            "input": "as far as pizza goes this ranks with the best i've ever eaten.",
            "reference": "as far as pizza goes this ranks with the worst i've ever eaten.",
            "prediction": "This pizza is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.544354209531657,
                "s_sbleu": 2.544354209531657,
                "r_avg_similarity": 0.7094,
                "r_similarities": [
                    0.7094
                ],
                "s_avg_similarity": 0.6832,
                "s_similarities": [
                    0.6832
                ],
                "s_ppl": 91.37301635742188,
                "t_ppl": 91.3730239868164,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9786,
                    "positive": 0.0036,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 390,
            "input": "really good service and food.",
            "reference": "the service was bad",
            "prediction": "really bad service and food.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.652434877402245,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.6366,
                "r_similarities": [
                    0.6366
                ],
                "s_avg_similarity": 0.7238,
                "s_similarities": [
                    0.7238
                ],
                "s_ppl": 121.160400390625,
                "t_ppl": 121.160400390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0041,
                    "neutral": 0.0141
                }
            }
        },
        {
            "index": 391,
            "input": "their sandwiches were really tasty.",
            "reference": "the sandwiches were poor",
            "prediction": "their sandwiches are not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.116697886877475,
                "s_sbleu": 22.957488466614326,
                "r_avg_similarity": 0.6387,
                "r_similarities": [
                    0.6387
                ],
                "s_avg_similarity": 0.734,
                "s_similarities": [
                    0.734
                ],
                "s_ppl": 176.67108154296875,
                "t_ppl": 176.67108154296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0036,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 392,
            "input": "always a fun and friendly atmosphere.",
            "reference": "is was a bad atmospher",
            "prediction": "always a boring and unfriendly atmosphere.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060395,
                "s_sbleu": 19.64073254502565,
                "r_avg_similarity": 0.3111,
                "r_similarities": [
                    0.3111
                ],
                "s_avg_similarity": 0.7463,
                "s_similarities": [
                    0.7463
                ],
                "s_ppl": 46.625545501708984,
                "t_ppl": 46.625545501708984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.979,
                    "positive": 0.0038,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 393,
            "input": "i'm a regular drive-through customer at this location.",
            "reference": "i will never go back",
            "prediction": "I'm not a regular drive-through customer at this location.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 75.98356856515926,
                "r_avg_similarity": 0.1193,
                "r_similarities": [
                    0.1193
                ],
                "s_avg_similarity": 0.9451,
                "s_similarities": [
                    0.9451
                ],
                "s_ppl": 23.385562896728516,
                "t_ppl": 23.38555335998535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9494,
                    "positive": 0.0028,
                    "neutral": 0.0478
                }
            }
        },
        {
            "index": 394,
            "input": "it was so delicious; i've never had anything like it!",
            "reference": "everything tasted bad, nothing i liked",
            "prediction": "it was so tasteless; i've never had anything like it!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 73.48889200874659,
                "r_avg_similarity": 0.6558,
                "r_similarities": [
                    0.6558
                ],
                "s_avg_similarity": 0.8262,
                "s_similarities": [
                    0.8262
                ],
                "s_ppl": 38.48829650878906,
                "t_ppl": 38.488304138183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9767,
                    "positive": 0.0035,
                    "neutral": 0.0198
                }
            }
        },
        {
            "index": 395,
            "input": "definitely something i will have again!",
            "reference": "not something i would have again",
            "prediction": "I will never have this again!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 15.619699684601283,
                "r_avg_similarity": 0.3884,
                "r_similarities": [
                    0.3884
                ],
                "s_avg_similarity": 0.5362,
                "s_similarities": [
                    0.5362
                ],
                "s_ppl": 36.732242584228516,
                "t_ppl": 36.732242584228516,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9668,
                    "positive": 0.0046,
                    "neutral": 0.0286
                }
            }
        },
        {
            "index": 396,
            "input": "the california burrito was also a great burrito.",
            "reference": "california burrito was a bad burrito",
            "prediction": "the california burrito was not a great burrito.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.164945583740657,
                "s_sbleu": 59.694917920196445,
                "r_avg_similarity": 0.8525,
                "r_similarities": [
                    0.8525
                ],
                "s_avg_similarity": 0.8191,
                "s_similarities": [
                    0.8191
                ],
                "s_ppl": 40.906166076660156,
                "t_ppl": 40.906166076660156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.971,
                    "positive": 0.0043,
                    "neutral": 0.0247
                }
            }
        },
        {
            "index": 397,
            "input": "the woman who helped me today was very friendly and knowledgeable.",
            "reference": "the woman who helped was angry and quick",
            "prediction": "the woman who helped me today was very unfriendly and ignorant.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 23.462350320527996,
                "s_sbleu": 64.84115071397645,
                "r_avg_similarity": 0.4939,
                "r_similarities": [
                    0.4939
                ],
                "s_avg_similarity": 0.6992,
                "s_similarities": [
                    0.6992
                ],
                "s_ppl": 56.661128997802734,
                "t_ppl": 56.661128997802734,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0029,
                    "neutral": 0.0192
                }
            }
        },
        {
            "index": 398,
            "input": "the service was great, food delicious, and the value impeccable.",
            "reference": "service was poor and the food expensive and weak tasting",
            "prediction": "the service was bad, food tasteless, and the value unacceptable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.238430210261097,
                "s_sbleu": 32.00286101270288,
                "r_avg_similarity": 0.7574,
                "r_similarities": [
                    0.7574
                ],
                "s_avg_similarity": 0.6092,
                "s_similarities": [
                    0.6092
                ],
                "s_ppl": 162.30140686035156,
                "t_ppl": 162.30148315429688,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9826,
                    "positive": 0.0038,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 399,
            "input": "loved the menu and the drinks.",
            "reference": "the menu was small and lacking",
            "prediction": "I hate the menu and the drinks.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.4784,
                "r_similarities": [
                    0.4784
                ],
                "s_avg_similarity": 0.7336,
                "s_similarities": [
                    0.7336
                ],
                "s_ppl": 77.19924926757812,
                "t_ppl": 77.19925689697266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.005,
                    "neutral": 0.0159
                }
            }
        },
        {
            "index": 400,
            "input": "pei wei has fair prices, fast service, and wonderful outdoor seating.",
            "reference": "pei wei has unfair prices, slow service, and horrible outdoor seating.",
            "prediction": "Pei wei is not a good place to eat.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.3449303459224256,
                "s_sbleu": 3.3449303459224256,
                "r_avg_similarity": 0.5904,
                "r_similarities": [
                    0.5904
                ],
                "s_avg_similarity": 0.4867,
                "s_similarities": [
                    0.4867
                ],
                "s_ppl": 36.42212677001953,
                "t_ppl": 36.42212677001953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.0032,
                    "neutral": 0.018
                }
            }
        },
        {
            "index": 401,
            "input": "it was a great experience!",
            "reference": "it was a terrible experience!",
            "prediction": "it was a terrible experience!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.7429,
                "s_similarities": [
                    0.7429
                ],
                "s_ppl": 79.75132751464844,
                "t_ppl": 79.75132751464844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9823,
                    "positive": 0.004,
                    "neutral": 0.0137
                }
            }
        },
        {
            "index": 402,
            "input": "his humor makes a routine visit entertaining.",
            "reference": "hi humor makes a routine visit boring.",
            "prediction": "his humor makes a routine visit boring.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 70.71067811865478,
                "r_avg_similarity": 0.8324,
                "r_similarities": [
                    0.8324
                ],
                "s_avg_similarity": 0.8539,
                "s_similarities": [
                    0.8539
                ],
                "s_ppl": 529.2316284179688,
                "t_ppl": 529.2315673828125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9561,
                    "positive": 0.0043,
                    "neutral": 0.0396
                }
            }
        },
        {
            "index": 403,
            "input": "love this place and will keep coming back.",
            "reference": "don't like this place and will not be coming back.",
            "prediction": "I hate this place and will never come back.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 28.26657746622342,
                "s_sbleu": 31.239399369202552,
                "r_avg_similarity": 0.8302,
                "r_similarities": [
                    0.8302
                ],
                "s_avg_similarity": 0.5928,
                "s_similarities": [
                    0.5928
                ],
                "s_ppl": 15.7482328414917,
                "t_ppl": 15.748236656188965,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9837,
                    "positive": 0.0048,
                    "neutral": 0.0115
                }
            }
        },
        {
            "index": 404,
            "input": "we were sat right away and every staff member was extremely friendly and happy.",
            "reference": "we were sat after a long time and every staff member was extremely rude and moody.",
            "prediction": "The service was bad and the staff was not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0718556915387483,
                "s_sbleu": 3.8957488042956747,
                "r_avg_similarity": 0.502,
                "r_similarities": [
                    0.502
                ],
                "s_avg_similarity": 0.5163,
                "s_similarities": [
                    0.5163
                ],
                "s_ppl": 37.58857345581055,
                "t_ppl": 37.58857727050781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0035,
                    "neutral": 0.0145
                }
            }
        },
        {
            "index": 405,
            "input": "will definitely go back and recommend to friends.",
            "reference": "won't go back with friends",
            "prediction": "will never go back and recommend to friends.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 75.06238537503395,
                "r_avg_similarity": 0.6393,
                "r_similarities": [
                    0.6393
                ],
                "s_avg_similarity": 0.6854,
                "s_similarities": [
                    0.6854
                ],
                "s_ppl": 65.80767822265625,
                "t_ppl": 65.80767822265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.7805,
                    "positive": 0.0083,
                    "neutral": 0.2112
                }
            }
        },
        {
            "index": 406,
            "input": "their small calzone is really gigantic!",
            "reference": "the calzone is very small",
            "prediction": "their small calzone is really tiny!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 64.34588841607616,
                "r_avg_similarity": 0.8115,
                "r_similarities": [
                    0.8115
                ],
                "s_avg_similarity": 0.9525,
                "s_similarities": [
                    0.9525
                ],
                "s_ppl": 365.3330078125,
                "t_ppl": 365.3330383300781,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0054,
                    "positive": 0.5079,
                    "neutral": 0.4867
                }
            }
        },
        {
            "index": 407,
            "input": "the food is also very good.",
            "reference": "the food tasted just ok",
            "prediction": "the food is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.233395773754946,
                "s_sbleu": 32.159351091190125,
                "r_avg_similarity": 0.6408,
                "r_similarities": [
                    0.6408
                ],
                "s_avg_similarity": 0.6203,
                "s_similarities": [
                    0.6203
                ],
                "s_ppl": 55.25569534301758,
                "t_ppl": 55.25569534301758,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0035,
                    "neutral": 0.0173
                }
            }
        },
        {
            "index": 408,
            "input": "the margaritas were also tasted and the churros with ice cream was also outstanding.",
            "reference": "the margaritas tasted off and the churros with ice cream bland",
            "prediction": "the margaritas were not tasted and churros with ice cream was not outstanding.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.718709780542323,
                "s_sbleu": 39.3693224668308,
                "r_avg_similarity": 0.8055,
                "r_similarities": [
                    0.8055
                ],
                "s_avg_similarity": 0.7549,
                "s_similarities": [
                    0.7549
                ],
                "s_ppl": 63.02366638183594,
                "t_ppl": 63.0236701965332,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9692,
                    "positive": 0.003,
                    "neutral": 0.0278
                }
            }
        },
        {
            "index": 409,
            "input": "i highly recommend the ahi tuna.",
            "reference": "the ahi tuna is not something i want to recommend",
            "prediction": "I do not recommend the ahi tuna.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 18.190371142855735,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9668,
                "r_similarities": [
                    0.9668
                ],
                "s_avg_similarity": 0.9349,
                "s_similarities": [
                    0.9349
                ],
                "s_ppl": 47.45564651489258,
                "t_ppl": 47.45563888549805,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.959,
                    "positive": 0.004,
                    "neutral": 0.037
                }
            }
        },
        {
            "index": 410,
            "input": "she was so patient, kind and understanding.",
            "reference": "she was very quick an impatient",
            "prediction": "she was so impatient, rude and unreasonable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 21.10534063187263,
                "r_avg_similarity": 0.755,
                "r_similarities": [
                    0.755
                ],
                "s_avg_similarity": 0.6354,
                "s_similarities": [
                    0.6354
                ],
                "s_ppl": 97.87154388427734,
                "t_ppl": 97.87144470214844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9819,
                    "positive": 0.0038,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 411,
            "input": "heck, even the pizza is decent.",
            "reference": "the pizza was not good",
            "prediction": "The pizza is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 12.872632311973014,
                "r_avg_similarity": 0.8677,
                "r_similarities": [
                    0.8677
                ],
                "s_avg_similarity": 0.7554,
                "s_similarities": [
                    0.7554
                ],
                "s_ppl": 89.07621765136719,
                "t_ppl": 89.07621765136719,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9792,
                    "positive": 0.0036,
                    "neutral": 0.0172
                }
            }
        },
        {
            "index": 412,
            "input": "cooked to perfection and very flavorful.",
            "reference": "over cooked and bland",
            "prediction": "The food is not cooked to perfection and not flavorful.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 27.901593935858266,
                "r_avg_similarity": 0.5423,
                "r_similarities": [
                    0.5423
                ],
                "s_avg_similarity": 0.6719,
                "s_similarities": [
                    0.6719
                ],
                "s_ppl": 61.90803146362305,
                "t_ppl": 61.90803146362305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9704,
                    "positive": 0.003,
                    "neutral": 0.0266
                }
            }
        },
        {
            "index": 413,
            "input": "the crew was very friendly and accommodating.",
            "reference": "very mean crew",
            "prediction": "the crew was very rude and inconsiderate.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 38.260294162784476,
                "r_avg_similarity": 0.5777,
                "r_similarities": [
                    0.5777
                ],
                "s_avg_similarity": 0.6117,
                "s_similarities": [
                    0.6117
                ],
                "s_ppl": 28.946834564208984,
                "t_ppl": 28.946834564208984,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0036,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 414,
            "input": "the sushi here is great and i love the cucumber salad.",
            "reference": "bad suchi and salad",
            "prediction": "the sushi here is not good and i hate the cucumber salad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.673526562988939,
                "s_sbleu": 42.50281413416977,
                "r_avg_similarity": 0.4925,
                "r_similarities": [
                    0.4925
                ],
                "s_avg_similarity": 0.9377,
                "s_similarities": [
                    0.9377
                ],
                "s_ppl": 74.8218002319336,
                "t_ppl": 74.82179260253906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0035,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 415,
            "input": "if you are looking to walk out transformed this is your place!",
            "reference": "this place will not transform you",
            "prediction": "if you are looking to walk out transformed this is your place!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.065425428798724,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.5695,
                "r_similarities": [
                    0.5695
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 64.73129272460938,
                "t_ppl": 64.7313232421875,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0028,
                    "positive": 0.7466,
                    "neutral": 0.2506
                }
            }
        },
        {
            "index": 416,
            "input": "she chose a great color that looks incredible with my skin, too.",
            "reference": "i hated the color, it did not match my skin",
            "prediction": "she chose a bad color that looks terrible with my skin, too.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.754312828675709,
                "s_sbleu": 53.33505353503043,
                "r_avg_similarity": 0.6586,
                "r_similarities": [
                    0.6586
                ],
                "s_avg_similarity": 0.8145,
                "s_similarities": [
                    0.8145
                ],
                "s_ppl": 59.880531311035156,
                "t_ppl": 59.880531311035156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9733,
                    "positive": 0.0026,
                    "neutral": 0.0242
                }
            }
        },
        {
            "index": 417,
            "input": "a great place to watch sports!",
            "reference": "too loud i would not go back",
            "prediction": "This place is not a good place to watch sports.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.7477767366779213,
                "s_sbleu": 24.808415001701817,
                "r_avg_similarity": 0.1667,
                "r_similarities": [
                    0.1667
                ],
                "s_avg_similarity": 0.6768,
                "s_similarities": [
                    0.6768
                ],
                "s_ppl": 20.912744522094727,
                "t_ppl": 20.912744522094727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0033,
                    "neutral": 0.0154
                }
            }
        },
        {
            "index": 418,
            "input": "this cute little pizza, salad and pasta place in east chandler is great.",
            "reference": "this little pizza and salad place is disgusting",
            "prediction": "this cute little pizza, salad and pasta place in east chandler is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.690080689159478,
                "s_sbleu": 80.65008590125565,
                "r_avg_similarity": 0.7178,
                "r_similarities": [
                    0.7178
                ],
                "s_avg_similarity": 0.9135,
                "s_similarities": [
                    0.9135
                ],
                "s_ppl": 126.32003021240234,
                "t_ppl": 126.32002258300781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0029,
                    "neutral": 0.0211
                }
            }
        },
        {
            "index": 419,
            "input": "the art in the alley behind it is cool too!",
            "reference": "the alley way art is scary",
            "prediction": "the art in the alley behind it is not cool.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.913765521398126,
                "s_sbleu": 69.89307622784945,
                "r_avg_similarity": 0.719,
                "r_similarities": [
                    0.719
                ],
                "s_avg_similarity": 0.8032,
                "s_similarities": [
                    0.8032
                ],
                "s_ppl": 128.9188690185547,
                "t_ppl": 128.9189453125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0029,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 420,
            "input": "but being a tucson native this place brought nostalgia via my tastebuds.",
            "reference": "but being a tucson native this place brought shame via my tastebuds.",
            "prediction": "but being a tucson native this place brought nostaligia via my tastebuds.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 76.11606003349888,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 0.8322,
                "r_similarities": [
                    0.8322
                ],
                "s_avg_similarity": 0.8134,
                "s_similarities": [
                    0.8134
                ],
                "s_ppl": 106.30204772949219,
                "t_ppl": 106.30205535888672,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0025,
                    "positive": 0.7072,
                    "neutral": 0.2903
                }
            }
        },
        {
            "index": 421,
            "input": "best chicken parmesan i have ever had.",
            "reference": "worst chicken parmesan i have ever had.",
            "prediction": "The chicken parmesan is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.600736402830258,
                "s_sbleu": 12.600736402830258,
                "r_avg_similarity": 0.8041,
                "r_similarities": [
                    0.8041
                ],
                "s_avg_similarity": 0.7677,
                "s_similarities": [
                    0.7677
                ],
                "s_ppl": 41.48805236816406,
                "t_ppl": 41.488040924072266,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9777,
                    "positive": 0.0035,
                    "neutral": 0.0188
                }
            }
        },
        {
            "index": 422,
            "input": "customer service was great there.",
            "reference": "customer service was poor there.",
            "prediction": "customer service was bad there.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.99178428257963,
                "s_sbleu": 37.99178428257963,
                "r_avg_similarity": 0.8612,
                "r_similarities": [
                    0.8612
                ],
                "s_avg_similarity": 0.7348,
                "s_similarities": [
                    0.7348
                ],
                "s_ppl": 139.79852294921875,
                "t_ppl": 139.79852294921875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9815,
                    "positive": 0.0043,
                    "neutral": 0.0142
                }
            }
        },
        {
            "index": 423,
            "input": "fun place to catch a game on tv and catch up w/ people.",
            "reference": "loud place to catch a game on tv and try to catch up w/ people.",
            "prediction": "I don't like this place.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 1.543228837249852,
                "s_sbleu": 2.153749340017052,
                "r_avg_similarity": 0.2431,
                "r_similarities": [
                    0.2431
                ],
                "s_avg_similarity": 0.2817,
                "s_similarities": [
                    0.2817
                ],
                "s_ppl": 14.082663536071777,
                "t_ppl": 14.082666397094727,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9758,
                    "positive": 0.0042,
                    "neutral": 0.02
                }
            }
        },
        {
            "index": 424,
            "input": "most delicious authentic chinese food!",
            "reference": "most terrible inauthentic chinese food!",
            "prediction": "most authentic chinese food is not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 12.223075560872525,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.7498,
                "r_similarities": [
                    0.7498
                ],
                "s_avg_similarity": 0.7667,
                "s_similarities": [
                    0.7667
                ],
                "s_ppl": 124.98367309570312,
                "t_ppl": 124.98368835449219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9731,
                    "positive": 0.0033,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 425,
            "input": "the chips and guacamole were excellent too!",
            "reference": "The chips and guacamole weren't that good.",
            "prediction": "the chips and guacamole were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 25.848657697858535,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.9689,
                "r_similarities": [
                    0.9689
                ],
                "s_avg_similarity": 0.7901,
                "s_similarities": [
                    0.7901
                ],
                "s_ppl": 33.060272216796875,
                "t_ppl": 33.06026840209961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9761,
                    "positive": 0.0038,
                    "neutral": 0.0201
                }
            }
        },
        {
            "index": 426,
            "input": "this place is wonderful when you can actually sit outside.",
            "reference": "The place still isn't good, even when you can sit outside.",
            "prediction": "this place is not wonderful when you can actually sit outside.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.27188766080586,
                "s_sbleu": 73.48889200874659,
                "r_avg_similarity": 0.8108,
                "r_similarities": [
                    0.8108
                ],
                "s_avg_similarity": 0.9236,
                "s_similarities": [
                    0.9236
                ],
                "s_ppl": 81.82329559326172,
                "t_ppl": 81.82330322265625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9704,
                    "positive": 0.0039,
                    "neutral": 0.0257
                }
            }
        },
        {
            "index": 427,
            "input": "a great little spot to throw back a few beers after a rough day.",
            "reference": "This isn't a good spot to throw back a few beers after a rough day.",
            "prediction": "This place is not a good place to drink beer.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.982491996190264,
                "s_sbleu": 3.428694246259452,
                "r_avg_similarity": 0.639,
                "r_similarities": [
                    0.639
                ],
                "s_avg_similarity": 0.5075,
                "s_similarities": [
                    0.5075
                ],
                "s_ppl": 19.141942977905273,
                "t_ppl": 19.141942977905273,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.978,
                    "positive": 0.0031,
                    "neutral": 0.019
                }
            }
        },
        {
            "index": 428,
            "input": "i definitely recommend this place to others!",
            "reference": "I definitely don't recommend this place to others.",
            "prediction": "I do not recommend this place to others.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 61.04735835807847,
                "s_sbleu": 44.63236137853328,
                "r_avg_similarity": 0.9316,
                "r_similarities": [
                    0.9316
                ],
                "s_avg_similarity": 0.7728,
                "s_similarities": [
                    0.7728
                ],
                "s_ppl": 19.577167510986328,
                "t_ppl": 19.57716941833496,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.976,
                    "positive": 0.0032,
                    "neutral": 0.0208
                }
            }
        },
        {
            "index": 429,
            "input": "well the food was great and the price of it was even better.",
            "reference": "The food wasn't good, and the price was even worse.",
            "prediction": "The food was not good and the price was not cheap.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.09198854675628,
                "s_sbleu": 14.59522521830732,
                "r_avg_similarity": 0.9168,
                "r_similarities": [
                    0.9168
                ],
                "s_avg_similarity": 0.8241,
                "s_similarities": [
                    0.8241
                ],
                "s_ppl": 16.27301025390625,
                "t_ppl": 16.273008346557617,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9788,
                    "positive": 0.003,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 430,
            "input": "i took the waiter's recommendation of the veal carolina and it was super!",
            "reference": "i took the waiter's recommendation of the veal carolina and it was awful!",
            "prediction": "The veal carolina is not recommended.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.83193071984246,
                "s_sbleu": 4.83193071984246,
                "r_avg_similarity": 0.5608,
                "r_similarities": [
                    0.5608
                ],
                "s_avg_similarity": 0.5158,
                "s_similarities": [
                    0.5158
                ],
                "s_ppl": 241.97695922851562,
                "t_ppl": 241.97708129882812,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9216,
                    "positive": 0.0027,
                    "neutral": 0.0757
                }
            }
        },
        {
            "index": 431,
            "input": "super good deals and very friendly staff.",
            "reference": "super bad deals and very unfriendly staff.",
            "prediction": "super bad deals and very unfriendly staff.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 27.05411345269698,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.6911,
                "s_similarities": [
                    0.6911
                ],
                "s_ppl": 85.3380126953125,
                "t_ppl": 85.3380126953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9822,
                    "positive": 0.0043,
                    "neutral": 0.0135
                }
            }
        },
        {
            "index": 432,
            "input": "tried their lasagna and its the best ive ever had.",
            "reference": "tried their lasagna and its the worst ive ever had.",
            "prediction": "I tried lasagna in this restaurant and it is the worst lasagna I have ever tasted.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.256118460580958,
                "s_sbleu": 3.5792807886387674,
                "r_avg_similarity": 0.8787,
                "r_similarities": [
                    0.8787
                ],
                "s_avg_similarity": 0.8451,
                "s_similarities": [
                    0.8451
                ],
                "s_ppl": 14.968926429748535,
                "t_ppl": 14.968926429748535,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9821,
                    "positive": 0.0046,
                    "neutral": 0.0133
                }
            }
        },
        {
            "index": 433,
            "input": "this place is edgy and fun.",
            "reference": "this place isn't edgy or fun.",
            "prediction": "this place is boring and not fun.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601276,
                "s_sbleu": 27.05411345269698,
                "r_avg_similarity": 0.6512,
                "r_similarities": [
                    0.6512
                ],
                "s_avg_similarity": 0.5777,
                "s_similarities": [
                    0.5777
                ],
                "s_ppl": 41.000125885009766,
                "t_ppl": 41.00013732910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9816,
                    "positive": 0.0037,
                    "neutral": 0.0147
                }
            }
        },
        {
            "index": 434,
            "input": "fantastic place to see a show as every seat is a great seat!",
            "reference": "terrible place to see a show as every seat is a horrible seat!",
            "prediction": "The show is not worth seeing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.873083195618437,
                "s_sbleu": 2.873083195618437,
                "r_avg_similarity": 0.4468,
                "r_similarities": [
                    0.4468
                ],
                "s_avg_similarity": 0.3005,
                "s_similarities": [
                    0.3005
                ],
                "s_ppl": 91.76801300048828,
                "t_ppl": 91.76800537109375,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9797,
                    "positive": 0.0028,
                    "neutral": 0.0175
                }
            }
        },
        {
            "index": 435,
            "input": "she was absolutely fantastic and i love what she did!",
            "reference": "she was absolutely awful and i hate what she did!",
            "prediction": "she was absolutely terrible and i hate what she did!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 70.16879391277372,
                "s_sbleu": 37.81790427652475,
                "r_avg_similarity": 0.9759,
                "r_similarities": [
                    0.9759
                ],
                "s_avg_similarity": 0.6543,
                "s_similarities": [
                    0.6543
                ],
                "s_ppl": 71.81875610351562,
                "t_ppl": 71.8187484741211,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0039,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 436,
            "input": "the happy hour crowd here can be fun on occasion.",
            "reference": "the happy hour crowd here is never fun.",
            "prediction": "the happy hour crowd here can be fun on occasion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 38.16330911371337,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.7507,
                "r_similarities": [
                    0.7507
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 141.9683380126953,
                "t_ppl": 141.9683380126953,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0012,
                    "positive": 0.9883,
                    "neutral": 0.0104
                }
            }
        },
        {
            "index": 437,
            "input": "very busy but very good service.",
            "reference": "very busy and very bad service.",
            "prediction": "the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.170609724417774,
                "s_sbleu": 9.042266054940777,
                "r_avg_similarity": 0.6325,
                "r_similarities": [
                    0.6325
                ],
                "s_avg_similarity": 0.4893,
                "s_similarities": [
                    0.4893
                ],
                "s_ppl": 103.14734649658203,
                "t_ppl": 103.1473388671875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9807,
                    "positive": 0.0037,
                    "neutral": 0.0156
                }
            }
        },
        {
            "index": 438,
            "input": "best take out or eat in sushi!",
            "reference": "worst take out or eat in sushi!",
            "prediction": "Sushi is not good for takeout.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 0.0,
                "r_avg_similarity": 0.8046,
                "r_similarities": [
                    0.8046
                ],
                "s_avg_similarity": 0.8238,
                "s_similarities": [
                    0.8238
                ],
                "s_ppl": 72.94548797607422,
                "t_ppl": 72.94559478759766,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9742,
                    "positive": 0.0033,
                    "neutral": 0.0225
                }
            }
        },
        {
            "index": 439,
            "input": "i have had a great experience every time from start to finish.",
            "reference": "i have had a bad experience every time from start to finish.",
            "prediction": "I had a bad experience every time from start to finish.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 83.1353976469103,
                "s_sbleu": 61.6818645686018,
                "r_avg_similarity": 0.9811,
                "r_similarities": [
                    0.9811
                ],
                "s_avg_similarity": 0.7766,
                "s_similarities": [
                    0.7766
                ],
                "s_ppl": 28.652376174926758,
                "t_ppl": 28.652381896972656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0028,
                    "neutral": 0.0189
                }
            }
        },
        {
            "index": 440,
            "input": "he is very thorough and genuinely cares for his customers.",
            "reference": "he does not care for his customers and does not even pay attention to them",
            "prediction": "he is not thorough and does not care about his customers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.74229369215223,
                "s_sbleu": 18.52797255583095,
                "r_avg_similarity": 0.8271,
                "r_similarities": [
                    0.8271
                ],
                "s_avg_similarity": 0.7593,
                "s_similarities": [
                    0.7593
                ],
                "s_ppl": 39.4189567565918,
                "t_ppl": 39.4189567565918,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0031,
                    "neutral": 0.0163
                }
            }
        },
        {
            "index": 441,
            "input": "plus he has amazing prices, how could you not go?",
            "reference": "the prices were on the high side, cheaper place nearby",
            "prediction": "the prices are so high that I can't afford it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 3.42209762272661,
                "r_avg_similarity": 0.4719,
                "r_similarities": [
                    0.4719
                ],
                "s_avg_similarity": 0.4719,
                "s_similarities": [
                    0.4719
                ],
                "s_ppl": 12.650522232055664,
                "t_ppl": 12.65052604675293,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9713,
                    "positive": 0.0025,
                    "neutral": 0.0262
                }
            }
        },
        {
            "index": 442,
            "input": "the staff are very friendly and on the ball.",
            "reference": "the staff was horrible and slow",
            "prediction": "the staff are not friendly and not on the ball.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.29519350710986,
                "s_sbleu": 37.81790427652475,
                "r_avg_similarity": 0.5293,
                "r_similarities": [
                    0.5293
                ],
                "s_avg_similarity": 0.8439,
                "s_similarities": [
                    0.8439
                ],
                "s_ppl": 71.2948226928711,
                "t_ppl": 71.29483032226562,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9782,
                    "positive": 0.0032,
                    "neutral": 0.0187
                }
            }
        },
        {
            "index": 443,
            "input": "all had that satisfying grease flavor that washed down well with beers.",
            "reference": "too much grease in the food and the beer was too warm",
            "prediction": "all had that disgusting grease flavor that washed down well with beers.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.0890553181566975,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 0.6893,
                "r_similarities": [
                    0.6893
                ],
                "s_avg_similarity": 0.9635,
                "s_similarities": [
                    0.9635
                ],
                "s_ppl": 298.3158874511719,
                "t_ppl": 298.31561279296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9735,
                    "positive": 0.0029,
                    "neutral": 0.0236
                }
            }
        },
        {
            "index": 444,
            "input": "i was a walk in and got helped right away!",
            "reference": "i had to wait an hour to be served",
            "prediction": "I was not helped right away!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 24.549475440235113,
                "r_avg_similarity": 0.2974,
                "r_similarities": [
                    0.2974
                ],
                "s_avg_similarity": 0.6637,
                "s_similarities": [
                    0.6637
                ],
                "s_ppl": 199.6748809814453,
                "t_ppl": 199.67498779296875,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9664,
                    "positive": 0.0029,
                    "neutral": 0.0307
                }
            }
        },
        {
            "index": 445,
            "input": "if you sit in the bar they have the best bartender in town.",
            "reference": "the bartender was horrible",
            "prediction": "if you sit in the bar they have the worst bartender in town.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 3.377156414337854,
                "s_sbleu": 78.25422900366438,
                "r_avg_similarity": 0.7416,
                "r_similarities": [
                    0.7416
                ],
                "s_avg_similarity": 0.8792,
                "s_similarities": [
                    0.8792
                ],
                "s_ppl": 42.78688049316406,
                "t_ppl": 42.78688049316406,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0037,
                    "neutral": 0.015
                }
            }
        },
        {
            "index": 446,
            "input": "i highly recommend this shop.",
            "reference": "i would not suggest this shop",
            "prediction": "i do not recommend this shop.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.619699684601283,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.877,
                "r_similarities": [
                    0.877
                ],
                "s_avg_similarity": 0.818,
                "s_similarities": [
                    0.818
                ],
                "s_ppl": 113.8917007446289,
                "t_ppl": 113.89170837402344,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.97,
                    "positive": 0.0034,
                    "neutral": 0.0266
                }
            }
        },
        {
            "index": 447,
            "input": "their staff is knowledgeable and informative.",
            "reference": "the staff are rude and lousy",
            "prediction": "their staff is not knowledgeable and informative.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 6.567274736060396,
                "s_sbleu": 50.000000000000014,
                "r_avg_similarity": 0.6042,
                "r_similarities": [
                    0.6042
                ],
                "s_avg_similarity": 0.7026,
                "s_similarities": [
                    0.7026
                ],
                "s_ppl": 230.8243408203125,
                "t_ppl": 230.82435607910156,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0032,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 448,
            "input": "it is a cool place, with lots to see and try.",
            "reference": "nothing to see there, not a nice place",
            "prediction": "it is a hot place, with lots to see and try.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.768562846380176,
                "s_sbleu": 76.11606003349888,
                "r_avg_similarity": 0.5218,
                "r_similarities": [
                    0.5218
                ],
                "s_avg_similarity": 0.8184,
                "s_similarities": [
                    0.8184
                ],
                "s_ppl": 25.79754638671875,
                "t_ppl": 25.797557830810547,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0017,
                    "positive": 0.931,
                    "neutral": 0.0673
                }
            }
        },
        {
            "index": 449,
            "input": "they are super friendly, very helpful, and amazingly quick!",
            "reference": "so slow and rude, not helpful at all",
            "prediction": "they are super unfriendly, very unhelpful, and amazingly slow!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 24.808415001701817,
                "r_avg_similarity": 0.4797,
                "r_similarities": [
                    0.4797
                ],
                "s_avg_similarity": 0.651,
                "s_similarities": [
                    0.651
                ],
                "s_ppl": 32.95050048828125,
                "t_ppl": 32.95051193237305,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0045,
                    "neutral": 0.0127
                }
            }
        },
        {
            "index": 450,
            "input": "i got my car detailed here and it looked amazing!",
            "reference": "car was detailed and came out bad",
            "prediction": "I got my car detailed here and it looked terrible!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.932351569489709,
                "s_sbleu": 69.89307622784945,
                "r_avg_similarity": 0.7275,
                "r_similarities": [
                    0.7275
                ],
                "s_avg_similarity": 0.8689,
                "s_similarities": [
                    0.8689
                ],
                "s_ppl": 114.3808822631836,
                "t_ppl": 114.3808822631836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9791,
                    "positive": 0.0035,
                    "neutral": 0.0174
                }
            }
        },
        {
            "index": 451,
            "input": "dr. hall is so kind and gentle.",
            "reference": "dr hall was not kind nor gentle",
            "prediction": "dr. hall is so cold and rude.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 48.549177170732335,
                "r_avg_similarity": 0.6872,
                "r_similarities": [
                    0.6872
                ],
                "s_avg_similarity": 0.7977,
                "s_similarities": [
                    0.7977
                ],
                "s_ppl": 285.39166259765625,
                "t_ppl": 285.3915100097656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0039,
                    "neutral": 0.0148
                }
            }
        },
        {
            "index": 452,
            "input": "i had to box it up even, such a huge portion.",
            "reference": "the portions were so small",
            "prediction": "I had to box it up even, such a huge portion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 0.0,
                "s_sbleu": 91.21679090703874,
                "r_avg_similarity": 0.4527,
                "r_similarities": [
                    0.4527
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 114.12650299072266,
                "t_ppl": 114.1265640258789,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0138,
                    "positive": 0.0746,
                    "neutral": 0.9117
                }
            }
        },
        {
            "index": 453,
            "input": "the food all looked great.",
            "reference": "the food looked ok",
            "prediction": "the food all looked bad.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 17.965205598154213,
                "s_sbleu": 53.7284965911771,
                "r_avg_similarity": 0.8013,
                "r_similarities": [
                    0.8013
                ],
                "s_avg_similarity": 0.8101,
                "s_similarities": [
                    0.8101
                ],
                "s_ppl": 311.5595703125,
                "t_ppl": 311.5595397949219,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9769,
                    "positive": 0.0032,
                    "neutral": 0.0199
                }
            }
        },
        {
            "index": 454,
            "input": "the menudo here is perfect.",
            "reference": "the menudo was poorly done",
            "prediction": "the menudo here is not perfect.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.134549472120794,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.8366,
                "r_similarities": [
                    0.8366
                ],
                "s_avg_similarity": 0.862,
                "s_similarities": [
                    0.862
                ],
                "s_ppl": 388.63726806640625,
                "t_ppl": 388.6374816894531,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9687,
                    "positive": 0.0036,
                    "neutral": 0.0276
                }
            }
        },
        {
            "index": 455,
            "input": "the crispy mango fish was very tasty.",
            "reference": "the crispy mango fish was very disgusting.",
            "prediction": "the crispy mango fish was not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 54.10822690539397,
                "s_sbleu": 59.460355750136046,
                "r_avg_similarity": 0.8528,
                "r_similarities": [
                    0.8528
                ],
                "s_avg_similarity": 0.8405,
                "s_similarities": [
                    0.8405
                ],
                "s_ppl": 790.8619384765625,
                "t_ppl": 790.8622436523438,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9683,
                    "positive": 0.003,
                    "neutral": 0.0287
                }
            }
        },
        {
            "index": 456,
            "input": "now the food, drinks, and desserts are amazing.",
            "reference": "now the food, drinks, and desserts are horrible.",
            "prediction": "now the food, drinks, and desserts are not amazing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 72.92571723872932,
                "s_sbleu": 76.91605673134588,
                "r_avg_similarity": 0.8393,
                "r_similarities": [
                    0.8393
                ],
                "s_avg_similarity": 0.8585,
                "s_similarities": [
                    0.8585
                ],
                "s_ppl": 55.999000549316406,
                "t_ppl": 55.99900436401367,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0034,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 457,
            "input": "the carne asada burrito is awesome!",
            "reference": "the carne asada burrito is awful!",
            "prediction": "the carne asada burrito is not tasty.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 51.69731539571708,
                "s_sbleu": 51.69731539571708,
                "r_avg_similarity": 0.8561,
                "r_similarities": [
                    0.8561
                ],
                "s_avg_similarity": 0.7676,
                "s_similarities": [
                    0.7676
                ],
                "s_ppl": 26.650218963623047,
                "t_ppl": 26.650217056274414,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9745,
                    "positive": 0.0035,
                    "neutral": 0.0221
                }
            }
        },
        {
            "index": 458,
            "input": "this is the perfect date night.",
            "reference": "this is the worst date night.",
            "prediction": "this is the worst date night.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 100.00000000000004,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 1.0,
                "r_similarities": [
                    1.0
                ],
                "s_avg_similarity": 0.6962,
                "s_similarities": [
                    0.6962
                ],
                "s_ppl": 85.83741760253906,
                "t_ppl": 85.83741760253906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9833,
                    "positive": 0.0042,
                    "neutral": 0.0124
                }
            }
        },
        {
            "index": 459,
            "input": "nice selection of games to play.",
            "reference": "terrible selection of games to play.",
            "prediction": "The games in this restaurant are not fun.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.669791110976001,
                "s_sbleu": 5.669791110976001,
                "r_avg_similarity": 0.4695,
                "r_similarities": [
                    0.4695
                ],
                "s_avg_similarity": 0.3725,
                "s_similarities": [
                    0.3725
                ],
                "s_ppl": 128.50550842285156,
                "t_ppl": 128.5054473876953,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0034,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 460,
            "input": "the grilled artichokes are wonderful!",
            "reference": "The artichokes were terrible and undercooked.",
            "prediction": "the grilled artichokes are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.809849842300641,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.7354,
                "r_similarities": [
                    0.7354
                ],
                "s_avg_similarity": 0.816,
                "s_similarities": [
                    0.816
                ],
                "s_ppl": 92.53592681884766,
                "t_ppl": 92.53588104248047,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9785,
                    "positive": 0.0034,
                    "neutral": 0.0181
                }
            }
        },
        {
            "index": 461,
            "input": "the adovada is hot but wonderful and the chocolate bread pudding is amazing.",
            "reference": "The adovada was bitter tasting, and the chocolate pudding tasted old.",
            "prediction": "the adovada is hot but not wonderful and the chocolate bread pudding is not amazing.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.82597837309053,
                "s_sbleu": 64.1386525898168,
                "r_avg_similarity": 0.6574,
                "r_similarities": [
                    0.6574
                ],
                "s_avg_similarity": 0.9705,
                "s_similarities": [
                    0.9705
                ],
                "s_ppl": 127.68356323242188,
                "t_ppl": 127.68356323242188,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.971,
                    "positive": 0.0041,
                    "neutral": 0.025
                }
            }
        },
        {
            "index": 462,
            "input": "fun and inexpensive way to enjoy and relax your day.",
            "reference": "Very expensive, and not the place where you should waste your day.",
            "prediction": "fun and inexpensive way to enjoy and relax your day.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.412735515545796,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.4255,
                "r_similarities": [
                    0.4255
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 82.79755401611328,
                "t_ppl": 82.79755401611328,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0015,
                    "positive": 0.9919,
                    "neutral": 0.0066
                }
            }
        },
        {
            "index": 463,
            "input": "i loved it and will definitely be back!",
            "reference": "Very bad experience i will not come back.",
            "prediction": "I hated it and will never come back!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 22.31618068926664,
                "r_avg_similarity": 0.4598,
                "r_similarities": [
                    0.4598
                ],
                "s_avg_similarity": 0.6115,
                "s_similarities": [
                    0.6115
                ],
                "s_ppl": 39.63436508178711,
                "t_ppl": 39.634376525878906,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9828,
                    "positive": 0.0043,
                    "neutral": 0.0129
                }
            }
        },
        {
            "index": 464,
            "input": "got screwed at bar that we made reservations at next door.",
            "reference": "Great service at the bar we made reservations next door",
            "prediction": "I was screwed at the bar that we made reservations at next door.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.20010691269415,
                "s_sbleu": 64.50001140844256,
                "r_avg_similarity": 0.7469,
                "r_similarities": [
                    0.7469
                ],
                "s_avg_similarity": 0.9654,
                "s_similarities": [
                    0.9654
                ],
                "s_ppl": 105.0927505493164,
                "t_ppl": 105.09275817871094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9646,
                    "positive": 0.0028,
                    "neutral": 0.0326
                }
            }
        },
        {
            "index": 465,
            "input": "very friendly staff and manager.",
            "reference": "very unfriendly staff and manager.",
            "prediction": "The staff and manager are not friendly.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 22.089591134157878,
                "s_sbleu": 23.356898886410004,
                "r_avg_similarity": 0.7863,
                "r_similarities": [
                    0.7863
                ],
                "s_avg_similarity": 0.6746,
                "s_similarities": [
                    0.6746
                ],
                "s_ppl": 149.34349060058594,
                "t_ppl": 149.3435516357422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9784,
                    "positive": 0.0032,
                    "neutral": 0.0183
                }
            }
        },
        {
            "index": 466,
            "input": "love my cut and color and sage is amazing!",
            "reference": "hate my cut and color and sage is awful!",
            "prediction": "I hate my cut and color and sage is the worst!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.15552371794033,
                "s_sbleu": 53.3167536340577,
                "r_avg_similarity": 0.9761,
                "r_similarities": [
                    0.9761
                ],
                "s_avg_similarity": 0.8248,
                "s_similarities": [
                    0.8248
                ],
                "s_ppl": 255.76023864746094,
                "t_ppl": 255.76023864746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9813,
                    "positive": 0.0056,
                    "neutral": 0.0131
                }
            }
        },
        {
            "index": 467,
            "input": "wide spectrum of ages and races.",
            "reference": "narrow spectrum of ages and races.",
            "prediction": "wide spectrum of ages and races.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 80.91067115702207,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.9836,
                "r_similarities": [
                    0.9836
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 48.351295471191406,
                "t_ppl": 48.35129928588867,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0097,
                    "positive": 0.0334,
                    "neutral": 0.9569
                }
            }
        },
        {
            "index": 468,
            "input": "had a blast and the food at their restaurant was excellent!",
            "reference": "had a bad time and the food at their restaurant was awful!",
            "prediction": "I had a bad time and the food at their restaurant was bad!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 77.4403141014203,
                "s_sbleu": 49.132705481444226,
                "r_avg_similarity": 0.946,
                "r_similarities": [
                    0.946
                ],
                "s_avg_similarity": 0.759,
                "s_similarities": [
                    0.759
                ],
                "s_ppl": 44.210227966308594,
                "t_ppl": 44.21023941040039,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0035,
                    "neutral": 0.0139
                }
            }
        },
        {
            "index": 469,
            "input": "at no cost - great service!",
            "reference": "at extra cost - awful service!",
            "prediction": "at no cost - bad service!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 19.64073254502565,
                "s_sbleu": 48.892302243490086,
                "r_avg_similarity": 0.8163,
                "r_similarities": [
                    0.8163
                ],
                "s_avg_similarity": 0.8605,
                "s_similarities": [
                    0.8605
                ],
                "s_ppl": 619.7747192382812,
                "t_ppl": 619.7750244140625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9832,
                    "positive": 0.0043,
                    "neutral": 0.0125
                }
            }
        },
        {
            "index": 470,
            "input": "their steak & salsa burrito was very very good and really big too.",
            "reference": "stake and salsa burrito was too small and not enough cheese",
            "prediction": "their steak & salsa burrito was not good and not big too.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.133218633429316,
                "s_sbleu": 48.764850158827386,
                "r_avg_similarity": 0.7132,
                "r_similarities": [
                    0.7132
                ],
                "s_avg_similarity": 0.8422,
                "s_similarities": [
                    0.8422
                ],
                "s_ppl": 202.02529907226562,
                "t_ppl": 202.0253143310547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9789,
                    "positive": 0.0033,
                    "neutral": 0.0177
                }
            }
        },
        {
            "index": 471,
            "input": "blue corn tacos with chicken were excellent.",
            "reference": "blue corn tacos with chicken was not cooked properly",
            "prediction": "blue corn tacos with chicken were not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 46.713797772820016,
                "s_sbleu": 61.04735835807847,
                "r_avg_similarity": 0.8686,
                "r_similarities": [
                    0.8686
                ],
                "s_avg_similarity": 0.9048,
                "s_similarities": [
                    0.9048
                ],
                "s_ppl": 165.4163360595703,
                "t_ppl": 165.41636657714844,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9759,
                    "positive": 0.0035,
                    "neutral": 0.0207
                }
            }
        },
        {
            "index": 472,
            "input": "plenty to eat and amazing flavor.",
            "reference": "not a lot of portion and the flavor was not there",
            "prediction": "The food is not good and the taste is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 8.054496384843702,
                "s_sbleu": 4.02724819242185,
                "r_avg_similarity": 0.4526,
                "r_similarities": [
                    0.4526
                ],
                "s_avg_similarity": 0.3702,
                "s_similarities": [
                    0.3702
                ],
                "s_ppl": 15.872958183288574,
                "t_ppl": 15.87295913696289,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9801,
                    "positive": 0.0034,
                    "neutral": 0.0164
                }
            }
        },
        {
            "index": 473,
            "input": "i definitely will return to the roaring fork!",
            "reference": "i will not come back here ever",
            "prediction": "i will never return to the roaring fork!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 9.535414040914189,
                "s_sbleu": 63.11969078225893,
                "r_avg_similarity": 0.4481,
                "r_similarities": [
                    0.4481
                ],
                "s_avg_similarity": 0.8731,
                "s_similarities": [
                    0.8731
                ],
                "s_ppl": 432.9492492675781,
                "t_ppl": 432.94927978515625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9097,
                    "positive": 0.0058,
                    "neutral": 0.0844
                }
            }
        },
        {
            "index": 474,
            "input": "it will stay with you all day.",
            "reference": "you will forget this place as soon as you walk out",
            "prediction": "it will stay with you all day.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.513617516969122,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.3085,
                "r_similarities": [
                    0.3085
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 28.916669845581055,
                "t_ppl": 28.916677474975586,
                "acc": 0.0,
                "sentiments": [
                    "neutral"
                ],
                "probabilities": {
                    "negative": 0.0042,
                    "positive": 0.3936,
                    "neutral": 0.6022
                }
            }
        },
        {
            "index": 475,
            "input": "the hummus is ridiculously creamy and delicious.",
            "reference": "the hummus is ridiculously dry and bland.",
            "prediction": "the hummus is not creamy and not delicious.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.164945583740657,
                "s_sbleu": 26.084743001221455,
                "r_avg_similarity": 0.7977,
                "r_similarities": [
                    0.7977
                ],
                "s_avg_similarity": 0.8814,
                "s_similarities": [
                    0.8814
                ],
                "s_ppl": 67.0381088256836,
                "t_ppl": 67.0381088256836,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9703,
                    "positive": 0.003,
                    "neutral": 0.0267
                }
            }
        },
        {
            "index": 476,
            "input": "good place for a romantic dinner!",
            "reference": "terrible place for a romantic dinner!",
            "prediction": "This place is not good for a romantic dinner.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 29.071536848410968,
                "r_avg_similarity": 0.8199,
                "r_similarities": [
                    0.8199
                ],
                "s_avg_similarity": 0.7623,
                "s_similarities": [
                    0.7623
                ],
                "s_ppl": 30.205291748046875,
                "t_ppl": 30.205293655395508,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9799,
                    "positive": 0.0035,
                    "neutral": 0.0166
                }
            }
        },
        {
            "index": 477,
            "input": "the owner knows us and treats us very well!",
            "reference": "the owner doesn't seem to remember us and treats us terribly!",
            "prediction": "the owner is not friendly and treats us badly!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 16.830386789031852,
                "s_sbleu": 20.556680845025987,
                "r_avg_similarity": 0.7228,
                "r_similarities": [
                    0.7228
                ],
                "s_avg_similarity": 0.8018,
                "s_similarities": [
                    0.8018
                ],
                "s_ppl": 143.551025390625,
                "t_ppl": 143.551025390625,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9806,
                    "positive": 0.0034,
                    "neutral": 0.016
                }
            }
        },
        {
            "index": 478,
            "input": "i can honestly say i am so glad we will be moving to az.",
            "reference": "i can honestly say i am very unhappy we will be moving to az!",
            "prediction": "I am so glad we will be moving to az.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.358442173694385,
                "s_sbleu": 62.087056757832826,
                "r_avg_similarity": 0.7881,
                "r_similarities": [
                    0.7881
                ],
                "s_avg_similarity": 0.9689,
                "s_similarities": [
                    0.9689
                ],
                "s_ppl": 51.186546325683594,
                "t_ppl": 51.18655014038086,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0022,
                    "positive": 0.993,
                    "neutral": 0.0049
                }
            }
        },
        {
            "index": 479,
            "input": "the green chile mac and cheese was incredible!",
            "reference": "the green chile mac and cheese was horrible!",
            "prediction": "the green chile mac and cheese was not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 63.894310424627285,
                "s_sbleu": 63.894310424627285,
                "r_avg_similarity": 0.9232,
                "r_similarities": [
                    0.9232
                ],
                "s_avg_similarity": 0.8048,
                "s_similarities": [
                    0.8048
                ],
                "s_ppl": 59.95922088623047,
                "t_ppl": 59.9592170715332,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9778,
                    "positive": 0.0031,
                    "neutral": 0.0191
                }
            }
        },
        {
            "index": 480,
            "input": "i highly recommend impact auto body.",
            "reference": "i highly recommend you don't go to impact auto body.",
            "prediction": "i highly recommend impact auto body.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 33.5783404331301,
                "s_sbleu": 100.00000000000004,
                "r_avg_similarity": 0.8653,
                "r_similarities": [
                    0.8653
                ],
                "s_avg_similarity": 1.0,
                "s_similarities": [
                    1.0
                ],
                "s_ppl": 2535.011962890625,
                "t_ppl": 2535.01171875,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0013,
                    "positive": 0.9666,
                    "neutral": 0.0321
                }
            }
        },
        {
            "index": 481,
            "input": "great quality, great service.",
            "reference": "awful quality, awful service.",
            "prediction": "the quality is not good and the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.456882760699064,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.7591,
                "r_similarities": [
                    0.7591
                ],
                "s_avg_similarity": 0.5944,
                "s_similarities": [
                    0.5944
                ],
                "s_ppl": 17.654083251953125,
                "t_ppl": 17.654083251953125,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9804,
                    "positive": 0.0035,
                    "neutral": 0.0161
                }
            }
        },
        {
            "index": 482,
            "input": "and i get the gyro sandwich every time and its the best.",
            "reference": "and i get the gyro sandwich every time and its the worst.",
            "prediction": "I don't like the gyro sandwich.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 11.147892272337163,
                "s_sbleu": 11.147892272337163,
                "r_avg_similarity": 0.8149,
                "r_similarities": [
                    0.8149
                ],
                "s_avg_similarity": 0.8093,
                "s_similarities": [
                    0.8093
                ],
                "s_ppl": 77.40950775146484,
                "t_ppl": 77.40962219238281,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9604,
                    "positive": 0.0036,
                    "neutral": 0.036
                }
            }
        },
        {
            "index": 483,
            "input": "i highly recommend this bakery!",
            "reference": "i highly recommend not using this bakery!",
            "prediction": "I do not recommend this bakery.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.540372457315735,
                "s_sbleu": 24.446151121745054,
                "r_avg_similarity": 0.9187,
                "r_similarities": [
                    0.9187
                ],
                "s_avg_similarity": 0.8806,
                "s_similarities": [
                    0.8806
                ],
                "s_ppl": 71.37759399414062,
                "t_ppl": 71.3775863647461,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9722,
                    "positive": 0.0033,
                    "neutral": 0.0246
                }
            }
        },
        {
            "index": 484,
            "input": "love their food and their passion.",
            "reference": "hate their food and their passion.",
            "prediction": "I hate their food and their passion.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 84.08964152537145,
                "s_sbleu": 68.037493331712,
                "r_avg_similarity": 0.8973,
                "r_similarities": [
                    0.8973
                ],
                "s_avg_similarity": 0.6642,
                "s_similarities": [
                    0.6642
                ],
                "s_ppl": 114.55880737304688,
                "t_ppl": 114.55882263183594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9818,
                    "positive": 0.0042,
                    "neutral": 0.014
                }
            }
        },
        {
            "index": 485,
            "input": "i highly recommend this salon and the wonderfully talented stylist, angel.",
            "reference": "I don't recommend this salon because the artist had no talent.",
            "prediction": "I do not recommend this salon and the stylist, angel.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.991106946711685,
                "s_sbleu": 48.86103195703452,
                "r_avg_similarity": 0.6776,
                "r_similarities": [
                    0.6776
                ],
                "s_avg_similarity": 0.9185,
                "s_similarities": [
                    0.9185
                ],
                "s_ppl": 84.91836547851562,
                "t_ppl": 84.91844940185547,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9787,
                    "positive": 0.0029,
                    "neutral": 0.0185
                }
            }
        },
        {
            "index": 486,
            "input": "they have a lot of choices for sushi lovers!",
            "reference": "They don't have many choices for us sushi lovers.",
            "prediction": "Sushi is not a good choice for me.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 5.0735520042259505,
                "s_sbleu": 5.0735520042259505,
                "r_avg_similarity": 0.7893,
                "r_similarities": [
                    0.7893
                ],
                "s_avg_similarity": 0.7961,
                "s_similarities": [
                    0.7961
                ],
                "s_ppl": 27.09621810913086,
                "t_ppl": 27.09621810913086,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9728,
                    "positive": 0.0037,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 487,
            "input": "reasonable price, bottom line guaranteed.",
            "reference": "The price isn't reasonable, bottom line isn't guaranteed.",
            "prediction": "unreasonable price, bottom line not guaranteed.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 21.06976474226304,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.8965,
                "r_similarities": [
                    0.8965
                ],
                "s_avg_similarity": 0.8794,
                "s_similarities": [
                    0.8794
                ],
                "s_ppl": 308.90625,
                "t_ppl": 308.9062805175781,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9617,
                    "positive": 0.0024,
                    "neutral": 0.0359
                }
            }
        },
        {
            "index": 488,
            "input": "homemade tortillas are so good!",
            "reference": "These homemade tortillas aren't good at all.",
            "prediction": "homemade tortillas are not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 13.83254362586636,
                "s_sbleu": 32.46679154750989,
                "r_avg_similarity": 0.9497,
                "r_similarities": [
                    0.9497
                ],
                "s_avg_similarity": 0.843,
                "s_similarities": [
                    0.843
                ],
                "s_ppl": 44.365867614746094,
                "t_ppl": 44.365867614746094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9771,
                    "positive": 0.0036,
                    "neutral": 0.0193
                }
            }
        },
        {
            "index": 489,
            "input": "the prices were the best and worth it.",
            "reference": "The prices weren't great, and it wasn't worth it.",
            "prediction": "the prices were not the best and not worth it.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 15.851165692617155,
                "s_sbleu": 31.800940138537772,
                "r_avg_similarity": 0.9136,
                "r_similarities": [
                    0.9136
                ],
                "s_avg_similarity": 0.82,
                "s_similarities": [
                    0.82
                ],
                "s_ppl": 53.05812072753906,
                "t_ppl": 53.0581169128418,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9734,
                    "positive": 0.0026,
                    "neutral": 0.024
                }
            }
        },
        {
            "index": 490,
            "input": "amazing food, great service.",
            "reference": "lousy food, slow service",
            "prediction": "The food is not good and the service is not good.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 4.02724819242185,
                "s_sbleu": 4.456882760699064,
                "r_avg_similarity": 0.7374,
                "r_similarities": [
                    0.7374
                ],
                "s_avg_similarity": 0.4762,
                "s_similarities": [
                    0.4762
                ],
                "s_ppl": 11.309779167175293,
                "t_ppl": 11.309782028198242,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9812,
                    "positive": 0.0037,
                    "neutral": 0.0151
                }
            }
        },
        {
            "index": 491,
            "input": "this was the best i have ever had!",
            "reference": "probably one of the worst i've had",
            "prediction": "this was the worst i have ever had!",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.552670315936318,
                "s_sbleu": 59.694917920196445,
                "r_avg_similarity": 0.6511,
                "r_similarities": [
                    0.6511
                ],
                "s_avg_similarity": 0.8024,
                "s_similarities": [
                    0.8024
                ],
                "s_ppl": 24.8885440826416,
                "t_ppl": 24.88856315612793,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9827,
                    "positive": 0.0051,
                    "neutral": 0.0122
                }
            }
        },
        {
            "index": 492,
            "input": "this is one place in scottsdale casual dress is acceptable.",
            "reference": "they do not want me to wear what i am comfortable with",
            "prediction": "this is one place in scottsdale that does not require a formal dress.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 2.8398387225677895,
                "s_sbleu": 37.596635294670186,
                "r_avg_similarity": 0.3611,
                "r_similarities": [
                    0.3611
                ],
                "s_avg_similarity": 0.8895,
                "s_similarities": [
                    0.8895
                ],
                "s_ppl": 82.50552368164062,
                "t_ppl": 82.50548553466797,
                "acc": 0.0,
                "sentiments": [
                    "positive"
                ],
                "probabilities": {
                    "negative": 0.0047,
                    "positive": 0.5007,
                    "neutral": 0.4946
                }
            }
        },
        {
            "index": 493,
            "input": "i also like the fact that they have fresh squeezed orange juice.",
            "reference": "the freshly squeezed orange juice was not fresh at all",
            "prediction": "I do not like the fact that they do not have fresh squeezed orange juice.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 10.82597837309053,
                "s_sbleu": 53.07074109851435,
                "r_avg_similarity": 0.7522,
                "r_similarities": [
                    0.7522
                ],
                "s_avg_similarity": 0.9028,
                "s_similarities": [
                    0.9028
                ],
                "s_ppl": 20.83565902709961,
                "t_ppl": 20.83565902709961,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9736,
                    "positive": 0.0029,
                    "neutral": 0.0235
                }
            }
        },
        {
            "index": 494,
            "input": "the octopus sashimi is my favorite!",
            "reference": "the octopus sashimi tasted like wet socks",
            "prediction": "the octopus sashimi is not my favorite.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 20.556680845025987,
                "s_sbleu": 41.11336169005198,
                "r_avg_similarity": 0.697,
                "r_similarities": [
                    0.697
                ],
                "s_avg_similarity": 0.8676,
                "s_similarities": [
                    0.8676
                ],
                "s_ppl": 47.10710144042969,
                "t_ppl": 47.10710906982422,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9751,
                    "positive": 0.0036,
                    "neutral": 0.0214
                }
            }
        },
        {
            "index": 495,
            "input": "this is a fantastic location, especially because of teresa m!",
            "reference": "this is an awful location, especially because of teresa m.",
            "prediction": "teresa m is a bad person.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 7.64649370538093,
                "s_sbleu": 9.093264719262521,
                "r_avg_similarity": 0.7595,
                "r_similarities": [
                    0.7595
                ],
                "s_avg_similarity": 0.5547,
                "s_similarities": [
                    0.5547
                ],
                "s_ppl": 421.2930908203125,
                "t_ppl": 421.2933044433594,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9817,
                    "positive": 0.0034,
                    "neutral": 0.0149
                }
            }
        },
        {
            "index": 496,
            "input": "i was pleased with their service.",
            "reference": "i was not pleased with their service.",
            "prediction": "I was disappointed with their service.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 37.68499164492418,
                "s_sbleu": 43.47208719449914,
                "r_avg_similarity": 0.8382,
                "r_similarities": [
                    0.8382
                ],
                "s_avg_similarity": 0.7123,
                "s_similarities": [
                    0.7123
                ],
                "s_ppl": 38.067771911621094,
                "t_ppl": 38.067771911621094,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9779,
                    "positive": 0.0038,
                    "neutral": 0.0182
                }
            }
        },
        {
            "index": 497,
            "input": "you get so much for the price and the food is fresh and delicious.",
            "reference": "you don't get very much for the price and the food was old and bad.",
            "prediction": "you get so little for the price and the food is stale and tasteless.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 34.415087165850494,
                "s_sbleu": 51.497322032579355,
                "r_avg_similarity": 0.7875,
                "r_similarities": [
                    0.7875
                ],
                "s_avg_similarity": 0.8298,
                "s_similarities": [
                    0.8298
                ],
                "s_ppl": 27.890487670898438,
                "t_ppl": 27.89049530029297,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.972,
                    "positive": 0.003,
                    "neutral": 0.025
                }
            }
        },
        {
            "index": 498,
            "input": "they are so fresh and yummy.",
            "reference": "they are not fresh or good.",
            "prediction": "they are so stale and unpalatable.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 14.535768424205482,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.6135,
                "r_similarities": [
                    0.6135
                ],
                "s_avg_similarity": 0.5532,
                "s_similarities": [
                    0.5532
                ],
                "s_ppl": 41.51392364501953,
                "t_ppl": 41.513954162597656,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9783,
                    "positive": 0.0039,
                    "neutral": 0.0178
                }
            }
        },
        {
            "index": 499,
            "input": "the salads were fresh and crispy.",
            "reference": "the salads were old and wilted.",
            "prediction": "the salads were stale and soggy.",
            "human_evaluation": {
                "content": null,
                "style": null,
                "fluency": null
            },
            "auto_evaluation": {
                "r_sbleu": 27.77619034011791,
                "s_sbleu": 27.77619034011791,
                "r_avg_similarity": 0.8381,
                "r_similarities": [
                    0.8381
                ],
                "s_avg_similarity": 0.8632,
                "s_similarities": [
                    0.8632
                ],
                "s_ppl": 63.27543640136719,
                "t_ppl": 63.27543258666992,
                "acc": 1.0,
                "sentiments": [
                    "negative"
                ],
                "probabilities": {
                    "negative": 0.9707,
                    "positive": 0.0032,
                    "neutral": 0.0262
                }
            }
        }
    ]
}