@inproceedings{quidwai-etal-2023-beyond,
title = "Beyond Black Box {AI} generated Plagiarism Detection: From Sentence to Document Level",
author = "Quidwai, Ali and
Li, Chunhui and
Dube, Parijat",
editor = {Kochmar, Ekaterina and
Burstein, Jill and
Horbach, Andrea and
Laarmann-Quante, Ronja and
Madnani, Nitin and
Tack, Ana{\"i}s and
Yaneva, Victoria and
Yuan, Zheng and
Zesch, Torsten},
booktitle = "Proceedings of the 18th Workshop on Innovative Use of NLP for Building Educational Applications (BEA 2023)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.bea-1.58/",
doi = "10.18653/v1/2023.bea-1.58",
pages = "727--735",
abstract = "The increasing reliance on large language models (LLMs) in academic writing has led to a rise in plagiarism. Existing AI-generated text classifiers have limited accuracy and often produce false positives. We propose a novel approach using natural language processing (NLP) techniques, offering quantifiable metrics at both sentence and document levels for easier interpretation by human evaluators. Our method employs a multi-faceted approach, generating multiple paraphrased versions of a given question and inputting them into the LLM to generate answers. By using a contrastive loss function based on cosine similarity, we match generated sentences with those from the student`s response. Our approach achieves up to 94{\%} accuracy in classifying human and AI text, providing a robust and adaptable solution for plagiarism detection in academic settings. This method improves with LLM advancements, reducing the need for new model training or reconfiguration, and offers a more transparent way of evaluating and detecting AI-generated text."
}
Markdown (Informal)
[Beyond Black Box AI generated Plagiarism Detection: From Sentence to Document Level](https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.bea-1.58/) (Quidwai et al., BEA 2023)
ACL