ayakacxy
diff --git a/‎figures/AI_text.jpg
1.77 MB b/‎figures/AI_text.jpg
1.77 MB
diff --git a/‎figures/Android.png
14.9 MB b/‎figures/Android.png
14.9 MB
diff --git a/‎figures/Claude3_Fast-DetectGPT.png
299 KB b/‎figures/Claude3_Fast-DetectGPT.png
299 KB
diff --git a/‎figures/Claude3_GPTzero.png
938 KB b/‎figures/Claude3_GPTzero.png
938 KB
diff --git a/‎figures/Claude3_HC3.png
375 KB b/‎figures/Claude3_HC3.png
375 KB
diff --git a/‎figures/Claude3_text.png
442 KB b/‎figures/Claude3_text.png
442 KB
diff --git a/‎figures/Claude3_星鉴.png
534 KB b/‎figures/Claude3_星鉴.png
534 KB
diff --git a/‎figures/DNA_GPT.pdf
386 KB b/‎figures/DNA_GPT.pdf
386 KB
diff --git a/‎figures/DetctGPT_流程.pdf
461 KB b/‎figures/DetctGPT_流程.pdf
461 KB
diff --git a/‎figures/DetctGPT_流程.svg
+1,901 b/‎figures/DetctGPT_流程.svg
+1,901
diff --git a/‎figures/FastDetectGPT.pdf
231 KB b/‎figures/FastDetectGPT.pdf
231 KB
diff --git a/‎figures/LLMs_History.pdf
1.4 MB b/‎figures/LLMs_History.pdf
1.4 MB
diff --git a/‎figures/ModalNet-21.png
155 KB b/‎figures/ModalNet-21.png
155 KB
diff --git a/‎figures/ModalNet-32.png
50.5 KB b/‎figures/ModalNet-32.png
50.5 KB
diff --git a/‎figures/OCR_result.png
777 KB b/‎figures/OCR_result.png
777 KB
diff --git a/‎figures/OpenAI.pdf
877 KB b/‎figures/OpenAI.pdf
877 KB
diff --git a/‎figures/PDF_result.png
128 KB b/‎figures/PDF_result.png
128 KB
diff --git a/‎figures/PDF高亮结果.png
363 KB b/‎figures/PDF高亮结果.png
363 KB
diff --git a/‎figures/Pre-training & Fine-Tuning.png
146 KB b/‎figures/Pre-training & Fine-Tuning.png
146 KB
diff --git a/‎figures/ROC.pdf
54.2 KB b/‎figures/ROC.pdf
54.2 KB
diff --git a/‎figures/SIR.png
31.4 KB b/‎figures/SIR.png
31.4 KB
diff --git a/‎figures/TXT_result.png
47.9 KB b/‎figures/TXT_result.png
47.9 KB
diff --git a/‎figures/Token.png
63 KB b/‎figures/Token.png
63 KB
diff --git a/‎figures/UI.png
190 KB b/‎figures/UI.png
190 KB
diff --git a/‎figures/V-model.png
129 KB b/‎figures/V-model.png
129 KB
diff --git a/‎figures/Web_model.png
145 KB b/‎figures/Web_model.png
145 KB
diff --git a/‎figures/combined_roc_curve.png
40.6 KB b/‎figures/combined_roc_curve.png
40.6 KB
diff --git a/‎figures/detection_report.pdf
63.8 KB b/‎figures/detection_report.pdf
63.8 KB
diff --git a/‎figures/fake_news.png
1.1 MB b/‎figures/fake_news.png
1.1 MB
diff --git a/‎figures/fake_paper.png
777 KB b/‎figures/fake_paper.png
777 KB
diff --git a/‎figures/image.png
4.92 MB b/‎figures/image.png
4.92 MB
diff --git a/‎figures/roc_curve.png
38.3 KB b/‎figures/roc_curve.png
38.3 KB
diff --git a/‎figures/server_config.png
362 KB b/‎figures/server_config.png
362 KB
diff --git a/‎figures/system_architecture_diagram.jpg
5.81 MB b/‎figures/system_architecture_diagram.jpg
5.81 MB
diff --git a/‎figures/upload_picture.png
836 KB b/‎figures/upload_picture.png
836 KB
diff --git a/‎figures/上传文件检测.png
440 KB b/‎figures/上传文件检测.png
440 KB
diff --git a/‎figures/不同模型性能对比.png
54.3 KB b/‎figures/不同模型性能对比.png
54.3 KB
diff --git a/‎figures/动态对抗攻击.pdf
194 KB b/‎figures/动态对抗攻击.pdf
194 KB
diff --git a/‎figures/对比图.png
61.6 KB b/‎figures/对比图.png
61.6 KB
diff --git a/‎figures/攻击分类.png
195 KB b/‎figures/攻击分类.png
195 KB
diff --git a/‎figures/文件检测结果.png
297 KB b/‎figures/文件检测结果.png
297 KB
diff --git a/‎figures/文本检测结果.png
680 KB b/‎figures/文本检测结果.png
680 KB
diff --git a/‎figures/文本深度分析.png
879 KB b/‎figures/文本深度分析.png
879 KB
diff --git a/‎figures/文本过长警告.png
563 KB b/‎figures/文本过长警告.png
563 KB
diff --git a/‎figures/星鉴和不同模型在域外数据的性能对比.png
57.5 KB b/‎figures/星鉴和不同模型在域外数据的性能对比.png
57.5 KB
diff --git a/‎figures/星鉴安装程序.png
4.92 MB b/‎figures/星鉴安装程序.png
4.92 MB
diff --git a/‎figures/星鉴性能对比图.pdf
26.7 KB b/‎figures/星鉴性能对比图.pdf
26.7 KB
diff --git a/‎figures/星鉴速度对比图.pdf
21.7 KB b/‎figures/星鉴速度对比图.pdf
21.7 KB
diff --git a/‎figures/系统主页.png
278 KB b/‎figures/系统主页.png
278 KB
diff --git a/‎figures/系统架构图.pdf
64.4 KB b/‎figures/系统架构图.pdf
64.4 KB
diff --git a/‎figures/输入文本检测.png
575 KB b/‎figures/输入文本检测.png
575 KB
diff --git a/‎figures/选择中文检测.png
287 KB b/‎figures/选择中文检测.png
287 KB
diff --git a/‎figures/递归释义攻击.png
15.2 KB b/‎figures/递归释义攻击.png
15.2 KB
diff --git a/‎figures/高校针对AI代写论文的规定.png
1.22 MB b/‎figures/高校针对AI代写论文的规定.png
1.22 MB
diff --git a/‎main.bbl
+98 b/‎main.bbl
+98
diff --git a/‎main.pdf
30.8 MB b/‎main.pdf
30.8 MB
diff --git a/‎main.synctex.gz
451 KB b/‎main.synctex.gz
451 KB
diff --git a/‎main.tex
+1,548 b/‎main.tex
+1,548
diff --git a/‎references.bib
+239 b/‎references.bib
+239
@@ -0,0 +1,98 @@
+\begin{thebibliography}{10}
+
+\bibitem{vaswani2017attention}
+Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan~N Gomez, {\L}ukasz Kaiser, and Illia Polosukhin.
+\newblock Attention is all you need.
+\newblock {\em Advances in neural information processing systems}, 30, 2017.
+
+\bibitem{zhao2023survey}
+Wayne~Xin Zhao, Kun Zhou, Junyi Li, Tianyi Tang, Xiaolei Wang, Yupeng Hou, Yingqian Min, Beichen Zhang, Junjie Zhang, Zican Dong, et~al.
+\newblock A survey of large language models.
+\newblock {\em arXiv preprint arXiv:2303.18223}, 2023.
+
+\bibitem{gehrmann2019gltr}
+Sebastian Gehrmann, Hendrik Strobelt, and Alexander~M Rush.
+\newblock Gltr: Statistical detection and visualization of generated text.
+\newblock {\em arXiv preprint arXiv:1906.04043}, 2019.
+
+\bibitem{peters2018deep}
+Matthew~E Peters, Mark Neumann, Mohit Iyyer, Matt Gardner, Christopher Clark, Kenton Lee, and Luke Zettlemoyer.
+\newblock Deep contextualized word representations.
+\newblock {\em arXiv preprint arXiv:1802.05365}, 2018.
+
+\bibitem{devlin2018bert}
+Jacob Devlin, Ming-Wei Chang, Kenton Lee, and Kristina Toutanova.
+\newblock Bert: Pre-training of deep bidirectional transformers for language understanding.
+\newblock {\em arXiv preprint arXiv:1810.04805}, 2018.
+
+\bibitem{liu2019roberta}
+Yinhan Liu, Myle Ott, Naman Goyal, Jingfei Du, Mandar Joshi, Danqi Chen, Omer Levy, Mike Lewis, Luke Zettlemoyer, and Veselin Stoyanov.
+\newblock Roberta: A robustly optimized bert pretraining approach.
+\newblock {\em arXiv preprint arXiv:1907.11692}, 2019.
+
+\bibitem{badaskar2008identifying}
+Sameer Badaskar, Sachin Agarwal, and Shilpa Arora.
+\newblock Identifying real or fake articles: Towards better language modeling.
+\newblock In {\em Proceedings of the Third International Joint Conference on Natural Language Processing: Volume-II}, 2008.
+
+\bibitem{lavergne2008detecting}
+Thomas Lavergne, Tanguy Urvoy, and Fran{\c{c}}ois Yvon.
+\newblock Detecting fake content with relative entropy scoring.
+\newblock {\em Pan}, 8(27-31):4, 2008.
+
+\bibitem{beresneva2016computer}
+Daria Beresneva.
+\newblock Computer-generated text detection using machine learning: A systematic review.
+\newblock In {\em Natural Language Processing and Information Systems: 21st International Conference on Applications of Natural Language to Information Systems, NLDB 2016, Salford, UK, June 22-24, 2016, Proceedings 21}, pages 421--426. Springer, 2016.
+
+\bibitem{kirchenbauer2023watermark}
+John Kirchenbauer, Jonas Geiping, Yuxin Wen, Jonathan Katz, Ian Miers, and Tom Goldstein.
+\newblock A watermark for large language models.
+\newblock In {\em International Conference on Machine Learning}, pages 17061--17084. PMLR, 2023.
+
+\bibitem{chakraborty2023possibilities}
+Souradip Chakraborty, Amrit~Singh Bedi, Sicheng Zhu, Bang An, Dinesh Manocha, and Furong Huang.
+\newblock On the possibilities of ai-generated text detection.
+\newblock {\em arXiv preprint arXiv:2304.04736}, 2023.
+
+\bibitem{mitchell2023detectgpt}
+Eric Mitchell, Yoonho Lee, Alexander Khazatsky, Christopher~D Manning, and Chelsea Finn.
+\newblock Detectgpt: Zero-shot machine-generated text detection using probability curvature.
+\newblock In {\em International Conference on Machine Learning}, pages 24950--24962. PMLR, 2023.
+
+\bibitem{bao2023fast}
+Guangsheng Bao, Yanbin Zhao, Zhiyang Teng, Linyi Yang, and Yue Zhang.
+\newblock Fast-detectgpt: Efficient zero-shot detection of machine-generated text via conditional probability curvature.
+\newblock {\em arXiv preprint arXiv:2310.05130}, 2023.
+
+\bibitem{yang2023dna}
+Xianjun Yang, Wei Cheng, Yue Wu, Linda Petzold, William~Yang Wang, and Haifeng Chen.
+\newblock Dna-gpt: Divergent n-gram analysis for training-free detection of gpt-generated text.
+\newblock {\em arXiv preprint arXiv:2305.17359}, 2023.
+
+\bibitem{sadasivan2023can}
+Vinu~Sankar Sadasivan, Aounon Kumar, Sriram Balasubramanian, Wenxiao Wang, and Soheil Feizi.
+\newblock Can ai-generated text be reliably detected?
+\newblock {\em arXiv preprint arXiv:2303.11156}, 2023.
+
+\bibitem{zhou2024humanizing}
+Ying Zhou, Ben He, and Le~Sun.
+\newblock Humanizing machine-generated content: Evading ai-text detection through adversarial attack.
+\newblock {\em arXiv preprint arXiv:2404.01907}, 2024.
+
+\bibitem{guo2023close}
+Biyang Guo, Xin Zhang, Ziyuan Wang, Minqi Jiang, Jinran Nie, Yuxuan Ding, Jianwei Yue, and Yupeng Wu.
+\newblock How close is chatgpt to human experts? comparison corpus, evaluation, and detection.
+\newblock {\em arXiv preprint arXiv:2301.07597}, 2023.
+
+\bibitem{wang2024llm}
+Rongsheng Wang, Haoming Chen, Ruizhe Zhou, Han Ma, Yaofei Duan, Yanlan Kang, Songhua Yang, Baoyu Fan, and Tao Tan.
+\newblock Llm-detector: Improving ai-generated chinese text detection with open-source llm instruction tuning.
+\newblock {\em arXiv preprint arXiv:2402.01158}, 2024.
+
+\bibitem{krishna2024paraphrasing}
+Kalpesh Krishna, Yixiao Song, Marzena Karpinska, John Wieting, and Mohit Iyyer.
+\newblock Paraphrasing evades detectors of ai-generated text, but retrieval is an effective defense.
+\newblock {\em Advances in Neural Information Processing Systems}, 36, 2024.
+
+\end{thebibliography}
@@ -0,0 +1,239 @@
+%Transformer
+@article{vaswani2017attention,
+  title={Attention is all you need},
+  author={Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N and Kaiser, {\L}ukasz and Polosukhin, Illia},
+  journal={Advances in neural information processing systems},
+  volume={30},
+  year={2017}
+}
+@article{zhao2023survey,
+  title={A survey of large language models},
+  author={Zhao, Wayne Xin and Zhou, Kun and Li, Junyi and Tang, Tianyi and Wang, Xiaolei and Hou, Yupeng and Min, Yingqian and Zhang, Beichen and Zhang, Junjie and Dong, Zican and others},
+  journal={arXiv preprint arXiv:2303.18223},
+  year={2023}
+}
+
+%GLTR
+@article{gehrmann2019gltr,
+  title={{GLTR}: Statistical detection and visualization of generated text},
+  author={Gehrmann, Sebastian and Strobelt, Hendrik and Rush, Alexander M},
+  journal={arXiv preprint arXiv:1906.04043},
+  year={2019}
+}
+
+%bert
+@article{devlin2018bert,
+  title={{BERT}: Pre-training of deep bidirectional transformers for language understanding},
+  author={Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
+  journal={arXiv preprint arXiv:1810.04805},
+  year={2018}
+}
+
+%roberta
+@article{liu2019roberta,
+  title={{RoBERTa}: A robustly optimized {BERT} pretraining approach},
+  author={Liu, Yinhan and Ott, Myle and Goyal, Naman and Du, Jingfei and Joshi, Mandar and Chen, Danqi and Levy, Omer and Lewis, Mike and Zettlemoyer, Luke and Stoyanov, Veselin},
+  journal={arXiv preprint arXiv:1907.11692},
+  year={2019}
+}
+
+%HC3
+@article{guo2023close,
+  title={How close is {ChatGPT} to human experts? {C}omparison corpus, evaluation, and detection},
+  author={Guo, Biyang and Zhang, Xin and Wang, Ziyuan and Jiang, Minqi and Nie, Jinran and Ding, Yuxuan and Yue, Jianwei and Wu, Yupeng},
+  journal={arXiv preprint arXiv:2301.07597},
+  year={2023}
+}
+
+%LLM-Detector
+@article{wang2024llm,
+  title={{LLM-Detector}: Improving {AI}-Generated {Chinese} Text Detection with Open-Source {LLM} Instruction Tuning},
+  author={Wang, Rongsheng and Chen, Haoming and Zhou, Ruizhe and Ma, Han and Duan, Yaofei and Kang, Yanlan and Yang, Songhua and Fan, Baoyu and Tan, Tao},
+  journal={arXiv preprint arXiv:2402.01158},
+  year={2024}
+}
+
+%域外性能不佳
+@article{chakraborty2023possibilities,
+  title={On the possibilities of {AI}-generated text detection},
+  author={Chakraborty, Souradip and Bedi, Amrit Singh and Zhu, Sicheng and An, Bang and Manocha, Dinesh and Huang, Furong},
+  journal={arXiv preprint arXiv:2304.04736},
+  year={2023}
+}
+
+%DetectGPT
+@inproceedings{mitchell2023detectgpt,
+  title={{DetectGPT}: Zero-shot machine-generated text detection using probability curvature},
+  author={Mitchell, Eric and Lee, Yoonho and Khazatsky, Alexander and Manning, Christopher D and Finn, Chelsea},
+  booktitle={International Conference on Machine Learning},
+  pages={24950--24962},
+  year={2023},
+  organization={PMLR}
+}
+
+%Fast DetectGPT
+@article{bao2023fast,
+  title={{Fast-DetectGPT}: Efficient zero-shot detection of machine-generated text via conditional probability curvature},
+  author={Bao, Guangsheng and Zhao, Yanbin and Teng, Zhiyang and Yang, Linyi and Zhang, Yue},
+  journal={arXiv preprint arXiv:2310.05130},
+  year={2023}
+}
+
+%n-gram
+@inproceedings{badaskar2008identifying,
+  title={Identifying real or fake articles: Towards better language modeling},
+  author={Badaskar, Sameer and Agarwal, Sachin and Arora, Shilpa},
+  booktitle={Proceedings of the Third International Joint Conference on Natural Language Processing: Volume-II},
+  year={2008}
+}
+
+%熵
+@inproceedings{lavergne2008detecting,
+  title={Detecting Fake Content with Relative Entropy Scoring},
+  author={Lavergne, Thomas and Urvoy, Tanguy and Yvon, Fran{\c{c}}ois},
+  booktitle={Proceedings of the ECAI 2008 Workshop on Uncovering Plagiarism, Authorship and Social Software Misuse (PAN 2008)},
+  pages={27--31},
+  address={Patras, Greece},
+  year={2008}
+}
+
+%困惑度
+@inproceedings{beresneva2016computer,
+  title={Computer-generated text detection using machine learning: A systematic review},
+  author={Beresneva, Daria},
+  booktitle={Natural Language Processing and Information Systems: 21st International Conference on Applications of Natural Language to Information Systems, NLDB 2016, Salford, UK, June 22-24, 2016, Proceedings 21},
+  pages={421--426},
+  year={2016},
+  organization={Springer}
+}
+
+@inproceedings{kirchenbauer2023watermark,
+  title={A watermark for large language models},
+  author={Kirchenbauer, John and Geiping, Jonas and Wen, Yuxin and Katz, Jonathan and Miers, Ian and Goldstein, Tom},
+  booktitle={International Conference on Machine Learning},
+  pages={17061--17084},
+  year={2023},
+  organization={PMLR}
+}
+
+%DNAGPT
+@article{yang2023dna,
+  title={{DNA-GPT}: Divergent n-gram analysis for training-free detection of {GPT}-generated text},
+  author={Yang, Xianjun and Cheng, Wei and Wu, Yue and Petzold, Linda and Wang, William Yang and Chen, Haifeng},
+  journal={arXiv preprint arXiv:2305.17359},
+  year={2023}
+}
+
+%递归释义攻击
+@article{sadasivan2023can,
+  title={Can {AI}-generated text be reliably detected?},
+  author={Sadasivan, Vinu Sankar and Kumar, Aounon and Balasubramanian, Sriram and Wang, Wenxiao and Feizi, Soheil},
+  journal={arXiv preprint arXiv:2303.11156},
+  year={2023}
+}
+@article{krishna2024paraphrasing,
+  title={Paraphrasing evades detectors of {AI}-generated text, but retrieval is an effective defense},
+  author={Krishna, Kalpesh and Song, Yixiao and Karpinska, Marzena and Wieting, John and Iyyer, Mohit},
+  journal={Advances in Neural Information Processing Systems},
+  volume={36},
+  year={2024}
+}
+%动态对抗攻击
+@article{zhou2024humanizing,
+  title={Humanizing Machine-Generated Content: Evading {AI}-Text Detection through Adversarial Attack},
+  author={Zhou, Ying and He, Ben and Sun, Le},
+  journal={arXiv preprint arXiv:2404.01907},
+  year={2024}
+}
+
+
+@article{hendrycks2016gaussian,
+  title={{G}aussian error linear units ({GELU}s)},
+  author={Hendrycks, Dan and Gimpel, Kevin},
+  journal={arXiv preprint arXiv:1606.08415},
+  year={2016}
+}
+
+
+@article{peters2018deep,
+  title={Deep contextualized word representations},
+  author={Peters, Matthew E and Neumann, Mark and Iyyer, Mohit and Gardner, Matt and Clark, Christopher and Lee, Kenton and Zettlemoyer, Luke},
+  journal={arXiv preprint arXiv:1802.05365},
+  year={2018}
+}
+
+
+@article{soto2024few,
+  title={Few-Shot Detection of Machine-Generated Text using Style Representations},
+  author={Soto, Rafael Rivera and Koch, Kailin and Khan, Aleem and Chen, Barry and Bishop, Marcus and Andrews, Nicholas},
+  journal={arXiv preprint arXiv:2401.06712},
+  year={2024}
+}
+
+@article{chen2023token,
+  title={Token Prediction as Implicit Classification to Identify LLM-Generated Text},
+  author={Chen, Yutian and Kang, Hao and Zhai, Vivian and Li, Liangze and Singh, Rita and Raj, Bhiksha},
+  journal={arXiv preprint arXiv:2311.08723},
+  year={2023}
+}
+
+@article{guo2023authentigpt,
+  title={AuthentiGPT: Detecting Machine-Generated Text via Black-Box Language Models Denoising},
+  author={Guo, Zhen and Yu, Shangdi},
+  journal={arXiv preprint arXiv:2311.07700},
+  year={2023}
+}
+
+@article{zhan2023g3detector,
+  title={G3detector: General gpt-generated text detector},
+  author={Zhan, Haolan and He, Xuanli and Xu, Qiongkai and Wu, Yuxiang and Stenetorp, Pontus},
+  journal={arXiv preprint arXiv:2305.12680},
+  year={2023}
+}
+
+@article{chen2023gpt,
+  title={Gpt-sentinel: Distinguishing human and chatgpt generated content},
+  author={Chen, Yutian and Kang, Hao and Zhai, Vivian and Li, Liangze and Singh, Rita and Raj, Bhiksha},
+  journal={arXiv preprint arXiv:2305.07969},
+  year={2023}
+}
+
+@article{yu2023gpt,
+  title={Gpt paternity test: Gpt generated text detection with gpt genetic inheritance},
+  author={Yu, Xiao and Qi, Yuang and Chen, Kejiang and Chen, Guoqiang and Yang, Xi and Zhu, Pengyuan and Zhang, Weiming and Yu, Nenghai},
+  journal={arXiv preprint arXiv:2305.12519},
+  year={2023}
+}
+
+@article{liu2022coco,
+  title={Coco: Coherence-enhanced machine-generated text detection under data limitation with contrastive learning},
+  author={Liu, Xiaoming and Zhang, Zhaohan and Wang, Yichen and Pu, Hang and Lan, Yu and Shen, Chao},
+  journal={arXiv preprint arXiv:2212.10341},
+  year={2022}
+}
+
+@article{wu2023llmdet,
+  title={Llmdet: A large language models detection tool},
+  author={Wu, Kangxi and Pang, Liang and Shen, Huawei and Cheng, Xueqi and Chua, Tat-Seng},
+  journal={arXiv preprint arXiv:2305.15004},
+  year={2023}
+}
+
+@article{hu2023radar,
+  title={Radar: Robust ai-text detection via adversarial learning},
+  author={Hu, Xiaomeng and Chen, Pin-Yu and Ho, Tsung-Yi},
+  journal={Advances in Neural Information Processing Systems},
+  volume={36},
+  pages={15077--15095},
+  year={2023}
+}
+@inproceedings{cai2024decoupled,
+  title={Decoupled textual embeddings for customized image generation},
+  author={Cai, Yufei and Wei, Yuxiang and Ji, Zhilong and Bai, Jinfeng and Han, Hu and Zuo, Wangmeng},
+  booktitle={Proceedings of the AAAI Conference on Artificial Intelligence},
+  volume={38},
+  number={2},
+  pages={909--917},
+  year={2024}
+}