2024
Oedingen, Marc; Engelhardt, Raphael C.; Denz, Robin; Hammer, Maximilian; Konen, Wolfgang
ChatGPT Code Detection: Techniques for Uncovering the Source of Code Miscellaneous
2024.
Links | BibTeX | Schlagwörter: AI, ChatGPT, Code Detection, Large Language Models, machine learning
@misc{Oedingen2024,
title = {ChatGPT Code Detection: Techniques for Uncovering the Source of Code},
author = {Marc Oedingen and Raphael C. Engelhardt and Robin Denz and Maximilian Hammer and Wolfgang Konen},
url = {https://arxiv.org/abs/2405.15512},
year = {2024},
date = {2024-05-01},
urldate = {2024-01-01},
journal = {arXiv preprint arXiv:2405.15512},
keywords = {AI, ChatGPT, Code Detection, Large Language Models, machine learning},
pubstate = {published},
tppubtype = {misc}
}
Oedingen, Marc; Engelhardt, Raphael C.; Denz, Robin; Hammer, Maximilian; Konen, Wolfgang
ChatGPT Code Detection: Techniques for Uncovering the Source of Code Journal Article
In: AI, vol. 5, no. 3, S. 1066–1094, 2024, ISSN: 2673-2688.
Abstract | Links | BibTeX | Schlagwörter: AI, ChatGPT, Code Detection, Large Language Models, machine learning
@article{Oedingen2024_AI,
title = {ChatGPT Code Detection: Techniques for Uncovering the Source of Code},
author = {Marc Oedingen and Raphael C. Engelhardt and Robin Denz and Maximilian Hammer and Wolfgang Konen},
url = {https://www.mdpi.com/2673-2688/5/3/53},
doi = {10.3390/ai5030053},
issn = {2673-2688},
year = {2024},
date = {2024-05-01},
urldate = {2024-01-01},
journal = {AI},
volume = {5},
number = {3},
pages = {1066–1094},
abstract = {In recent times, large language models (LLMs) have made significant strides in generating computer code, blurring the lines between code created by humans and code produced by artificial intelligence (AI). As these technologies evolve rapidly, it is crucial to explore how they influence code generation, especially given the risk of misuse in areas such as higher education. The present paper explores this issue by using advanced classification techniques to differentiate between code written by humans and code generated by ChatGPT, a type of LLM. We employ a new approach that combines powerful embedding features (black-box) with supervised learning algorithms including Deep Neural Networks, Random Forests, and Extreme Gradient Boosting to achieve this differentiation with an impressive accuracy of 98%. For the successful combinations, we also examine their model calibration, showing that some of the models are extremely well calibrated. Additionally, we present white-box features and an interpretable Bayes classifier to elucidate critical differences between the code sources, enhancing the explainability and transparency of our approach. Both approaches work well, but provide at most 85–88% accuracy. Tests on a small sample of untrained humans suggest that humans do not solve the task much better than random guessing. This study is crucial in understanding and mitigating the potential risks associated with using AI in code generation, particularly in the context of higher education, software development, and competitive programming.},
keywords = {AI, ChatGPT, Code Detection, Large Language Models, machine learning},
pubstate = {published},
tppubtype = {article}
}
2015
Koch, Patrick; Wagner, Tobias; Emmerich, Michael T. M.; Bäck, Thomas; Konen, Wolfgang
Efficient multi-criteria optimization on noisy machine learning problems Journal Article
In: Applied Soft Computing, vol. 29, S. 357-370, 2015.
Links | BibTeX | Schlagwörter: CI, machine learning, optimization, parameter tuning, TDMR
@article{Koch14,
title = {Efficient multi-criteria optimization on noisy machine learning problems},
author = { Patrick Koch and Tobias Wagner and Michael T. M. Emmerich and Thomas Bäck and Wolfgang Konen},
url = {http://www.gm.fh-koeln.de/~konen/Publikationen/Koch2015a-ASOC.pdf},
doi = {https://doi.org/10.1016/j.asoc.2015.01.005},
year = {2015},
date = {2015-00-01},
journal = {Applied Soft Computing},
volume = {29},
pages = {357-370},
keywords = {CI, machine learning, optimization, parameter tuning, TDMR},
pubstate = {published},
tppubtype = {article}
}
2011
Konen, Wolfgang
Der SFA-Algorithmus für Klassifikation Technical Report
Research Center CIOP (Computational Intelligence, Optimization and Data Mining) Cologne University of Applied Science, Faculty of Computer Science and Engineering Science, no. 08/11, 2011, ISSN: 2191-365X.
Links | BibTeX | Schlagwörter: classification, machine learning, SFA, SOMA
@techreport{Kone11e,
title = {Der SFA-Algorithmus für Klassifikation},
author = { Wolfgang Konen},
url = {http://www.gm.fh-koeln.de/ciopwebpub/Konen11e.d/Konen11e.pdf},
issn = {2191-365X},
year = {2011},
date = {2011-11-01},
number = {08/11},
address = {Cologne University of Applied Science, Faculty of Computer Science and Engineering Science},
institution = {Research Center CIOP (Computational Intelligence, Optimization and Data Mining)},
keywords = {classification, machine learning, SFA, SOMA},
pubstate = {published},
tppubtype = {techreport}
}
Suchfeld
Oedingen, Marc; Engelhardt, Raphael C.; Denz, Robin; Hammer, Maximilian; Konen, Wolfgang
ChatGPT Code Detection: Techniques for Uncovering the Source of Code Miscellaneous
2024.
@misc{Oedingen2024,
title = {ChatGPT Code Detection: Techniques for Uncovering the Source of Code},
author = {Marc Oedingen and Raphael C. Engelhardt and Robin Denz and Maximilian Hammer and Wolfgang Konen},
url = {https://arxiv.org/abs/2405.15512},
year = {2024},
date = {2024-05-01},
urldate = {2024-01-01},
journal = {arXiv preprint arXiv:2405.15512},
keywords = {},
pubstate = {published},
tppubtype = {misc}
}
Oedingen, Marc; Engelhardt, Raphael C.; Denz, Robin; Hammer, Maximilian; Konen, Wolfgang
ChatGPT Code Detection: Techniques for Uncovering the Source of Code Journal Article
In: AI, vol. 5, no. 3, S. 1066–1094, 2024, ISSN: 2673-2688.
@article{Oedingen2024_AI,
title = {ChatGPT Code Detection: Techniques for Uncovering the Source of Code},
author = {Marc Oedingen and Raphael C. Engelhardt and Robin Denz and Maximilian Hammer and Wolfgang Konen},
url = {https://www.mdpi.com/2673-2688/5/3/53},
doi = {10.3390/ai5030053},
issn = {2673-2688},
year = {2024},
date = {2024-05-01},
urldate = {2024-01-01},
journal = {AI},
volume = {5},
number = {3},
pages = {1066–1094},
abstract = {In recent times, large language models (LLMs) have made significant strides in generating computer code, blurring the lines between code created by humans and code produced by artificial intelligence (AI). As these technologies evolve rapidly, it is crucial to explore how they influence code generation, especially given the risk of misuse in areas such as higher education. The present paper explores this issue by using advanced classification techniques to differentiate between code written by humans and code generated by ChatGPT, a type of LLM. We employ a new approach that combines powerful embedding features (black-box) with supervised learning algorithms including Deep Neural Networks, Random Forests, and Extreme Gradient Boosting to achieve this differentiation with an impressive accuracy of 98%. For the successful combinations, we also examine their model calibration, showing that some of the models are extremely well calibrated. Additionally, we present white-box features and an interpretable Bayes classifier to elucidate critical differences between the code sources, enhancing the explainability and transparency of our approach. Both approaches work well, but provide at most 85–88% accuracy. Tests on a small sample of untrained humans suggest that humans do not solve the task much better than random guessing. This study is crucial in understanding and mitigating the potential risks associated with using AI in code generation, particularly in the context of higher education, software development, and competitive programming.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Thill, Markus
Machine Learning and Deep Learning Approaches for Multivariate Time Series Prediction and Anomaly Detection PhD Thesis
Leiden University and TH Köln, 2022, (PhD thesis).
@phdthesis{Thill2022,
title = {Machine Learning and Deep Learning Approaches for Multivariate Time Series Prediction and Anomaly Detection},
author = {Markus Thill},
year = {2022},
date = {2022-03-01},
institution = {Institut für Informatik},
school = {Leiden University and TH Köln},
note = {PhD thesis},
keywords = {},
pubstate = {published},
tppubtype = {phdthesis}
}
Meissner, Simon
TH Köln -- University of Applied Sciences, 2021, (Bachelor thesis).
@mastersthesis{Meissner2021,
title = {Untersuchung des Spiel- und Lernerfolgs künstlicher Intelligenzen für ein nichtdeterministisches Spiel mit imperfekten Informationen: Blackjack in der Game-Learning-Umgebung ’General Board Game’ (GBG)},
author = {Simon Meissner},
url = {https://www.gm.fh-koeln.de/~konen/research/PaperPDF/BA-Meissner-final-2021.pdf},
year = {2021},
date = {2021-12-01},
urldate = {2021-12-01},
school = {TH Köln -- University of Applied Sciences},
note = {Bachelor thesis},
keywords = {},
pubstate = {published},
tppubtype = {mastersthesis}
}
Zeh, Tim
Untersuchung von allgemeinen KI-Agenten für das Spiel Poker im General Board Games Framework Masters Thesis
TH Köln -- University of Applied Sciences, 2021, (Master thesis).
@mastersthesis{Zeh2021,
title = {Untersuchung von allgemeinen KI-Agenten für das Spiel Poker im General Board Games Framework},
author = {Tim Zeh},
url = {http://www.gm.fh-koeln.de/~konen/research/PaperPDF/MA_Zeh_final_Poker-GBG-2021.pdf},
year = {2021},
date = {2021-01-01},
school = {TH Köln -- University of Applied Sciences},
note = {Master thesis},
keywords = {},
pubstate = {published},
tppubtype = {mastersthesis}
}
Scheiermann, Johannes
AlphaZero-inspirierte KI-Agenten im General Board Game Playing Masters Thesis
TH Köln -- University of Applied Sciences, 2020, (Bachelor thesis).
@mastersthesis{Scheier2020b,
title = {AlphaZero-inspirierte KI-Agenten im General Board Game Playing},
author = {Johannes Scheiermann},
url = {http://www.gm.fh-koeln.de/~konen/research/PaperPDF/BA_Scheiermann_final.pdf},
year = {2020},
date = {2020-12-01},
school = {TH Köln -- University of Applied Sciences},
note = {Bachelor thesis},
keywords = {},
pubstate = {published},
tppubtype = {mastersthesis}
}
Bagheri, Samineh
Self-Adjusting Surrogate-Assisted Optimization Techniques for Expensive Constrained Black Box Problems PhD Thesis
Leiden University and TH Köln, 2020, (PhD thesis, TH Köln dissertation price 2020).
@phdthesis{Bagheri2020,
title = {Self-Adjusting Surrogate-Assisted Optimization Techniques for Expensive Constrained Black Box Problems},
author = {Samineh Bagheri},
year = {2020},
date = {2020-04-01},
urldate = {2020-04-01},
institution = {Institut für Informatik},
school = {Leiden University and TH Köln},
note = {PhD thesis, TH Köln dissertation price 2020},
keywords = {},
pubstate = {published},
tppubtype = {phdthesis}
}
Scheiermann, Johannes
Sind (trainierte) General-Purpose-RL-Agenten im Brettspiel Othello stärker als (untrainierte) General-Game-Playing Agenten? Technical Report
TH Köln, Institut für Informatik 2020, (Praxisprojekt).
@techreport{Scheier2020,
title = {Sind (trainierte) General-Purpose-RL-Agenten im Brettspiel Othello stärker als (untrainierte) General-Game-Playing Agenten?},
author = {Johannes Scheiermann},
url = {http://www.gm.fh-koeln.de/~konen/research/PaperPDF/INF-Prj-Scheiermann-2020-08.pdf},
year = {2020},
date = {2020-01-01},
institution = {TH Köln, Institut für Informatik},
note = {Praxisprojekt},
keywords = {},
pubstate = {published},
tppubtype = {techreport}
}
Barsnick, Felix
Implementierung und Untersuchung eines Turniersystems für KI-Agenten in Brettspielen Masters Thesis
TH Köln -- University of Applied Sciences, 2019, (Master thesis).
@mastersthesis{Barsnick2019,
title = {Implementierung und Untersuchung eines Turniersystems für KI-Agenten in Brettspielen},
author = {Felix Barsnick},
url = {http://www.gm.fh-koeln.de/~konen/research/PaperPDF/MA_MMI_Barsnick-2019-04-final.pdf},
year = {2019},
date = {2019-01-01},
institution = {Institut für Informatik},
school = {TH Köln -- University of Applied Sciences},
note = {Master thesis},
keywords = {},
pubstate = {published},
tppubtype = {mastersthesis}
}
Scholzen, Jordan
TH Köln -- University of Applied Sciences, 2019, (Bachelor thesis, 1st prize in Opitz innovation award 2020).
@mastersthesis{Scholzen2019,
title = {Künstliche Intelligenz in der Kompositionslehre – Eine Untersuchung von Long-Short-Term-Memory-Netzen zur Analyse von Kontrapunkten nach Fux},
author = {Jordan Scholzen},
url = {http://www.gm.fh-koeln.de/~konen/research/PaperPDF/BA-Scholzen-2019-12-06-final.pdf},
year = {2019},
date = {2019-01-01},
institution = {Institut für Informatik},
school = {TH Köln -- University of Applied Sciences},
note = {Bachelor thesis, 1st prize in Opitz innovation award 2020},
keywords = {},
pubstate = {published},
tppubtype = {mastersthesis}
}