dc.contributor.author | Puerto, Haritz | |
dc.contributor.author | Chubakov, Tilek | |
dc.contributor.author | Zhu, Xiaodan | |
dc.contributor.author | Tayyar Madabushi, Harish | |
dc.contributor.author | Gurevych, Iryna | |
dc.date.accessioned | 2024-06-22T19:37:41Z | |
dc.date.available | 2024-06-22T19:37:41Z | |
dc.date.issued | 2024-06 | |
dc.identifier.uri | https://tudatalib.ulb.tu-darmstadt.de/handle/tudatalib/4272 | |
dc.description | LLaMA-2 13B-Chat model checkpoints for the paper "Fine-Tuning with Divergent Chains of Thought Boosts Reasoning Through Self-Correction in Language Models" | de_DE |
dc.language.iso | en | de_DE |
dc.rights | CC BY-SA 3.0 | |
dc.rights.uri | https://creativecommons.org/licenses/by-sa/3.0/ | |
dc.subject | LLM | de_DE |
dc.subject | large language model | de_DE |
dc.subject | NLP | de_DE |
dc.subject | chain of thought | de_DE |
dc.subject | cot | de_DE |
dc.subject.classification | 4.43-04 Künstliche Intelligenz und Maschinelle Lernverfahren | de_DE |
dc.subject.classification | 4.43-05 Bild- und Sprachverarbeitung, Computergraphik und Visualisierung, Human Computer Interaction, Ubiquitous und Wearable Computing | |
dc.subject.ddc | 004 | |
dc.title | LLaMA-2 13B-Chat Model checkpoints for Fine-Tuning with Divergent Chains of Thought Boosts Reasoning Through Self-Correction in Language Models | de_DE |
dc.type | Model | de_DE |
dc.description.version | 1.0 | de_DE |
tud.unit | TUDa | |
tud.history.classification | Version=2016-2020;409-05 Interaktive und intelligente Systeme, Bild- und Sprachverarbeitung, Computergraphik und Visualisierung | |