diff --git a/.obsidian/workspace.json b/.obsidian/workspace.json index 8b2f6fe..20fcd2a 100644 --- a/.obsidian/workspace.json +++ b/.obsidian/workspace.json @@ -13,7 +13,7 @@ "state": { "type": "markdown", "state": { - "file": "Record/DL/CoT Prompt.md", + "file": "Record/DL/LLM.md", "mode": "source", "source": false } @@ -93,7 +93,7 @@ "state": { "type": "backlink", "state": { - "file": "Record/DL/CoT Prompt.md", + "file": "Record/DL/LLM.md", "collapseAll": false, "extraContext": false, "sortOrder": "alphabetical", @@ -110,7 +110,7 @@ "state": { "type": "outgoing-link", "state": { - "file": "Record/DL/CoT Prompt.md", + "file": "Record/DL/LLM.md", "linksCollapsed": false, "unlinkedCollapsed": true } @@ -133,7 +133,7 @@ "state": { "type": "outline", "state": { - "file": "Record/DL/CoT Prompt.md" + "file": "Record/DL/LLM.md" } } }, @@ -175,8 +175,9 @@ }, "active": "e144afbc26630891", "lastOpenFiles": [ - "Record/DL/Loss.md", "Record/DL/CoT Prompt.md", + "Record/DL/LLM.md", + "Record/DL/Loss.md", "Paper/Diffusion/Imagic.md", "Paper/Diffusion/MoMA.md", "Paper/Diffusion/Tutorial on Diffusion Models for Imaging and Vision.md", @@ -211,7 +212,6 @@ "Study/DL/吴恩达深度学习课程/Other.md", "Books/Java Guide/基础语法.md", "Books/Java并发编程/Java并发编程.md", - "Books/从零开始深入学习Spring/IoC.md", - "Books/Vim实用技巧/一、入门导读.md" + "Books/从零开始深入学习Spring/IoC.md" ] } \ No newline at end of file diff --git a/Record/DL/LLM.md b/Record/DL/LLM.md new file mode 100644 index 0000000..ed8bdad --- /dev/null +++ b/Record/DL/LLM.md @@ -0,0 +1,5 @@ +## 常见超参 +- temperature + 用于控制 LLM 输出的随机度。高热度更有创造性/难以预测,低热度则更为保守。 +- Top-P + 即核心采样(nucleus sampling),也是用于控制输出随机性的超参数。它设定了一个概率阈值,LLM 会选取累计概率超过该阈值的最佳词汇,然后 LLM 从这组词汇中随机抽取以生成输出。 \ No newline at end of file