「日拱一码」071 机器学习——大语言模型LLM-EW帮帮网

from transformers import AutoTokenizer, AutoModel
import torch


class LocalChatGLM:
    """Thin wrapper around a locally loaded ChatGLM checkpoint.

    The constructor loads a tokenizer and a model via ``transformers``;
    :meth:`chat` forwards one user turn to the model's own ``chat`` method.
    """

    def __init__(self, model_path="THUDM/chatglm3-6b"):
        """Load the tokenizer and the model.

        Args:
            model_path: Identifier or path handed to ``from_pretrained`` for
                both the tokenizer and the model.
        """
        print("正在加载本地模型...")
        # NOTE: trust_remote_code=True allows code shipped with the model
        # repository to run; only point model_path at sources you trust.
        self.tokenizer = AutoTokenizer.from_pretrained(
            model_path,
            trust_remote_code=True,
            revision="main"  # use the main branch
        )
        self.model = AutoModel.from_pretrained(
            model_path,
            trust_remote_code=True,
            revision="main",
            torch_dtype=torch.float16  # half precision to reduce memory use
        ).cuda()  # run on the GPU

        print("模型加载完成！")

    def chat(self, prompt, history=None):
        """Send one prompt to the model and return its reply.

        Args:
            prompt: The user's message for this turn.
            history: Conversation history, normally the second element
                returned by the previous call. ``None`` (the default) starts
                a new conversation.

        Returns:
            A ``(response, updated_history)`` tuple exactly as produced by
            the underlying ``self.model.chat`` call.
        """
        # Build a fresh list on every call. A mutable default (``history=[]``)
        # is created once and shared by all calls that omit the argument, so
        # a backend that appends to it would leak turns between conversations.
        if history is None:
            history = []
        response, updated_history = self.model.chat(
            self.tokenizer,
            prompt,
            history=history,
            temperature=0.7
        )
        return response, updated_history


# 使用示例
def local_model_example():
    """Run an interactive console chat against a locally loaded model.

    Loads ``LocalChatGLM`` and then reads prompts from standard input until
    the user types an exit command ('退出', 'exit' or 'quit'), input ends, or
    a chat call fails. Each reply is printed and the returned history is fed
    into the next turn.
    """
    # Only the load step is covered by the "load failed" handler, so that
    # later chat-time problems are not misreported as loading problems.
    try:
        # Use a smaller model or one already downloaded locally.
        chatglm = LocalChatGLM("THUDM/chatglm3-6b")
    except Exception as e:
        print(f"加载模型失败: {e}")
        print("请尝试先下载模型到本地，或者使用API方案")
        return

    history = []
    while True:
        try:
            user_input = input("\n你: ")
        except (EOFError, KeyboardInterrupt):
            # End of input or Ctrl-C: finish the session quietly.
            break

        command = user_input.strip().lower()
        if command in ('退出', 'exit', 'quit'):
            break
        if not command:
            # Nothing was typed; ask again instead of querying the model.
            continue

        try:
            response, history = chatglm.chat(user_input, history)
        except Exception as e:
            print(f"对话出错: {e}")
            break
        print(f"AI: {response}")

# Start the interactive demo only when this file is executed as a script, so
# importing the module does not load the model or block on input().
if __name__ == "__main__":
    local_model_example()

「日拱一码」071 机器学习——大语言模型LLM

大语言模型（LLM）核心介绍

1. 什么是大语言模型？

核心特征

2. 技术基础：Transformer架构

3. 发展历程中的关键模型

4. 两种主要模式

5. 应用领域

代码示例

使用本地运行的轻量级模型（ChatGLM3-6B）

网站公告

今日签到

热门文章

最新发布