ChuanhuChatGPT集成百川大模型-编程知识

ChuanhuChatGPT集成百川大模型

搭建步骤：

拷贝本地模型：把下载好的 Baichuan2-7B-Chat 模型目录拷贝到 models 目录下。
修改 modules\models\base_model.py 文件：在 class ModelType 中增加 Baichuan 成员，并在根据模型名称判断模型类型的分支中增加 baichuan 的判断：

Baichuan = 16

elif "baichuan" in model_name_lower:

model_type = ModelType.Baichuan
修改 modules\models\models.py 文件：在 get_model 方法中增加 ModelType.Baichuan 分支：

elif model_type == ModelType.Baichuan:

from .Baichuan import Baichuan_Client

model = Baichuan_Client(model_name, user_name=user_name)

新增 modules\models\Baichuan.py 文件，内容如下：

from modelscope import snapshot_download, AutoModelForCausalLM, AutoTokenizer,GenerationConfig

from transformers import AutoModelForCausalLM, AutoTokenizer

from transformers.generation import GenerationConfig

import logging

import colorama

from ..index_func import *

from ..presets import *

from ..utils import *

from .base_model import BaseLLMModel

from ..presets import MODEL_METADATA

from datetime import datetime

class Baichuan_Client(BaseLLMModel):
    """Chat client that answers with a Baichuan causal language model.

    The tokenizer and the model are kept in the module-level globals
    ``CHATGLM_TOKENIZER`` and ``CHATGLM_MODEL`` and are loaded only when
    either of them is still ``None``.

    NOTE(review): these two globals are not defined in this file;
    presumably they are provided by ``from ..presets import *`` -- confirm.
    """

    def __init__(self, model_name, user_name="") -> None:
        """Initialise the base model and load the tokenizer/model if needed.

        Args:
            model_name: Name of the model. A sub-directory of ``models`` with
                this name is used when present; otherwise the model is
                fetched with ``snapshot_download`` as
                ``baichuan-inc/<model_name>``.
            user_name: Forwarded to the base class as ``user``.
        """
        super().__init__(model_name=model_name, user=user_name)
        # torch is imported lazily, only when a client is actually created.
        import torch
        from transformers import AutoTokenizer

        global CHATGLM_TOKENIZER, CHATGLM_MODEL
        print("__init__ Baichuan_Client")
        if CHATGLM_TOKENIZER is None or CHATGLM_MODEL is None:
            model_source = self._resolve_model_source(model_name)
            CHATGLM_TOKENIZER = AutoTokenizer.from_pretrained(
                model_source,
                device_map="auto",
                trust_remote_code=True,
                torch_dtype=torch.float16,
            )
            model = AutoModelForCausalLM.from_pretrained(
                model_source,
                device_map="auto",
                trust_remote_code=True,
                torch_dtype=torch.float16,
            )
            model.generation_config = GenerationConfig.from_pretrained(model_source)
            CHATGLM_MODEL = model.eval()

    @staticmethod
    def _resolve_model_source(model_name):
        """Return the local ``models/<model_name>`` path or a downloaded snapshot."""
        if os.path.exists("models") and model_name in os.listdir("models"):
            return f"models/{model_name}"
        return snapshot_download(f"baichuan-inc/{model_name}", revision='v1.0.4')

    @staticmethod
    def _timestamp():
        """Return the current local time formatted for the debug prints."""
        return datetime.now().strftime("%Y-%m-%d %H:%M:%S")

    def _get_glm_style_input(self):
        """Split ``self.history`` into earlier contents and the latest one.

        Returns:
            A ``(history, query)`` tuple: ``query`` is the ``content`` of the
            last entry of ``self.history`` and ``history`` is the list of
            ``content`` values of all entries before it.

        Raises:
            IndexError: If ``self.history`` is empty.
        """
        print("_get_glm_style_input")
        print(f"the history is: {self.history}")
        history = [x["content"] for x in self.history]
        query = history.pop()
        print(f"the message is: {query}")
        return history, query

    def _latest_user_messages(self):
        """Build the message list passed to the model's ``chat`` call.

        NOTE(review): only the latest query is sent; the earlier turns
        returned by ``_get_glm_style_input`` are not forwarded to the model.
        """
        _, query = self._get_glm_style_input()
        return [{'role': 'user', 'content': query}]

    def get_answer_at_once(self):
        """Generate the whole answer in a single ``chat`` call.

        Returns:
            A ``(response, length)`` tuple where ``length`` is
            ``len(response)``.
        """
        print("get_answer_at_once")
        messages = self._latest_user_messages()
        print("get_answer_at_once start" + "++++++++" + self._timestamp())
        response = CHATGLM_MODEL.chat(CHATGLM_TOKENIZER, messages)
        print("get_answer_at_once end" + "++++++++" + self._timestamp())
        print(f"the response is: {response}")
        return response, len(response)

    def get_answer_stream_iter(self):
        """Yield the answer incrementally as an accumulating string.

        Yields:
            The text accumulated so far after each piece obtained by
            iterating over the result of the ``chat`` call.
        """
        messages = self._latest_user_messages()
        result = ""
        print("get_answer_stream_iter start" + "++++++++" + self._timestamp())
        # NOTE(review): chat() is called without a streaming flag; if it
        # returns the complete reply as one string, this loop walks it one
        # character at a time -- confirm against the model's chat() code.
        for response in CHATGLM_MODEL.chat(CHATGLM_TOKENIZER, messages):
            print(f"the response is: {response}")
            result += response
            yield result
        print("get_answer_stream_iter end" + "++++++++" + self._timestamp())

“答案回调”开关用于控制调用 get_answer_at_once 方法还是 get_answer_stream_iter 方法。
执行效果

本文来自互联网用户投稿，该文观点仅代表作者本人，不代表本站立场。本站仅提供信息存储空间服务，不拥有所有权，不承担相关法律责任。如若转载，请注明出处：http://www.hqwc.cn/news/651906.html

如若内容造成侵权/违法违规/事实不符，请联系编程知识网进行投诉反馈email:809451989@qq.com，一经查实，立即删除！

ChuanhuChatGPT集成百川大模型

相关文章

MySQL双层游标嵌套循环方法

upload-labs通关

MySQL/MariaDB 如何查看当前的用户

笔记：编写程序，分别采用面向对象和 pyplot 快捷函数的方式绘制正弦曲线和余弦曲线。提示：使用 sin()或 cos()函数生成正弦值或余弦值。

美国洛杉矶站群服务器如何提高网站排名?

cocos-lua资源管理

Kotlin基础

【HarmonyOS】Stage 模型 - 基本概念

Docker基本操作 Linux里边操作

Centos/linux根目录扩容、分区、挂载。LVM、物理卷、逻辑卷

分布式版本控制系统——Git

javaScript基础2