Setup steps:
- Copy the local model: place the downloaded Baichuan2-7B-Chat folder under the models directory (a quick check follows below).
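If the folder is in place, the client added later in these steps will load it locally instead of downloading from ModelScope. A minimal sanity check, run from the project root (the path below assumes the default folder name):

```python
import os

# Quick sanity check: the loader below looks for models/<model_name>,
# so the folder name must match the model name exactly.
model_dir = os.path.join("models", "Baichuan2-7B-Chat")
print(("found: " if os.path.isdir(model_dir) else "missing: ") + model_dir)
```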
- Modify modules\models\base_model.py: add a Baichuan entry to class ModelType, and map model names containing "baichuan" to it (a context sketch follows below):

```python
# New member in class ModelType:
Baichuan = 16

# New branch in the model-name detection chain in the same file:
elif "baichuan" in model_name_lower:
    model_type = ModelType.Baichuan
```
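For orientation, the new elif lands inside ModelType's name-detection logic. The sketch below is illustrative only; the surrounding branches and the fallback are assumptions, not copied from the real base_model.py:

```python
# Illustrative sketch: only the "baichuan" branch comes from this setup,
# the rest is an assumed outline of the detection method.
@classmethod
def get_type(cls, model_name: str):
    model_type = None
    model_name_lower = model_name.lower()
    if "gpt" in model_name_lower:          # assumed existing branch
        model_type = ModelType.OpenAI
    elif "baichuan" in model_name_lower:   # the branch added in this step
        model_type = ModelType.Baichuan
    else:
        model_type = ModelType.Unknown     # assumed fallback
    return model_type
```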
- Modify modules\models\models.py: in the get_model function, add a branch for ModelType.Baichuan:

```python
elif model_type == ModelType.Baichuan:
    from .Baichuan import Baichuan_Client
    model = Baichuan_Client(model_name, user_name=user_name)
```
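Note that Baichuan_Client is imported inside the branch rather than at the top of models.py. This lazy import means torch, modelscope, and the other Baichuan dependencies are only pulled in when a Baichuan model is actually selected, so the remaining model backends keep working even if those packages are not installed.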
- Add a new file modules\models\Baichuan.py:

```python
from modelscope import snapshot_download
from transformers import AutoModelForCausalLM, AutoTokenizer
from transformers.generation import GenerationConfig
import logging
import colorama
import os
from datetime import datetime

from ..index_func import *
from ..presets import *
from ..utils import *
from .base_model import BaseLLMModel

# Module-level cache so the model is only loaded once per process.
CHATGLM_TOKENIZER = None
CHATGLM_MODEL = None


class Baichuan_Client(BaseLLMModel):
    def __init__(self, model_name, user_name="") -> None:
        super().__init__(model_name=model_name, user=user_name)
        import torch

        global CHATGLM_TOKENIZER, CHATGLM_MODEL
        print("__init__ Baichuan_Client")
        if CHATGLM_TOKENIZER is None or CHATGLM_MODEL is None:
            # Prefer a local copy under models/; otherwise download from ModelScope.
            model_path = None
            if os.path.exists("models"):
                model_dirs = os.listdir("models")
                if model_name in model_dirs:
                    model_path = f"models/{model_name}"
            if model_path is not None:
                model_source = model_path
            else:
                model_source = snapshot_download(
                    f"baichuan-inc/{model_name}", revision="v1.0.4")
            CHATGLM_TOKENIZER = AutoTokenizer.from_pretrained(
                model_source, trust_remote_code=True)
            quantified = "int4" in model_name  # currently unused
            model = AutoModelForCausalLM.from_pretrained(
                model_source, device_map="auto",
                trust_remote_code=True, torch_dtype=torch.float16)
            model.generation_config = GenerationConfig.from_pretrained(model_source)
            model = model.eval()
            CHATGLM_MODEL = model

    def _get_glm_style_input(self):
        # The last history entry is the current user message; prior turns are
        # returned as history but only the query is sent to the model below.
        print("_get_glm_style_input")
        print(f"the history is: {self.history}")
        history = [x["content"] for x in self.history]
        query = history.pop()
        print(f"the message is: {query}")
        return history, query

    def get_answer_at_once(self):
        print("get_answer_at_once")
        history, query = self._get_glm_style_input()
        messages = [{"role": "user", "content": query}]
        now = datetime.now()
        print("get_answer_at_once start" + "++++++++" + now.strftime("%Y-%m-%d %H:%M:%S"))
        response = CHATGLM_MODEL.chat(CHATGLM_TOKENIZER, messages)
        now = datetime.now()
        print("get_answer_at_once end" + "++++++++" + now.strftime("%Y-%m-%d %H:%M:%S"))
        print(f"the response is: {response}")
        return response, len(response)

    def get_answer_stream_iter(self):
        history, query = self._get_glm_style_input()
        messages = [{"role": "user", "content": query}]
        result = ""
        now = datetime.now()
        print("get_answer_stream_iter start" + "++++++++" + now.strftime("%Y-%m-%d %H:%M:%S"))
        # chat() returns the finished answer as a string; iterating over it
        # yields one character at a time, giving the UI a pseudo-stream.
        for response in CHATGLM_MODEL.chat(CHATGLM_TOKENIZER, messages):
            result += response
            yield result
        now = datetime.now()
        print("get_answer_stream_iter end" + "++++++++" + now.strftime("%Y-%m-%d %H:%M:%S"))
```
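Before wiring the client into the UI, you can verify that the model loads and answers on its own. A minimal standalone sketch (it assumes the same models/ layout as above and falls back to ModelScope; the use_fast=False flag follows the official Baichuan2 usage example):

```python
import os
import torch
from modelscope import snapshot_download
from transformers import AutoModelForCausalLM, AutoTokenizer
from transformers.generation import GenerationConfig

# Load from the local copy if present, otherwise fetch from ModelScope.
model_dir = "models/Baichuan2-7B-Chat"
if not os.path.isdir(model_dir):
    model_dir = snapshot_download("baichuan-inc/Baichuan2-7B-Chat", revision="v1.0.4")

tokenizer = AutoTokenizer.from_pretrained(model_dir, use_fast=False, trust_remote_code=True)
model = AutoModelForCausalLM.from_pretrained(
    model_dir, device_map="auto", torch_dtype=torch.float16, trust_remote_code=True)
model.generation_config = GenerationConfig.from_pretrained(model_dir)

messages = [{"role": "user", "content": "你好"}]
print(model.chat(tokenizer, messages))
```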
- The answer streaming switch controls which method is invoked: get_answer_at_once returns one complete reply, while get_answer_stream_iter yields incremental output (an illustrative dispatch sketch follows below).
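The dispatch itself lives in the base model's predict path. The sketch below is illustrative only; the real attribute and method names in base_model.py may differ:

```python
# Illustrative only: not the actual base_model.py source.
def predict(self, query, stream=False):
    if stream:
        # Incremental updates: each yielded value is the answer so far.
        for partial in self.get_answer_stream_iter():
            yield partial
    else:
        # One-shot: the full answer plus a length count.
        answer, length = self.get_answer_at_once()
        yield answer
```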
- Execution result