```python
import os
from typing import List, Optional, Tuple

import gradio as gr
from transformers import HfArgumentParser

from deep_training.data_helper import ModelArguments, TrainingArguments, DataArguments
from deep_training.nlp.models.chatglm import setup_model_profile, ChatGLMConfig
from deep_training.nlp.models.lora.v2 import LoraArguments

from data_utils import train_info_args, NN_DataHelper
from models import MyTransformer, ChatGLMTokenizer
from webui.context import ctx
from webui.device import torch_gc

css = "style.css"
script_path = "scripts"
# Keep a reference to Gradio's original TemplateResponse so reload_javascript()
# can wrap it later and inject custom <script> tags into every rendered page.
_gradio_template_response_orig = gr.routes.templates.TemplateResponse


# Load the model
train_info_args['seed'] = None
parser = HfArgumentParser((ModelArguments, TrainingArguments, DataArguments, LoraArguments))
model_args, training_args, data_args, _ = parser.parse_dict(train_info_args)

setup_model_profile()
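# (setup_model_profile() is deep_training's global ChatGLM setup hook; in the
#  upstream examples it always runs before the model is constructed.)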

dataHelper = NN_DataHelper(model_args, training_args, data_args)
tokenizer: ChatGLMTokenizer
tokenizer, _, _, _ = dataHelper.load_tokenizer_and_config(tokenizer_class_name=ChatGLMTokenizer, config_class_name=ChatGLMConfig)

# Config, LoRA arguments, and LoRA weights should all come from the same
# checkpoint directory ('./last_ckpt' here, or './best_ckpt' if preferred).
config = ChatGLMConfig.from_pretrained('./last_ckpt')
# config = ChatGLMConfig.from_pretrained('./best_ckpt')
config.initializer_weight = False

lora_args = LoraArguments.from_pretrained('./last_ckpt')
# lora_args = LoraArguments.from_pretrained('./best_ckpt')
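
# Sanity check: this script expects a LoRA checkpoint exported for inference,
# not a P-Tuning v2 one (pre_seq_len is only set when P-Tuning v2 is used).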
assert lora_args.inference_mode and config.pre_seq_len is None

pl_model = MyTransformer(config=config, model_args=model_args, training_args=training_args, lora_args=lora_args)
# Load the LoRA weights into the backbone
pl_model.backbone.from_pretrained(pl_model.backbone.model, pretrained_model_name_or_path='./last_ckpt',
                                  lora_config=lora_args)
# pl_model.backbone.from_pretrained(pl_model.backbone.model, pretrained_model_name_or_path='./best_ckpt', lora_config=lora_args)

model = pl_model.get_glm_model()
# Adjust as needed: fp16 on GPU here
model.half().cuda()
model = model.eval()
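# If GPU memory is tight, ChatGLM checkpoints that ship quantization support
# can instead be loaded as e.g. model.half().quantize(4).cuda()
# (quantize(4) is an assumption; verify your checkpoint supports it).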


def infer(query,
          history: Optional[List[Tuple]],
          max_length, top_p, temperature):
    # if cmd_opts.ui_dev:
    #     return "hello", "hello, dev mode!"

    if model is None:
        raise RuntimeError("Model not loaded")

    if history is None:
        history = []
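    # ChatGLM's chat() takes history as a list of (query, response) tuples,
    # folds it into the prompt, and returns the response plus updated history.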
    output, history = model.chat(
        tokenizer, query=query, history=history,
        max_length=max_length,
        top_p=top_p,
        temperature=temperature
    )
    print(output)
    torch_gc()
    return query, output


def predict(query, max_length, top_p, temperature):
    ctx.limit_round()
    _, output = infer(
        query=query,
        history=ctx.history,
        max_length=max_length,
        top_p=top_p,
        temperature=temperature
    )
    ctx.append(query, output)
    torch_gc()
    # The empty string clears the input textbox
    return ctx.history, ""


def clear_history():
    ctx.clear()
    return gr.update(value=[])


def apply_max_round_click(max_round):
    ctx.max_rounds = max_round


def reload_javascript():
    scripts_list = [os.path.join(script_path, i) for i in os.listdir(script_path) if i.endswith(".js")]
    javascript = ""
    # with open("script.js", "r", encoding="utf8") as js_file:
    #     javascript = f'<script>{js_file.read()}</script>'

    for path in scripts_list:
        with open(path, "r", encoding="utf8") as js_file:
            javascript += f"\n<script>{js_file.read()}</script>"

    # todo: theme
    # if cmd_opts.theme is not None:
    #     javascript += f"\n<script>set_theme('{cmd_opts.theme}');</script>\n"

    # Monkey-patch Gradio's TemplateResponse so every rendered page gets the
    # collected <script> tags injected just before </head>.
    def template_response(*args, **kwargs):
        res = _gradio_template_response_orig(*args, **kwargs)
        res.body = res.body.replace(
            b'</head>', f'{javascript}</head>'.encode("utf8"))
        res.init_headers()
        return res

    gr.routes.templates.TemplateResponse = template_response


def main():
    # Build the UI
    reload_javascript()

    with gr.Blocks(css=css, analytics_enabled=False) as chat_interface:
        prompt = "Type your message..."
        with gr.Row():
            with gr.Column(scale=3):
                gr.Markdown("""<h2><center>ChatGLM WebUI</center></h2>""")
                with gr.Row():
                    with gr.Column(variant="panel"):
                        with gr.Row():
                            max_length = gr.Slider(minimum=4, maximum=4096, step=4, label='Max Length', value=2048)
                            top_p = gr.Slider(minimum=0.01, maximum=1.0, step=0.01, label='Top P', value=0.7)
                        with gr.Row():
                            temperature = gr.Slider(minimum=0.01, maximum=1.0, step=0.01, label='Temperature',
                                                    value=0.95)

                        with gr.Row():
                            max_rounds = gr.Slider(minimum=1, maximum=100, step=1,
                                                   label="Max conversation rounds (lowering this markedly reduces GPU OOM, at the cost of context)",
                                                   value=20)
                            apply_max_rounds = gr.Button("✔", elem_id="del-btn")

                with gr.Row():
                    with gr.Column(variant="panel"):
                        with gr.Row():
                            clear = gr.Button("Clear conversation (context)")

                        with gr.Row():
                            save_his_btn = gr.Button("Save conversation")
                            load_his_btn = gr.UploadButton("Load conversation", file_types=['file'], file_count='single')

            with gr.Column(scale=7):
                chatbot = gr.Chatbot(elem_id="chat-box", show_label=False).style(height=800)
                with gr.Row():
                    input_message = gr.Textbox(placeholder=prompt, show_label=False, lines=2, elem_id="chat-input")
                    clear_input = gr.Button("Clear input")  # label assumed: the source is cut off mid-line here
```
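
The listing breaks off at this point: the event wiring and the app launch never appear. Below is a minimal sketch of the missing tail, assuming the component names above and the Gradio 3.x event API; handlers for `save_his_btn` and `load_his_btn` are omitted because the source never shows how `ctx` serializes history.

```python
        # ...continuing inside `with gr.Blocks(...) as chat_interface:`
        input_message.submit(
            predict,
            inputs=[input_message, max_length, top_p, temperature],
            outputs=[chatbot, input_message],  # predict() returns (history, "")
        )
        clear_input.click(lambda: "", outputs=[input_message])
        clear.click(clear_history, outputs=[chatbot])
        apply_max_rounds.click(apply_max_round_click, inputs=[max_rounds])

    chat_interface.launch()


if __name__ == "__main__":
    main()
```

With this tail in place the script runs end to end: once './last_ckpt' holds the exported LoRA checkpoint, running it starts a local Gradio server serving the chat UI.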