ChatGLM-6B/web_demo2.py

from transformers import AutoModel, AutoTokenizer
import streamlit as st
from streamlit_chat import message


# Browser-tab title and icon for the demo page.
st.set_page_config(page_title="ChatGLM-6b 演示", page_icon=":robot:")


@st.cache_resource
def get_model():
    """Load the ChatGLM-6B tokenizer and model.

    The function is wrapped in ``st.cache_resource``. The model is converted
    with ``.half()``, moved with ``.cuda()`` and switched to eval mode before
    being returned.

    Returns:
        A ``(tokenizer, model)`` tuple.
    """
    checkpoint = "THUDM/chatglm-6b"
    tokenizer = AutoTokenizer.from_pretrained(checkpoint, trust_remote_code=True)
    model = AutoModel.from_pretrained(checkpoint, trust_remote_code=True)
    model = model.half().cuda().eval()
    return tokenizer, model


# Number of most recent history entries predict() keeps when it truncates.
MAX_TURNS = 20
# History length above which predict() truncates down to MAX_TURNS entries.
MAX_BOXES = 2 * MAX_TURNS


def predict(input, max_length, top_p, temperature, history=None):
    """Render the conversation and stream the model's reply to ``input``.

    Everything is drawn inside the module-level ``container``: the earlier
    (query, response) pairs from ``history``, the new user message, and then
    the reply, which is written into an ``st.empty()`` placeholder each time
    ``model.stream_chat`` yields.

    Args:
        input: Text of the new user message.
        max_length: Forwarded to ``model.stream_chat`` as ``max_length``.
        top_p: Forwarded to ``model.stream_chat`` as ``top_p``.
        temperature: Forwarded to ``model.stream_chat`` as ``temperature``.
        history: Earlier turns as (query, response) pairs; ``None`` is
            treated as an empty list.

    Returns:
        The history most recently yielded by ``model.stream_chat``; if it
        yielded nothing, the (possibly truncated) history that was passed in.
    """
    tokenizer, model = get_model()
    history = [] if history is None else history

    with container:
        # Once more than MAX_BOXES entries have accumulated, keep only the
        # newest MAX_TURNS of them.
        if len(history) > MAX_BOXES:
            history = history[-MAX_TURNS:]
        for turn_index, (past_query, past_reply) in enumerate(history):
            message(past_query, avatar_style="big-smile", key=f"{turn_index}_user")
            message(past_reply, avatar_style="bottts", key=str(turn_index))

        message(input, avatar_style="big-smile", key=f"{len(history)}_user")
        st.write("AI正在回复:")
        reply_slot = st.empty()
        with reply_slot:
            reply_stream = model.stream_chat(
                tokenizer,
                input,
                history,
                max_length=max_length,
                top_p=top_p,
                temperature=temperature,
            )
            # Each yield carries the updated history; its last entry holds
            # the reply generated so far.
            for _, history in reply_stream:
                _, latest_reply = history[-1]
                st.write(latest_reply)

    return history


# Container that predict() renders the conversation into. It is created
# before the input widgets below.
container = st.container()

# Text box holding the user's next message.
prompt_text = st.text_area(
    label="用户命令输入",
    height=100,
    placeholder="请在这儿输入您的命令",
)

# Generation settings from the sidebar, forwarded unchanged to predict().
max_length = st.sidebar.slider(
    'max_length', 0, 4096, 2048, step=1
)
top_p = st.sidebar.slider(
    'top_p', 0.0, 1.0, 0.6, step=0.01
)
# The lower bound is 0.01 rather than 0.0: sampling requires a strictly
# positive temperature, and Hugging Face's temperature warper raises
# ValueError otherwise, so a slider value of 0 would crash generation.
temperature = st.sidebar.slider(
    'temperature', 0.01, 1.0, 0.95, step=0.01
)

# Conversation history, kept in session state under the key 'state'.
if 'state' not in st.session_state:
    st.session_state['state'] = []

if st.button("发送", key="predict"):
    if prompt_text and prompt_text.strip():
        with st.spinner("AI正在思考，请稍等........"):
            # Generate the reply and store the updated history.
            st.session_state["state"] = predict(
                prompt_text, max_length, top_p, temperature, st.session_state["state"]
            )
    else:
        # Do not send an empty or whitespace-only prompt to the model.
        st.warning("请先输入内容再发送")
Create web_demo2.py Add a steamlit based demo web_demo2.py for better UI. need to install streamlit and streamlit-chat component fisrt: pip install streamlit pip install streamlit-chat then run with the following: streamlit run web_demo2.py --server.port 6006 2 years ago			`from transformers import AutoModel, AutoTokenizer`
			`import streamlit as st`
			`from streamlit_chat import message`
Add multi-gpu deployment 2 years ago
Create web_demo2.py. Add a Streamlit-based demo, web_demo2.py, for a better UI. Streamlit and the streamlit-chat component need to be installed first: `pip install streamlit` and `pip install streamlit-chat`. Then run it with: `streamlit run web_demo2.py --server.port 6006`. 2 years ago
			`st.set_page_config(`
			`page_title="ChatGLM-6b 演示",`
			`page_icon=":robot:"`
			`)`


			`@st.cache_resource`
			`def get_model():`
Add multi-gpu deployment 2 years ago			`tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)`
			`model = AutoModel.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True).half().cuda()`
			`model = model.eval()`
Create web_demo2.py Add a steamlit based demo web_demo2.py for better UI. need to install streamlit and streamlit-chat component fisrt: pip install streamlit pip install streamlit-chat then run with the following: streamlit run web_demo2.py --server.port 6006 2 years ago			`return tokenizer, model`


			`MAX_TURNS = 20`
			`MAX_BOXES = MAX_TURNS * 2`


update web_demo 2 years ago			`def predict(input, max_length, top_p, temperature, history=None):`
Create web_demo2.py Add a steamlit based demo web_demo2.py for better UI. need to install streamlit and streamlit-chat component fisrt: pip install streamlit pip install streamlit-chat then run with the following: streamlit run web_demo2.py --server.port 6006 2 years ago			`tokenizer, model = get_model()`
			`if history is None:`
			`history = []`

support stream chat 2 years ago			`with container:`
			`if len(history) > 0:`
Update web_demo2.py 当前MAX_BOXES与MAX_TURNS不生效导致单次对话不终止显存不断增加最后显存溢出问题，修改最大对话轮数和最大历史对话数量使其生效，逻辑为历史最大对话框记录轮数达到MAX_BOXES时截断历史对话为最近MAX_TURNS数。 2 years ago			`if len(history)>MAX_BOXES:`
			`history = history[-MAX_TURNS:]`
support stream chat 2 years ago			`for i, (query, response) in enumerate(history):`
			`message(query, avatar_style="big-smile", key=str(i) + "_user")`
			`message(response, avatar_style="bottts", key=str(i))`
Create web_demo2.py. Add a Streamlit-based demo, web_demo2.py, for a better UI. Streamlit and the streamlit-chat component need to be installed first: `pip install streamlit` and `pip install streamlit-chat`. Then run it with: `streamlit run web_demo2.py --server.port 6006`. 2 years ago
support stream chat 2 years ago			`message(input, avatar_style="big-smile", key=str(len(history)) + "_user")`
			`st.write("AI正在回复:")`
			`with st.empty():`
update web_demo 2 years ago			`for response, history in model.stream_chat(tokenizer, input, history, max_length=max_length, top_p=top_p,`
			`temperature=temperature):`
support stream chat 2 years ago			`query, response = history[-1]`
			`st.write(response)`
Create web_demo2.py. Add a Streamlit-based demo, web_demo2.py, for a better UI. Streamlit and the streamlit-chat component need to be installed first: `pip install streamlit` and `pip install streamlit-chat`. Then run it with: `streamlit run web_demo2.py --server.port 6006`. 2 years ago
			`return history`


support stream chat 2 years ago			`container = st.container()`

Create web_demo2.py Add a steamlit based demo web_demo2.py for better UI. need to install streamlit and streamlit-chat component fisrt: pip install streamlit pip install streamlit-chat then run with the following: streamlit run web_demo2.py --server.port 6006 2 years ago			`# create a prompt text for the text generation`
			`prompt_text = st.text_area(label="用户命令输入",`
			`height = 100,`
			`placeholder="请在这儿输入您的命令")`

update web_demo 2 years ago			`max_length = st.sidebar.slider(`
			`'max_length', 0, 4096, 2048, step=1`
			`)`
			`top_p = st.sidebar.slider(`
			`'top_p', 0.0, 1.0, 0.6, step=0.01`
			`)`
			`temperature = st.sidebar.slider(`
			`'temperature', 0.0, 1.0, 0.95, step=0.01`
			`)`
support stream chat 2 years ago
Create web_demo2.py Add a steamlit based demo web_demo2.py for better UI. need to install streamlit and streamlit-chat component fisrt: pip install streamlit pip install streamlit-chat then run with the following: streamlit run web_demo2.py --server.port 6006 2 years ago			`if 'state' not in st.session_state:`
			`st.session_state['state'] = []`

			`if st.button("发送", key="predict"):`
			`with st.spinner("AI正在思考，请稍等........"):`
			`# text generation`
Update web_demo2.py 当前MAX_BOXES与MAX_TURNS不生效导致单次对话不终止显存不断增加最后显存溢出问题，修改最大对话轮数和最大历史对话数量使其生效，逻辑为历史最大对话框记录轮数达到MAX_BOXES时截断历史对话为最近MAX_TURNS数。 2 years ago			`st.session_state["state"] = predict(prompt_text, max_length, top_p, temperature, st.session_state["state"])`