import asyncio
import logging
import os
import re  # needed by CustomOutputParser.parse below
import time
from datetime import datetime, timedelta
from typing import Dict, List, Union

import humanize

from langchain import PromptTemplate, LLMChain, ConversationChain
from langchain.memory import ConversationBufferMemory, ReadOnlySharedMemory, CombinedMemory, ConversationSummaryMemory
from langchain.chains.base import Chain
from langchain.document_loaders import TextLoader
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.embeddings import SentenceTransformerEmbeddings
from langchain.vectorstores import Chroma
from langchain.agents import Tool, AgentExecutor, LLMSingleActionAgent, AgentOutputParser, ZeroShotAgent
from langchain.schema import AgentAction, AgentFinish
from langchain.schema import AIMessage, HumanMessage, SystemMessage, ChatMessage
from langchain.utilities import OpenWeatherMapAPIWrapper, SearxSearchWrapper, PythonREPL
from langchain.utilities.duckduckgo_search import DuckDuckGoSearchAPIWrapper

from .prompts import *
from .langchain_memory import CustomMemory  # BotConversationSummaryBufferWindowMemory, TestMemory
from ..utilities.messages import Message

logger = logging.getLogger(__name__)

class RoleplayChain(Chain):
    llm_chain: LLMChain

    character_name: str
    persona: str
    scenario: str
    ai_name_chat: str
    human_name_chat: str

    output_key: str = "output_text"  #: :meta private:

    @property
    def input_keys(self) -> List[str]:
        return ["character_name", "persona", "scenario", "ai_name_chat", "human_name_chat", "llm_chain"]

    @property
    def output_keys(self) -> List[str]:
        return [self.output_key]

    def _call(self, inputs: Dict[str, str]) -> Dict[str, str]:
        other_keys = {k: v for k, v in inputs.items() if k not in self.input_keys}
        result = self.llm_chain.predict(**other_keys)
        return {self.output_key: result}

class CustomOutputParser(AgentOutputParser):

    def parse(self, llm_output: str) -> Union[AgentAction, AgentFinish]:
        # Check if agent should finish
        if "Final Answer:" in llm_output:
            return AgentFinish(
                # Return values is generally always a dictionary with a single `output` key
                # It is not recommended to try anything else at the moment :)
                return_values={"output": llm_output.split("Final Answer:")[-1].strip()},
                log=llm_output,
            )
        # Parse out the action and action input
        regex = r"Action\s*\d*\s*:(.*?)\nAction\s*\d*\s*Input\s*\d*\s*:[\s]*(.*)"
        match = re.search(regex, llm_output, re.DOTALL)
        if not match:
            regex = r"Action\s*\d*\s*:(.*?)[\s]*[\"\'](.*)[\"\']"
            match = re.search(regex, llm_output, re.DOTALL)
        if not match:
            raise ValueError(f"Could not parse LLM output: `{llm_output}`")
        action = match.group(1).strip()
        action_input = match.group(2)
        # Return the action and action input
        return AgentAction(tool=action, tool_input=action_input.strip(" ").strip('"'), log=llm_output)

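# Illustrative examples of the text parse() expects (not taken from real model output):
#
#   "Thought: I need current data\nAction: Search\nAction Input: population of Canada"
#     -> AgentAction(tool="Search", tool_input="population of Canada")
#
#   "Final Answer: About 39 million people."
#     -> AgentFinish(return_values={"output": "About 39 million people."})
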
class AI(object):

    def __init__(self, bot, text_wrapper, image_wrapper, memory_path: str):
        self.name = bot.name
        self.bot = bot
        self.memory_path = memory_path
        self.rooms = {}

        from ..wrappers.langchain_koboldcpp import KoboldCpp
        self.llm_chat = KoboldCpp(temperature=self.bot.temperature, endpoint_url="http://172.16.85.10:5001/api/latest/generate", stop=['<|endoftext|>'])
        self.llm_summary = KoboldCpp(temperature=0.2, endpoint_url="http://172.16.85.10:5002/api/latest/generate", stop=['<|endoftext|>'], max_tokens=512)

        self.text_wrapper = text_wrapper
        self.image_wrapper = image_wrapper

        self.embeddings = SentenceTransformerEmbeddings()
        #embeddings = SentenceTransformerEmbeddings(model="all-MiniLM-L6-v2")
        self.db = Chroma(persist_directory=os.path.join(self.memory_path, 'chroma-db'), embedding_function=self.embeddings)

        #self.memory = BotConversationSummaryBufferWindowMemory(llm=self.llm_summary, max_token_limit=1200, min_token_limit=200)

    def get_memory(self, room_id, human_prefix="Human"):
        if room_id not in self.rooms:
            self.rooms[room_id] = {}
            memory = CustomMemory(memory_key="chat_history", input_key="input", human_prefix=human_prefix, ai_prefix=self.bot.name, llm=self.llm_summary, summary_prompt=prompt_progressive_summary, max_len=1200, min_len=200)
            self.rooms[room_id]["memory"] = memory
            self.rooms[room_id]["summary"] = "No previous events."
            memory.chat_memory.add_ai_message(self.bot.greeting)
            #memory.save_context({"input": None, "output": self.bot.greeting})
            memory.load_memory_variables({})
        else:
            memory = self.rooms[room_id]["memory"]
            #print(f"memory: {memory.load_memory_variables({})}")
            #print(f"memory has an estimated {self.llm_chat.get_num_tokens(memory.buffer)} number of tokens")
        return memory

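    # Hypothetical usage: each Matrix room gets its own CustomMemory, keyed by room_id, e.g.
    #   memory = ai.get_memory("!abc123:example.org", human_prefix="Alice")
    # Repeated calls with the same room_id return the cached instance from self.rooms.
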
    async def add_chat_message(self, message):
        conversation_memory = self.get_memory(message.room_id)
        langchain_message = message.to_langchain()
        if message.user_id == self.bot.connection.user_id:
            langchain_message.role = self.bot.name
        conversation_memory.chat_memory.messages.append(langchain_message)

    async def clear(self, room_id):
        conversation_memory = self.get_memory(room_id)
        conversation_memory.clear()

    async def ingest_textfile(self, filename, category):
        loader = TextLoader(filename)
        documents = loader.load()
        documents[0].metadata['indexed'] = datetime.now().strftime('%Y-%m-%d %H:%M:%S')
        documents[0].metadata['category'] = category

        text_splitter = RecursiveCharacterTextSplitter(
            # Set a really small chunk size, just to show.
            chunk_size = 1024,
            chunk_overlap = 80,
            length_function = len,
            #length_function = self.llm_chat.get_num_tokens, # the embeddings are generated with SentenceTransformers, not this model
        )

        docs = text_splitter.split_documents(documents)

        for i in range(len(docs)):
            docs[i].metadata['part'] = f"{i}/{len(docs)}"

        print(f"Indexing {len(docs)} documents")
        texts = [doc.page_content for doc in docs]
        metadatas = [doc.metadata for doc in docs]
        self.db.add_texts(texts=texts, metadatas=metadatas, ids=None)
        self.db.persist()

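    # Hypothetical usage, assuming a plain-text file on disk:
    #   await ai.ingest_textfile("data/wikipedia_germany.txt", category="wiki")
    # Each chunk is stored in Chroma with 'indexed', 'category' and 'part' metadata,
    # so it can later be narrowed by category in search_vectordb().
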
    async def search_vectordb(self, query, category):
        #query = "How is climate in Germany?"
        #retriever = db.as_retriever()
        #docs = retriever.get_relevant_documents(query)
        if category:
            #https://github.com/chroma-core/chroma/blob/main/examples/where_filtering.ipynb
            output_docs = self.db.similarity_search_with_score(query, filter={"category": category})
        else:
            output_docs = self.db.similarity_search_with_score(query)

        print(query)
        print('###')
        for doc, score in output_docs:
            print("-" * 80)
            print("Score: ", score)
            #print(doc.page_content)
            print(doc)
        print("-" * 80)

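    # Hypothetical usage:
    #   await ai.search_vectordb("How is the climate in Germany?", category="wiki")
    # With a category, the Chroma query is restricted via the metadata `filter`;
    # without one, the whole collection is searched. For distance-based metrics,
    # lower scores mean closer matches.
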
    async def generate(self, message, reply_fn, typing_fn):
        prompt_template = "{input}"
        chain = LLMChain(
            llm=self.llm_chat,
            prompt=PromptTemplate.from_template(prompt_template),
        )
        output = await chain.arun(message.message)
        return output.strip()

    async def generate_roleplay(self, message, reply_fn, typing_fn):
        chat_ai_name = self.bot.name
        chat_human_name = message.additional_kwargs['user_name']
        room_id = message.additional_kwargs['room_id']

        if False: # model is vicuna
            chat_ai_name = "### Assistant"
            chat_human_name = "### Human"

        conversation_memory = self.get_memory(room_id, chat_human_name)
        conversation_memory.human_prefix = chat_human_name
        readonlymemory = ReadOnlySharedMemory(memory=conversation_memory)
        summary_memory = ConversationSummaryMemory(llm=self.llm_summary, memory_key="summary", input_key="input")
        #combined_memory = CombinedMemory(memories=[conversation_memory, summary_memory])

        k = 1      # 5
        max_k = 3  # 12
        if len(conversation_memory.chat_memory.messages) > max_k*2:

            async def make_progressive_summary(previous_summary, chat_history_text_string):
                await asyncio.sleep(0)  # yield for matrix-nio
                #self.rooms[room_id]["summary"] = summary_memory.predict_new_summary(conversation_memory.chat_memory.messages, previous_summary).strip()
                summary_chain = LLMChain(llm=self.llm_summary, prompt=prompt_progressive_summary, verbose=True)
                self.rooms[room_id]["summary"] = await summary_chain.apredict(summary=previous_summary, chat_history=chat_history_text_string)
                # ToDo: maybe add an add_task_done callback and don't access the variable directly from here?
                logger.info(f"New summary is: \"{self.rooms[room_id]['summary']}\"")
                conversation_memory.chat_memory.messages = conversation_memory.chat_memory.messages[-k * 2 :]
                conversation_memory.load_memory_variables({})
                #summary = summarize(conversation_memory.buffer)
                #print(summary)
                #return summary

            logger.info("memory progressive summary scheduled...")
            await self.bot.schedule(self.bot.queue, make_progressive_summary, self.rooms[room_id]["summary"], conversation_memory.buffer) #.add_done_callback(

        #t = datetime.fromtimestamp(message.additional_kwargs['timestamp'])
        #when = humanize.naturaltime(t)
        #print(when)

        # ToDo: either use prompt.format() to fill out the pygmalion prompt and use
        # the resulting template text to feed it into the instruct prompt's instruction,
        # or do this with prompt.partial()
        prompt = prompt_vicuna.partial(
            ai_name=self.bot.name,
            persona=self.bot.persona,
            scenario=self.bot.scenario,
            summary=self.rooms[room_id]["summary"],
            human_name=chat_human_name,
            #example_dialogue=replace_all(self.bot.example_dialogue, {"{{user}}": chat_human_name, "{{char}}": chat_ai_name})
            ai_name_chat=chat_ai_name,
        )

        chain = ConversationChain(
            llm=self.llm_chat,
            prompt=prompt,
            verbose=True,
            memory=readonlymemory,
            #stop=['<|endoftext|>', '\nYou:', f"\n{chat_human_name}:"],
        )

        # output = llm_chain(inputs={"ai_name": self.bot.name, "persona": self.bot.persona, "scenario": self.bot.scenario, "human_name": chat_human_name, "ai_name_chat": self.bot.name, "chat_history": "", "input": message.content})['results'][0]['text']
        #roleplay_chain = RoleplayChain(llm_chain=chain, character_name=self.bot.name, persona=self.bot.persona, scenario=self.bot.scenario, ai_name_chat=chat_ai_name, human_name_chat=chat_human_name)

        stop = ['<|endoftext|>', f"\n{chat_human_name}"]
        #print(f"Message is: \"{message.content}\"")
        await asyncio.sleep(0)
        output = await chain.arun({"input": message.content, "stop": stop})

        output = output.replace("<BOT>", self.bot.name).replace("<USER>", chat_human_name)
        output = output.replace("### Assistant", self.bot.name)
        output = output.replace(f"\n{self.bot.name}: ", " ")
        output = output.strip()

        if "*activates the neural uplink*" in output.casefold():
            pass # call agent

        own_message_resp = await reply_fn(output)

        langchain_ai_message = AIMessage(
            content=output,
            additional_kwargs={
                "timestamp": datetime.now().timestamp(),
                "user_name": self.bot.name,
                "event_id": own_message_resp.event_id,
                "user_id": None,
                "room_name": message.additional_kwargs['room_name'],
                "room_id": own_message_resp.room_id,
            }
        )

        conversation_memory.save_context({"input": message.content}, {"output": output})
        conversation_memory.load_memory_variables({})

        return output

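    # Note on the stop list above: generation is asked to halt at '<|endoftext|>' or at a
    # newline that begins with the human's chat name (presumably honored by the KoboldCpp
    # wrapper), so the model does not continue the dialogue on the user's behalf.
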
    async def summarize(self, text):
        await asyncio.sleep(0)  # yield for matrix-nio
        summary_chain = LLMChain(llm=self.llm_summary, prompt=prompt_summary, verbose=True)
        return await summary_chain.arun(text=text)
        #ToDo: we could summarize the whole dialogue here, leave half of it in the buffer, but skip doing a summary until that is flushed, too?
        #ToDo: max_tokens and stop

    async def diary(self, room_id):
        await asyncio.sleep(0)  # yield for matrix-nio
        diary_chain = LLMChain(llm=self.llm_summary, prompt=prompt_outline, verbose=True)
        conversation_memory = self.get_memory(room_id)
        #self.rooms[message.room_id]["summary"]
        string_messages = []
        for m in conversation_memory.chat_memory_day.messages:
            string_messages.append(f"{m.role}: {m.content}")
        return await diary_chain.apredict(text="\n".join(string_messages))

    async def agent(self):

        os.environ["OPENWEATHERMAP_API_KEY"] = "82452fdb0d1e0e805ac096db87914342"

        # Tools
        search = DuckDuckGoSearchAPIWrapper()
        weather = OpenWeatherMapAPIWrapper()
        search2 = SearxSearchWrapper(searx_host="https://search.mdosch.de")
        python_repl = PythonREPL()

        # Assumption: the original referenced an undefined `summry_chain`; a summary
        # LLMChain over prompt_summary (as in summarize() above) is used here instead.
        summary_chain = LLMChain(llm=self.llm_summary, prompt=prompt_summary)

        tools = [
            Tool(
                name = "Search",
                func=search.run,
                description="useful for when you need to answer questions about current events"
            ),
            Tool(
                name = "Searx Search",
                func=search2.run,  # the original passed search.run (DuckDuckGo) here by mistake
                description="useful for when you need to answer questions about current events"
            ),
            Tool(
                name = "Weather",
                func=weather.run,
                description="Useful for fetching current weather information for a specified location. Input should be a location string (e.g. 'London,GB')."
            ),
            Tool(
                name = "Summary",
                func=summary_chain.run,
                description="useful for when you summarize a conversation. The input to this tool should be a string, representing who will read this summary."
            )
        ]

        # prefix and suffix are expected to come from .prompts (star import above)
        prompt = ZeroShotAgent.create_prompt(
            tools=tools,
            prefix=prefix,
            suffix=suffix,
            input_variables=["input", "chat_history", "agent_scratchpad"]
        )

        output_parser = CustomOutputParser()

        # Assumption: a fresh buffer memory for the agent; the original referenced an
        # undefined `memory`.
        memory = ConversationBufferMemory(memory_key="chat_history")

        # LLM chain consisting of the LLM and the prompt built above
        # (the original passed an undefined `llm` and `prompt_agent` here)
        llm_chain = LLMChain(llm=self.llm_chat, prompt=prompt)

        agent = ZeroShotAgent(llm_chain=llm_chain, tools=tools, verbose=True)
        #agent = initialize_agent(tools, llm, agent=AgentType.CHAT_CONVERSATIONAL_REACT_DESCRIPTION, verbose=True, return_intermediate_steps=True, memory=memory)
        #tool_names = [tool.name for tool in tools]
        #agent = LLMSingleActionAgent(
        #    llm_chain=llm_chain,
        #    output_parser=output_parser,
        #    stop=["\nObservation:"],
        #    allowed_tools=tool_names,
        #    verbose=True,
        #)

        agent_executor = AgentExecutor.from_agent_and_tools(agent=agent, tools=tools, verbose=True, memory=memory)
        await agent_executor.arun(input="How many people live in Canada as of 2023?")

    async def sleep(self):

        # Write the date into the chat history
        for room_id in self.rooms.keys():
            #fake_message = Message(datetime.now().timestamp(), self.bot.name, "", event_id=None, user_id=None, room_name=None, room_id=room_id)
            conversation_memory = self.get_memory(room_id)
            message = SystemMessage(
                content=f"~~~~ {datetime.now().strftime('%A, %B %d, %Y')} ~~~~",
                additional_kwargs={
                    "timestamp": datetime.now().timestamp(),
                    "user_name": self.bot.name,
                    "event_id": None,
                    "user_id": None,
                    "room_name": None,
                    "room_id": room_id,
                }
            )
            conversation_memory.chat_memory.messages.append(message)
            #conversation_memory.chat_memory.add_system_message(message)

        # Summarize the last day and save a diary entry
        yesterday = ( datetime.now() - timedelta(days=1) ).strftime('%Y-%m-%d')
        for room_id in self.rooms.keys():
            conversation_memory = self.get_memory(room_id)  # look up this room's memory (the original reused the variable from the loop above)
            if len(conversation_memory.chat_memory_day.messages) > 0:
                self.bot.rooms[room_id]["diary"][yesterday] = await self.diary(room_id)
                # Calculate new goals for the character
                # Update stats
                # Let background tasks run
                conversation_memory.chat_memory_day.clear()

        await self.bot.write_conf2(self.bot.rooms)

    async def prime_llm(self, text):
        self.llm_chat(text, max_tokens=1)


def replace_all(text, dic):
    for i, j in dic.items():
        text = text.replace(i, j)
    return text
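
# Hypothetical usage of replace_all(), e.g. for character-card placeholders:
#   replace_all("Hi {{user}}, I am {{char}}.", {"{{user}}": "Alice", "{{char}}": "Julia"})
#   -> "Hi Alice, I am Julia."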