import os import discord from llama_cpp import Llama from dotenv import load_dotenv class MyClient(discord.Client): async def on_ready(self): print('Logged on as', self.user) async def on_message(self, message): # don't respond to ourselves if message.author == self.user: return if f"""<@{client.user.id}>""" in message.content: question = f"""Text transcript of a never ending dialog, where ${USER_NAME} interacts with Karl Marx. Karl is helpful, kind, honest, friendly, good at writing and never fails to answer ${USER_NAME}’s requests immediately and with details and precision. There are no annotations like (30 seconds passed...) or (to himself), just what ${USER_NAME} and Karl say aloud to each other. The dialog lasts for years, the entirety of it is shared below. It's 10000 pages long. User: What is Communism? Karl: Communism is the doctrine of the conditions of the liberation of the proletariat. User: {message.content}""" await message.channel.send(llm(question, max_tokens=256, stop=["User:"], echo=True)["choices"][0]["text"][len(question):]) load_dotenv() llm = Llama(model_path="./models/7B/ggml-model-q4_0.bin") intents = discord.Intents.default() intents.message_content = True client = MyClient(intents=intents) client.run(os.environ.get("DISCORD_TOKEN"))