* docs: add ai documentation * docker: update docker files for ai/regular versions, lint * feat: add initial /ask command * Delete docker-compose.yml * docker: ignore ollama folder in builds * fix: add emojis to help commands, capitalize, add ai commands to help menu * feat: add better logging, thought handling improvements * bug fixes, better logging and separation of ai, update docs for ai * clean, remove prompt and user info from logs, more docs edits * system prompt change (plaintext only), parse out /think * clean up, axios tweaks * cleanup, logging of ratelimit --------- Co-authored-by: Aidan <aidan@p0ntus.com>
This commit is contained in:
parent
0c364a1814
commit
81294f5721
13 changed files with 733 additions and 35 deletions
287
src/commands/ai.ts
Normal file
287
src/commands/ai.ts
Normal file
|
@ -0,0 +1,287 @@
|
|||
// AI.TS
|
||||
// by ihatenodejs/Aidan
|
||||
//
|
||||
// -----------------------------------------------------------------------
|
||||
//
|
||||
// This is free and unencumbered software released into the public domain.
|
||||
//
|
||||
// Anyone is free to copy, modify, publish, use, compile, sell, or
|
||||
// distribute this software, either in source code form or as a compiled
|
||||
// binary, for any purpose, commercial or non-commercial, and by any
|
||||
// means.
|
||||
//
|
||||
// In jurisdictions that recognize copyright laws, the author or authors
|
||||
// of this software dedicate any and all copyright interest in the
|
||||
// software to the public domain. We make this dedication for the benefit
|
||||
// of the public at large and to the detriment of our heirs and
|
||||
// successors. We intend this dedication to be an overt act of
|
||||
// relinquishment in perpetuity of all present and future rights to this
|
||||
// software under copyright law.
|
||||
//
|
||||
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
||||
// EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
||||
// MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
|
||||
// IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
||||
// OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
||||
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
||||
// OTHER DEALINGS IN THE SOFTWARE.
|
||||
//
|
||||
// For more information, please refer to <https://unlicense.org/>
|
||||
|
||||
import { isOnSpamWatch } from "../spamwatch/spamwatch"
|
||||
import spamwatchMiddlewareModule from "../spamwatch/Middleware"
|
||||
import { Telegraf, Context } from "telegraf"
|
||||
import type { Message } from "telegraf/types"
|
||||
import { replyToMessageId } from "../utils/reply-to-message-id"
|
||||
import { getStrings } from "../plugins/checklang"
|
||||
import { languageCode } from "../utils/language-code"
|
||||
import axios from "axios"
|
||||
import { rateLimiter } from "../utils/rate-limiter"
|
||||
import { logger } from "../utils/log"
|
||||
|
||||
// Middleware placed in front of the AI command handler; produced by handing
// the SpamWatch lookup function to the middleware factory.
const spamwatchMiddleware = spamwatchMiddlewareModule(isOnSpamWatch)

/** Model tag sent to Ollama when the command is `/ask`. */
export const flash_model = "gemma3:4b"

/** Model tag sent to Ollama when the command is `/think`. */
export const thinking_model = "deepseek-r1:1.5b"

/** A Telegraf context whose `message` is known to be a text message. */
type TextContext = Context & {
  message: Message.TextMessage
}
|
||||
|
||||
/**
 * Escapes `text` so it can be placed between the double quotes of a JSON
 * string literal.
 *
 * Backslashes, double quotes and every control character below U+0020 are
 * escaped (`\n`, `\r`, `\t`, `\b`, `\f`, or `\uXXXX`), so wrapping the result
 * in quotes always yields a parseable JSON string.
 *
 * @param text - Raw text to escape.
 * @returns The escaped text, without surrounding quotes.
 */
export function sanitizeForJson(text: string): string {
  // JSON.stringify implements the complete JSON string grammar; drop the
  // opening and closing quote it adds around the escaped content.
  return JSON.stringify(text).slice(1, -1)
}
|
||||
|
||||
/**
 * Confirms that every environment variable required by the AI commands is
 * set to a non-empty value.
 *
 * @returns A promise resolving to `false` (after logging the first missing
 * variable) or `true` (after logging success).
 */
export async function preChecks() {
  const requiredEnvs = ["ollamaApi"]
  const firstMissing = requiredEnvs.find((name) => !process.env[name])

  if (firstMissing !== undefined) {
    console.error(`[✨ AI | !] ❌ ${firstMissing} not set!`)
    return false
  }

  console.log("[✨ AI] Pre-checks passed\n")
  return true
}
|
||||
|
||||
/**
 * Parses one line of a newline-delimited JSON stream.
 *
 * @returns The parsed object, or `undefined` for blank lines, non-object
 * values and lines that are not valid JSON (the latter are logged).
 */
function parseJsonLine(line: string): Record<string, unknown> | undefined {
  if (!line.trim()) return undefined
  try {
    const parsed: unknown = JSON.parse(line)
    return typeof parsed === "object" && parsed !== null
      ? (parsed as Record<string, unknown>)
      : undefined
  } catch (e) {
    console.error("[✨ AI | !] Error parsing chunk:", e)
    return undefined
  }
}

/**
 * Yields each JSON object of a newline-delimited JSON byte stream, buffering
 * partial lines so an object split across two chunks is still parsed.
 */
async function* readJsonLines(
  stream: AsyncIterable<Buffer | string>
): AsyncGenerator<Record<string, unknown>, void, undefined> {
  // Bytes are buffered (not strings) so a multi-byte UTF-8 character cut by a
  // chunk boundary is decoded intact; 0x0a never occurs inside such a sequence.
  let pending: Buffer = Buffer.alloc(0)

  for await (const chunk of stream) {
    pending = Buffer.concat([pending, typeof chunk === "string" ? Buffer.from(chunk) : chunk])

    let newlineAt = pending.indexOf(0x0a)
    while (newlineAt !== -1) {
      const parsed = parseJsonLine(pending.subarray(0, newlineAt).toString("utf8"))
      pending = pending.subarray(newlineAt + 1)
      if (parsed !== undefined) yield parsed
      newlineAt = pending.indexOf(0x0a)
    }
  }

  // The final line may arrive without a trailing newline.
  const last = parseJsonLine(pending.toString("utf8"))
  if (last !== undefined) yield last
}

/**
 * Extracts a human-readable message from an HTTP error body that may be a
 * string, an already-parsed object with an `error` field, or a readable stream.
 *
 * @returns The message, or `undefined` when none can be recovered.
 */
async function readErrorMessage(data: unknown): Promise<string | undefined> {
  if (data == null) return undefined

  let raw: string
  if (typeof data === "string") {
    raw = data
  } else if (typeof (data as AsyncIterable<unknown>)[Symbol.asyncIterator] === "function") {
    // The generate request uses responseType "stream", so a failed request
    // hands the body back as a stream that has to be drained first.
    raw = ""
    try {
      for await (const chunk of data as AsyncIterable<unknown>) raw += String(chunk)
    } catch {
      return undefined
    }
  } else if (typeof data === "object") {
    const message = (data as { error?: unknown }).error
    return typeof message === "string" ? message : undefined
  } else {
    return undefined
  }

  try {
    const parsed: unknown = JSON.parse(raw)
    if (typeof parsed === "object" && parsed !== null) {
      const message = (parsed as { error?: unknown }).error
      if (typeof message === "string") return message
    }
  } catch {
    // Not JSON; fall through and return the raw text.
  }
  return raw.trim() || undefined
}

/**
 * Streams a completion for `prompt` from `${ollamaApi}/api/generate` and
 * periodically edits `replyGenerating` with the text received so far.
 *
 * For `thinking_model`, `<think>`/`</think>` markers are rewritten to
 * `Thinking...` / `Finished thinking` code spans and reported to the logger.
 * If the server answers that the model is missing, the model is pulled via
 * `/api/pull` and the caller is told to retry.
 *
 * @param prompt - Full prompt text sent to the model.
 * @param ctx - Context of the triggering text message.
 * @param replyGenerating - Placeholder message that receives progress edits.
 * @param model - Ollama model tag to generate with.
 * @returns `{ success: true, response }` with the generated text (or a
 * "pulled, please retry" notice), or `{ success: false, error }`.
 */
async function getResponse(prompt: string, ctx: TextContext, replyGenerating: Message, model: string) {
  const Strings = getStrings(languageCode(ctx))

  if (!ctx.chat) {
    return {
      success: false,
      error: Strings.unexpectedErr.replace("{error}", "No chat found"),
    }
  }

  const chatId = ctx.chat.id
  const messageId = replyGenerating.message_id
  const isThinkingModel = model === thinking_model
  // Hoisted so the patterns are not rebuilt for every streamed line.
  const thinkBlock = /<think>([\s\S]*?)<\/think>/
  const thinkBlockAll = /<think>([\s\S]*?)<\/think>/g

  try {
    const aiResponse = await axios.post(
      `${process.env.ollamaApi}/api/generate`,
      {
        model,
        prompt,
        stream: true,
      },
      {
        responseType: "stream",
      }
    )

    let fullResponse = ""
    let lastUpdate = Date.now()

    for await (const ln of readJsonLines(aiResponse.data)) {
      // A line carrying `error` instead of `response` is surfaced to the
      // caller rather than crashing on the missing `response` field.
      if (typeof ln.error === "string") {
        console.error("[✨ AI | !] Error reported in stream:", ln.error)
        return { success: false, error: ln.error }
      }

      const piece = ln.response
      if (typeof piece !== "string" || piece.length === 0) continue

      if (isThinkingModel) {
        if (piece.includes('<think>')) {
          // Log the start of thinking unless the block is complete and empty.
          const thinkMatch = piece.match(thinkBlock)
          if (!thinkMatch || thinkMatch[1].trim().length > 0) {
            logger.logThinking(chatId, messageId, true)
          }
        } else if (piece.includes('</think>')) {
          logger.logThinking(chatId, messageId, false)
        }

        fullResponse += piece
          .replace(thinkBlockAll, (_match: string, inner: string) =>
            inner.trim().length > 0 ? '`Thinking...`' + inner + '`Finished thinking`' : '')
          .replace(/<think>/g, '`Thinking...`')
          .replace(/<\/think>/g, '`Finished thinking`')
      } else {
        fullResponse += piece
      }

      // Throttle progress edits to one per second; never send an empty text.
      const now = Date.now()
      if (fullResponse.length > 0 && now - lastUpdate >= 1000) {
        await rateLimiter.editMessageWithRetry(
          ctx,
          chatId,
          messageId,
          fullResponse,
          { parse_mode: 'Markdown' }
        )
        lastUpdate = now
      }
    }

    return {
      success: true,
      response: fullResponse,
    }
  } catch (error: any) {
    if (!error.response) {
      if (error.request) {
        console.error("[✨ AI | !] No response received:", error.request)
        return { success: false, error: "No response received from server" }
      }
      console.error("[✨ AI | !] Error zone 3:", error.message)
      return { success: false, error: error.message }
    }

    const errStatus = error.response.status
    const errData = await readErrorMessage(error.response.data)
    const modelMissing =
      errStatus === 404 || (errData?.includes(`model '${model}' not found`) ?? false)

    if (!modelMissing) {
      console.error("[✨ AI | !] Error zone 1:", errData)
      return { success: false, error: errData ?? error.message }
    }

    try {
      await ctx.telegram.editMessageText(chatId, messageId, undefined, `🔄 Pulling ${model} from ollama...\n\nThis may take a few minutes...`)
    } catch (e) {
      // The status message is informational only; keep pulling if it fails.
      console.error("[✨ AI | !] Could not update status message:", e)
    }
    console.log(`[✨ AI | i] Pulling ${model} from ollama...`)

    // The timeout belongs in the axios config, not the request body. It is
    // applied only when ollamaApiTimeout is a positive number: a fixed short
    // default would abort pulls that legitimately take minutes.
    const configuredTimeout = Number(process.env.ollamaApiTimeout)
    const pullTimeout =
      Number.isFinite(configuredTimeout) && configuredTimeout > 0 ? configuredTimeout : 0

    try {
      await axios.post(
        `${process.env.ollamaApi}/api/pull`,
        {
          model,
          stream: false,
        },
        {
          timeout: pullTimeout,
        }
      )
    } catch (e: any) {
      if (e.response) {
        console.error("[✨ AI | !] Something went wrong:", e.response.data?.error)
        return {
          success: false,
          error: `❌ Something went wrong while pulling ${model}, please try your command again!`,
        }
      } else if (e.request) {
        console.error("[✨ AI | !] No response received while pulling:", e.request)
        return {
          success: false,
          error: `❌ No response received while pulling ${model}, please try again!`,
        }
      } else {
        console.error("[✨ AI | !] Error while pulling:", e.message)
        return {
          success: false,
          error: `❌ Error while pulling ${model}: ${e.message}`,
        }
      }
    }

    console.log(`[✨ AI | i] ${model} pulled successfully`)
    return {
      success: true,
      response: `✅ Pulled ${model} successfully, please retry the command.`,
    }
  }
}
|
||||
|
||||
/**
 * Registers the `/ask` and `/think` commands on `bot`.
 *
 * `/ask` queries `flash_model` and `/think` queries `thinking_model`. The
 * handler replies with a placeholder message, then replaces it with either
 * the generated answer or a localized error.
 *
 * @param bot - Telegraf instance the commands are attached to.
 */
export default (bot: Telegraf<Context>) => {
  bot.command(["ask", "think"], spamwatchMiddleware, async (ctx) => {
    if (!ctx.message || !('text' in ctx.message)) return
    const isAsk = ctx.message.text.startsWith("/ask")
    const model = isAsk ? flash_model : thinking_model
    const textCtx = ctx as TextContext
    const reply_to_message_id = replyToMessageId(textCtx)
    const Strings = getStrings(languageCode(textCtx))
    const message = textCtx.message.text
    // `"@" + undefined` is the truthy string "@undefined", so the username
    // has to be checked before the "@" is prepended.
    const author = ctx.from?.username
      ? "@" + ctx.from.username
      : ctx.from?.first_name || "unknown"

    logger.logCmdStart(author, isAsk ? "ask" : "think")

    if (!process.env.ollamaApi) {
      await ctx.reply(Strings.aiDisabled, {
        parse_mode: 'Markdown',
        ...({ reply_to_message_id })
      })
      return
    }

    // Strip the leading command (optionally addressed as /ask@botname) and
    // surrounding whitespace, so a bare "/ask" counts as an empty prompt.
    const fixedMsg = message.replace(/^\/(?:ask|think)(?:@\w+)?\s*/i, "").trim()
    if (fixedMsg.length < 1) {
      // Checked before the placeholder is sent so no stale "generating"
      // message is left behind.
      await ctx.reply(Strings.askNoMessage, {
        parse_mode: 'Markdown',
        ...({ reply_to_message_id })
      })
      return
    }

    const replyGenerating = await ctx.reply(Strings.askGenerating.replace("{model}", model), {
      parse_mode: 'Markdown',
      ...({ reply_to_message_id })
    })

    logger.logPrompt(fixedMsg)

    // Read at call time: botInfo may not be populated yet when the command is
    // registered, and last_name is optional, so it must not be required.
    const botInfo = bot.botInfo
    const botName = [botInfo?.first_name, botInfo?.last_name].filter(Boolean).join(" ") || "Kowalski"

    // The prompt is passed as-is: axios JSON-encodes the request body, so
    // escaping it beforehand would hand the model literal "\n" sequences.
    const prompt = `You are a plaintext-only, helpful assistant called ${botName}.
Current Date/Time (UTC): ${new Date().toUTCString()}

---

Respond to the user's message:
${fixedMsg}`

    const aiResponse = await getResponse(prompt, textCtx, replyGenerating, model)
    if (!aiResponse) return

    if (!ctx.chat) return

    const finalText = aiResponse.success && aiResponse.response
      ? aiResponse.response
      : Strings.unexpectedErr.replace("{error}", aiResponse.error ?? "No response generated")

    await rateLimiter.editMessageWithRetry(
      ctx,
      ctx.chat.id,
      replyGenerating.message_id,
      finalText,
      { parse_mode: 'Markdown' }
    )
  })
}
|
Loading…
Add table
Add a link
Reference in a new issue