added emote reaction support, better emote support in reactions, implemented llm refusal and retry logic, improved some inline documentation
@@ -28,3 +28,14 @@ model User {
   userFqn         String    @unique
   lastRespondedTo DateTime?
 }
+
+model Reaction {
+  id        Int      @id @default(autoincrement())
+  statusId  String   // The Pleroma status ID we reacted to
+  emojiName String   // The emoji we used to react
+  reactedAt DateTime @default(now())
+  createdAt DateTime @default(now())
+
+  @@unique([statusId]) // Prevent multiple reactions to same status
+  @@map("reactions")
+}
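For reference, a minimal sketch of how the new Reaction model is exercised through the generated Prisma client. The client setup and the status ID are assumptions for illustration, not part of this commit:

import { Prisma, PrismaClient } from "@prisma/client";

const prisma = new PrismaClient();

async function demoReaction(): Promise<void> {
  try {
    // First write succeeds; a second create for the same statusId violates
    // @@unique([statusId]) and throws Prisma error P2002.
    await prisma.reaction.create({
      data: { statusId: "AHypotheticalId", emojiName: "kek" },
    });
  } catch (e) {
    if (e instanceof Prisma.PrismaClientKnownRequestError && e.code === "P2002") {
      console.log("already reacted to this status");
    } else {
      throw e;
    }
  }
}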
src/api.ts (177 lines changed)
@@ -1,5 +1,7 @@
 import { envConfig, prisma } from "./main.js";
 import { PleromaEmoji, Notification, ContextResponse } from "../types.js";
+import { selectRandomEmojis } from "./util.js";
+
 
 const getNotifications = async () => {
   const { bearerToken, pleromaInstanceUrl } = envConfig;
@@ -98,9 +100,184 @@ const deleteNotification = async (notification: Notification) => {
   }
 };
 
+
+/**
+ * React to a status with a random emoji
+ */
+const reactToStatus = async (statusId: string, emojiName: string): Promise<boolean> => {
+  const { bearerToken, pleromaInstanceUrl } = envConfig;
+
+  try {
+    const response = await fetch(
+      `${pleromaInstanceUrl}/api/v1/statuses/${statusId}/react/${emojiName}`,
+      {
+        method: "PUT",
+        headers: {
+          Authorization: `Bearer ${bearerToken}`,
+          "Content-Type": "application/json",
+        },
+      }
+    );
+
+    if (!response.ok) {
+      console.error(`Failed to react to status ${statusId}: ${response.status} - ${response.statusText}`);
+      return false;
+    }
+
+    return true;
+  } catch (error: any) {
+    console.error(`Error reacting to status ${statusId}: ${error.message}`);
+    return false;
+  }
+};
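A usage sketch for the new helper (the status ID is made up). One caveat worth flagging: emojiName is interpolated into the URL path verbatim, so a name that is not URL-safe would need escaping; wrapping it in encodeURIComponent, as below, is a suggested precaution, not something this commit does:

const ok = await reactToStatus("AHypotheticalStatusId", encodeURIComponent("kek"));
console.log(ok ? "reaction delivered" : "reaction failed");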
+
+/**
+ * Check if we've already reacted to a status
+ */
+const hasAlreadyReacted = async (statusId: string): Promise<boolean> => {
+  try {
+    const reaction = await prisma.reaction.findFirst({
+      where: { statusId: statusId },
+    });
+    return !!reaction;
+  } catch (error: any) {
+    console.error(`Error checking reaction status: ${error.message}`);
+    return true; // Assume we've reacted to avoid spamming on error
+  }
+};
+
+/**
+ * Record that we've reacted to a status
+ */
+const recordReaction = async (statusId: string, emojiName: string): Promise<void> => {
+  try {
+    await prisma.reaction.create({
+      data: {
+        statusId: statusId,
+        emojiName: emojiName,
+        reactedAt: new Date(),
+      },
+    });
+  } catch (error: any) {
+    console.error(`Error recording reaction: ${error.message}`);
+  }
+};
+
+/**
+ * Decide whether to react to a post (not every post gets a reaction)
+ */
+const shouldReactToPost = (): boolean => {
+  // React to roughly 30% of posts
+  return Math.random() < 0.3;
+};
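If the 30% rate ever needs tuning without a code change, one possible variant (purely a sketch; REACTION_PROBABILITY is a hypothetical variable, not read anywhere in this repo) is to source it from the environment:

// Hypothetical env-driven variant; falls back to the hardcoded 0.3.
const reactionProbability = Number(process.env.REACTION_PROBABILITY ?? "0.3");

const shouldReactToPostConfigurable = (): boolean =>
  Math.random() < reactionProbability;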
+
+/**
+ * Get appropriate reaction emojis based on content sentiment/keywords
+ */
+const getContextualEmoji = (content: string, availableEmojis: string[]): string => {
+  const contentLower = content.toLowerCase();
+
+  // Define emoji categories with keywords
+  const emojiCategories = {
+    positive: ['happy', 'smile', 'joy', 'love', 'heart', 'thumbsup', 'fire', 'based'],
+    negative: ['sad', 'cry', 'angry', 'rage', 'disappointed', 'cringe'],
+    thinking: ['think', 'hmm', 'brain', 'smart', 'curious'],
+    laughing: ['laugh', 'lol', 'kek', 'funny', 'haha', 'rofl'],
+    agreement: ['yes', 'agree', 'nod', 'correct', 'true', 'based'],
+    surprise: ['wow', 'amazing', 'surprised', 'shock', 'omg'],
+  };
+
+  // Keywords that might indicate sentiment
+  const sentimentKeywords = {
+    positive: ['good', 'great', 'awesome', 'nice', 'love', 'happy', 'excellent', 'perfect'],
+    negative: ['bad', 'terrible', 'hate', 'awful', 'horrible', 'worst', 'sucks'],
+    funny: ['lol', 'haha', 'funny', 'hilarious', 'joke', 'meme'],
+    question: ['?', 'what', 'how', 'why', 'when', 'where'],
+    agreement: ['yes', 'exactly', 'true', 'right', 'correct', 'agree'],
+    thinking: ['think', 'consider', 'maybe', 'perhaps', 'hmm', 'interesting'],
+  };
+
+  // Check content sentiment and find matching emojis
+  for (const [sentiment, keywords] of Object.entries(sentimentKeywords)) {
+    if (keywords.some(keyword => contentLower.includes(keyword))) {
+      const categoryEmojis = emojiCategories[sentiment as keyof typeof emojiCategories];
+      if (categoryEmojis) {
+        const matchingEmojis = availableEmojis.filter(emoji =>
+          categoryEmojis.some(cat => emoji.toLowerCase().includes(cat))
+        );
+        if (matchingEmojis.length > 0) {
+          return matchingEmojis[Math.floor(Math.random() * matchingEmojis.length)];
+        }
+      }
+    }
+  }
+
+  // Fallback to random emoji from a curated list of common reactions
+  const commonReactions = availableEmojis.filter(emoji =>
+    ['heart', 'thumbsup', 'fire', 'kek', 'based', 'think', 'smile', 'laugh']
+      .some(common => emoji.toLowerCase().includes(common))
+  );
+
+  if (commonReactions.length > 0) {
+    return commonReactions[Math.floor(Math.random() * commonReactions.length)];
+  }
+
+  // Final fallback to any random emoji
+  return availableEmojis[Math.floor(Math.random() * availableEmojis.length)];
};
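A worked example of the matching order (emoji names invented for illustration). "lol" matches the funny sentiment, but emojiCategories has no funny key, so that call falls through to the curated fallback; "exactly" matches agreement, which does exist, so a pool emoji containing one of its keywords is chosen directly:

// Falls through to the curated fallback; "kek" is the only common-reaction match.
getContextualEmoji("lol that was hilarious", ["kek", "sadcat", "partyparrot"]); // "kek"

// "agreement" exists in emojiCategories; "nodding" contains "nod", so it wins.
getContextualEmoji("exactly right", ["nodding", "firedance"]); // "nodding"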
+
+/**
+ * Main function to handle post reactions
+ */
+const handlePostReaction = async (notification: Notification): Promise<void> => {
+  try {
+    const statusId = notification.status.id;
+
+    // Check if we should react to this post
+    if (!shouldReactToPost()) {
+      return;
+    }
+
+    // Check if we've already reacted
+    if (await hasAlreadyReacted(statusId)) {
+      return;
+    }
+
+    // Get available emojis
+    const emojiList = await getInstanceEmojis();
+    if (!emojiList || emojiList.length === 0) {
+      return;
+    }
+
+    // Select a smaller random pool for reactions (5-10 emojis)
+    const reactionPool = selectRandomEmojis(emojiList, 8);
+
+    // Get contextual emoji based on post content
+    const selectedEmoji = getContextualEmoji(
+      notification.status.pleroma.content["text/plain"],
+      reactionPool
+    );
+
+    // React to the post
+    const success = await reactToStatus(statusId, selectedEmoji);
+
+    if (success) {
+      await recordReaction(statusId, selectedEmoji);
+      console.log(`Reacted to status ${statusId} with :${selectedEmoji}:`);
+    }
+
+  } catch (error: any) {
+    console.error(`Error handling post reaction: ${error.message}`);
+  }
+};
+
+
 export {
   deleteNotification,
   getInstanceEmojis,
   getNotifications,
   getStatusContext,
+  reactToStatus,
+  handlePostReaction,
+  hasAlreadyReacted,
 };
src/main.ts (65 lines changed)
@@ -13,6 +13,7 @@ import {
   deleteNotification,
   getNotifications,
   getStatusContext,
+  handlePostReaction,
 } from "./api.js";
 import { storeUserData, storePromptData } from "./prisma.js";
 import {
@@ -20,7 +21,9 @@ import {
   alreadyRespondedTo,
   recordPendingResponse,
   // trimInputData,
-  selectRandomEmoji,
+  // selectRandomEmoji,
+  selectRandomEmojis,
+  isLLMRefusal,
   shouldContinue,
 } from "./util.js";
 
@@ -59,7 +62,8 @@ const ollamaConfig: OllamaConfigOptions = {
 // https://replicate.com/blog/how-to-prompt-llama
 
 const generateOllamaRequest = async (
-  notification: Notification
+  notification: Notification,
+  retryAttempt: number = 0
 ): Promise<OllamaChatResponse | undefined> => {
   const {
     whitelistOnly,
@@ -68,6 +72,7 @@ const generateOllamaRequest = async (
     ollamaUrl,
     replyWithContext,
   } = envConfig;
+
   try {
     if (shouldContinue(notification)) {
       if (whitelistOnly && !isFromWhitelistedDomain(notification)) {
@@ -79,6 +84,7 @@ const generateOllamaRequest = async (
       }
       await recordPendingResponse(notification);
       await storeUserData(notification);
+
       let conversationHistory: PostAncestorsForModel[] = [];
       if (replyWithContext) {
         const contextPosts = await getStatusContext(notification.status.id);
@@ -93,15 +99,20 @@ const generateOllamaRequest = async (
             plaintext_content: ancestor.pleroma.content["text/plain"],
           };
         });
-        // console.log(conversationHistory);
       }
 
-      // Simplified user message (remove [/INST] as it's not needed for Llama 3)
       const userMessage = `${notification.status.account.fqn} says: ${notification.status.pleroma.content["text/plain"]}`;
 
-      let systemContent = ollamaSystemPrompt;
+      // Get random emojis for this request
+      const emojiList = await getInstanceEmojis();
+      let availableEmojis = "";
+      if (emojiList && emojiList.length > 0) {
+        const randomEmojis = selectRandomEmojis(emojiList, 20);
+        availableEmojis = `\n\nAvailable custom emojis you can use in your response (or use none!) (format as :emoji_name:): ${randomEmojis.join(", ")}`;
+      }
+
+      let systemContent = ollamaSystemPrompt + availableEmojis;
       if (replyWithContext) {
-        // Simplified context instructions (avoid heavy JSON; summarize for clarity)
         systemContent = `${ollamaSystemPrompt}\n\nPrevious conversation context:\n${conversationHistory
           .map(
             (post) =>
@@ -111,10 +122,15 @@ const generateOllamaRequest = async (
           )
           .join(
             "\n"
-          )}\nReply as if you are a party to the conversation. If '@nice-ai' is mentioned, respond directly. Prefix usernames with '@' when addressing them.`;
+          )}\nReply as if you are a party to the conversation. If '@nice-ai' is mentioned, respond directly. Prefix usernames with '@' when addressing them.${availableEmojis}`;
       }
 
-      // Switch to chat request format (messages array auto-handles Llama 3 template)
+      // Use different seeds for retry attempts
+      const currentConfig = {
+        ...ollamaConfig,
+        seed: retryAttempt > 0 ? Math.floor(Math.random() * 1000000) : ollamaConfig.seed,
+      };
+
       const ollamaRequestBody: OllamaChatRequest = {
         model: ollamaModel,
         messages: [
@@ -122,16 +138,21 @@ const generateOllamaRequest = async (
           { role: "user", content: userMessage },
         ],
         stream: false,
-        options: ollamaConfig,
+        options: currentConfig,
       };
 
-      // Change endpoint to /api/chat
       const response = await fetch(`${ollamaUrl}/api/chat`, {
         method: "POST",
         body: JSON.stringify(ollamaRequestBody),
       });
       const ollamaResponse: OllamaChatResponse = await response.json();
+
+      // Check for refusal and retry up to 2 times
+      if (isLLMRefusal(ollamaResponse.message.content) && retryAttempt < 2) {
+        console.log(`LLM refused to answer (attempt ${retryAttempt + 1}), retrying with different seed...`);
+        return generateOllamaRequest(notification, retryAttempt + 1);
+      }
+
       await storePromptData(notification, ollamaResponse);
       return ollamaResponse;
     }
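So a refusal triggers at most two rerolls (retryAttempt 0, then 1, then 2), each retry with a fresh random seed. An iterative sketch of the same control flow, where generateOnce is a hypothetical stand-in for a single POST to `${ollamaUrl}/api/chat`:

import { isLLMRefusal } from "./util.js";

// Hypothetical stand-in for one chat round trip with the given seed.
declare function generateOnce(seed?: number): Promise<string>;

async function generateWithRetries(maxRetries = 2): Promise<string> {
  let reply = await generateOnce(); // first attempt uses the configured seed
  for (let attempt = 1; attempt <= maxRetries && isLLMRefusal(reply); attempt++) {
    reply = await generateOnce(Math.floor(Math.random() * 1000000)); // reroll seed
  }
  return reply; // may still be a refusal once the retry budget is spent
}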
@@ -145,16 +166,11 @@ const postReplyToStatus = async (
   ollamaResponseBody: OllamaChatResponse
 ) => {
   const { pleromaInstanceUrl, bearerToken } = envConfig;
-  const emojiList = await getInstanceEmojis();
-  let randomEmoji;
-  if (emojiList) {
-    randomEmoji = selectRandomEmoji(emojiList);
-  }
   try {
     let mentions: string[];
     const statusBody: NewStatusBody = {
       content_type: "text/markdown",
-      status: `${ollamaResponseBody.message.content} :${randomEmoji}:`,
+      status: ollamaResponseBody.message.content,
       in_reply_to_id: notification.status.id,
     };
     if (
@@ -247,17 +263,28 @@ const beginFetchCycle = async () => {
       await Promise.all(
         notifications.map(async (notification) => {
           try {
+            // Handle reactions first (before generating response)
+            // This way we can react even if response generation fails
+            await handlePostReaction(notification);
+
+            // Then handle the response generation as before
             const ollamaResponse = await generateOllamaRequest(notification);
             if (ollamaResponse) {
-              postReplyToStatus(notification, ollamaResponse);
+              await postReplyToStatus(notification, ollamaResponse);
             }
           } catch (error: any) {
-            throw new Error(error.message);
+            console.error(`Error processing notification ${notification.id}: ${error.message}`);
+            // Still try to delete the notification to avoid getting stuck
+            try {
+              await deleteNotification(notification);
+            } catch (deleteError: any) {
+              console.error(`Failed to delete notification: ${deleteError.message}`);
+            }
           }
         })
       );
     }
-  }, envConfig.fetchInterval); // lower intervals may cause the bot to respond multiple times to the same message, but we try to mitigate this with the deleteNotification function
+  }, envConfig.fetchInterval);
 };
 
 const beginStatusPostInterval = async () => {
src/util.ts (38 lines changed)
@@ -98,9 +98,47 @@ const selectRandomEmoji = (emojiList: string[]) => {
   return emojiList[Math.floor(Math.random() * emojiList.length)];
 };
 
+const selectRandomEmojis = (emojiList: string[], count: number = 20): string[] => {
+  if (emojiList.length <= count) return emojiList;
+
+  const shuffled = [...emojiList].sort(() => 0.5 - Math.random());
+  return shuffled.slice(0, count);
+};
+
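One caveat: sort(() => 0.5 - Math.random()) is a convenient shuffle but not a uniform one, since comparison sorts assume a consistent comparator and the resulting bias varies by engine. If uniformity ever matters here, a Fisher-Yates version would be a drop-in replacement (sketch only, not part of this commit):

const selectRandomEmojisUnbiased = (emojiList: string[], count: number = 20): string[] => {
  if (emojiList.length <= count) return emojiList;

  // Fisher-Yates: every permutation equally likely.
  const shuffled = [...emojiList];
  for (let i = shuffled.length - 1; i > 0; i--) {
    const j = Math.floor(Math.random() * (i + 1));
    [shuffled[i], shuffled[j]] = [shuffled[j], shuffled[i]];
  }
  return shuffled.slice(0, count);
};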
+const isLLMRefusal = (response: string): boolean => {
+  const refusalPatterns = [
+    /i can't|i cannot|unable to|i'm not able to/i,
+    /i don't feel comfortable/i,
+    /i'm not comfortable/i,
+    /i shouldn't|i won't/i,
+    /that's not something i can/i,
+    /i'm not programmed to/i,
+    /i'm an ai (assistant|language model)/i,
+    /as an ai/i,
+    /i apologize, but/i,
+    /i must decline/i,
+    /that would be inappropriate/i,
+    /i'm not supposed to/i,
+    /i'd rather not/i,
+    /i prefer not to/i,
+    /against my guidelines/i,
+    /violates my programming/i,
+  ];
+
+  const normalizedResponse = response.toLowerCase().trim();
+
+  // Check if response is too short (likely a refusal)
+  if (normalizedResponse.length < 20) return true;
+
+  // Check for refusal patterns
+  return refusalPatterns.some(pattern => pattern.test(normalizedResponse));
+};
+
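Behavior at a glance; note that the length heuristic means any reply under 20 characters counts as a refusal, including legitimate short answers:

console.log(isLLMRefusal("I'm sorry, but as an AI language model I can't do that.")); // true (pattern match)
console.log(isLLMRefusal("ok"));                                         // true (under 20 chars)
console.log(isLLMRefusal("The capital of France is Paris, of course.")); // false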
 export {
   alreadyRespondedTo,
   selectRandomEmoji,
+  selectRandomEmojis,
+  isLLMRefusal,
   trimInputData,
   recordPendingResponse,
   isFromWhitelistedDomain,
types.d.ts (vendored, 174 lines changed)
@@ -158,48 +158,182 @@ interface PleromaEmojiMetadata {
   tags: string[];
 }
+
+interface ReactionRequest {
+  name: string; // emoji name without colons
+}
+
+interface ReactionResponse {
+  name: string;
+  count: number;
+  me: boolean;
+  url?: string;
+  static_url?: string;
+}
 
 /**
  * Experimental settings, I wouldn't recommend messing with these if you don't know how they work (I don't either)
  */
 export interface OllamaConfigOptions {
   /**
-   * Number of tokens guaranteed to be kept in memory during response generation. Higher values leave less
-   * possible room for num_ctx
+   * Number of tokens guaranteed to be kept in memory during response generation.
+   * Higher values leave less room for num_ctx. Used to preserve important context.
+   * Default: 0, Range: 0-512
    */
   num_keep?: number;
-  seed?: number;
+
   /**
-   * Sets maximum of tokens in the response
+   * Random seed for reproducible outputs. Same seed + same inputs = same output.
+   * Default: -1 (random), Range: any integer
+   */
+  seed?: number;
+
+  /**
+   * Maximum number of tokens to generate in the response. Controls response length.
+   * Default: 128, Range: 1-4096+ (model dependent)
    */
   num_predict?: number;
-  top_k?: number;
-  top_p?: number;
-  min_p?: number;
-  typical_p?: number;
-  repeat_last_n?: number;
+
   /**
-   * How close of a response should the response be to the original prompt - lower = more focused response
+   * Limits token selection to top K most probable tokens. Reduces randomness.
+   * Default: 40, Range: 1-100 (higher = more diverse)
+   */
+  top_k?: number;
+
+  /**
+   * Nucleus sampling - cumulative probability cutoff for token selection.
+   * Default: 0.9, Range: 0.0-1.0 (lower = more focused)
+   */
+  top_p?: number;
+
+  /**
+   * Alternative to top_p - minimum probability threshold for tokens.
+   * Default: 0.0, Range: 0.0-1.0 (higher = more selective)
+   */
+  min_p?: number;
+
+  /**
+   * Typical sampling - targets tokens with "typical" probability mass.
+   * Default: 1.0 (disabled), Range: 0.0-1.0 (lower = less random)
+   */
+  typical_p?: number;
+
+  /**
+   * Number of previous tokens to consider for repetition penalty.
+   * Default: 64, Range: 0-512
+   */
+  repeat_last_n?: number;
+
+  /**
+   * Randomness/creativity control. Lower = more deterministic, higher = more creative.
+   * Default: 0.8, Range: 0.0-2.0 (sweet spot: 0.1-1.2)
    */
   temperature?: number;
-  repeat_penalty?: number;
-  presence_penalty?: number;
-  frequency_penalty?: number;
-  mirostat?: number;
-  mirostat_tau?: number;
-  mirostat_eta?: number;
-  penalize_newline?: boolean;
-  stop?: string[];
-  numa?: boolean;
+
   /**
-   * Number of tokens for the prompt to keep in memory for the response, minus the value of num_keep
+   * Penalty for repeating tokens. Higher values reduce repetition.
+   * Default: 1.1, Range: 0.0-2.0 (1.0 = no penalty)
+   */
+  repeat_penalty?: number;
+
+  /**
+   * Penalty for using tokens that have already appeared (OpenAI-style).
+   * Default: 0.0, Range: -2.0 to 2.0
+   */
+  presence_penalty?: number;
+
+  /**
+   * Penalty proportional to token frequency in text (OpenAI-style).
+   * Default: 0.0, Range: -2.0 to 2.0
+   */
+  frequency_penalty?: number;
+
+  /**
+   * Enables Mirostat sampling algorithm (0=disabled, 1=v1, 2=v2).
+   * Default: 0, Range: 0, 1, or 2
+   */
+  mirostat?: number;
+
+  /**
+   * Target entropy for Mirostat. Controls coherence vs creativity balance.
+   * Default: 5.0, Range: 0.0-10.0
+   */
+  mirostat_tau?: number;
+
+  /**
+   * Learning rate for Mirostat. How quickly it adapts.
+   * Default: 0.1, Range: 0.001-1.0
+   */
+  mirostat_eta?: number;
+
+  /**
+   * Apply penalty to newline tokens to control formatting.
+   * Default: true
+   */
+  penalize_newline?: boolean;
+
+  /**
+   * Array of strings that will stop generation when encountered.
+   * Default: [], Example: ["\n", "User:", "###"]
+   */
+  stop?: string[];
+
+  /**
+   * Enable NUMA (Non-Uniform Memory Access) optimization.
+   * Default: false (Linux systems may benefit from true)
+   */
+  numa?: boolean;
+
+  /**
+   * Context window size - total tokens for prompt + response.
+   * Default: 2048, Range: 512-32768+ (model dependent, affects memory usage)
    */
   num_ctx?: number;
+
+  /**
+   * Batch size for prompt processing. Higher = faster but more memory.
+   * Default: 512, Range: 1-2048
+   */
   num_batch?: number;
+
+  /**
+   * Number of GPU layers to offload. -1 = auto, 0 = CPU only.
+   * Default: -1, Range: -1 to model layer count
+   */
   num_gpu?: number;
+
+  /**
+   * Primary GPU device ID for multi-GPU setups.
+   * Default: 0, Range: 0 to (GPU count - 1)
+   */
   main_gpu?: number;
+
+  /**
+   * Optimize for low VRAM usage at cost of speed.
+   * Default: false
+   */
   low_vram?: boolean;
+
+  /**
+   * Only load vocabulary, skip weights. For tokenization only.
+   * Default: false
+   */
   vocab_only?: boolean;
+
+  /**
+   * Use memory mapping for model files (faster loading).
+   * Default: true
+   */
   use_mmap?: boolean;
+
+  /**
+   * Lock model in memory to prevent swapping.
+   * Default: false (enable for consistent performance)
+   */
   use_mlock?: boolean;
+
+  /**
+   * Number of CPU threads for inference.
+   * Default: auto-detected, Range: 1 to CPU core count
+   */
   num_thread?: number;
 }
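As a usage sketch, a config assembled from the documented options. Values are illustrative only, and the import path mirrors how src/main.ts references these types, which is an assumption here:

import { OllamaConfigOptions } from "../types.js"; // path assumed, as in src/main.ts

const exampleConfig: OllamaConfigOptions = {
  temperature: 0.8,    // default creativity
  top_k: 40,           // trim the candidate token pool
  top_p: 0.9,          // nucleus sampling cutoff
  repeat_penalty: 1.1, // mild anti-repetition
  num_ctx: 4096,       // prompt + response token budget
  num_predict: 256,    // cap response length
  stop: ["User:"],     // halt if the model starts a fake turn
};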