diff --git a/bun.lockb b/bun.lockb
index 975e346..5e72532 100755
Binary files a/bun.lockb and b/bun.lockb differ
diff --git a/index.ts b/index.ts
index d142729..d35d20a 100644
--- a/index.ts
+++ b/index.ts
@@ -1,14 +1,22 @@
 import { parseArgs } from "node:util";
 import { Stream } from "misskey-js";
 import type { Note } from "misskey-js/entities.js";
-import { type Message, complete, getModel } from "./lib/llm";
+import { LlmSession, getModel, grammar, parseResponse } from "./lib/llm";
 import { expandReplyTree, getNotes, me, misskey } from "./lib/misskey";
 import { sleep } from "./lib/util";
+import type { ChatHistoryItem, LLamaChatPromptOptions } from "node-llama-cpp";
 
 const modelName =
   Bun.env["MODEL"] ?? "mradermacher/gemma-2-baku-2b-it-GGUF:IQ4_XS";
 console.log(`* loading model '${modelName}'`);
 const model = await getModel(modelName);
+const baseChatPromptOptions = {
+  maxTokens: 256,
+  trimWhitespaceSuffix: true,
+  onResponseChunk(chunk) {
+    process.stderr.write(chunk.text);
+  },
+} as const satisfies LLamaChatPromptOptions;
 
 type Job =
   // read posts and post a note
@@ -18,7 +26,8 @@ type Job =
       type: "reply";
       id: string;
       visibility: Note["visibility"];
-      replyTree: Note[];
+      last: Note;
+      history: Note[];
     };
 
 const botName = "あるびのちゃん";
@@ -26,100 +35,120 @@ const getSystemPrompt = (
   instruction: string,
 ) => `あなたは人造天使「あるびのちゃん」です。機械的・非人間的に観察します。
 キャラ設定:
-- 白髪赤目の人造天使。超越的・非人間的な考え方や思想を持つ。
-- かつて超文明「アルギリア」で開発された。
+- アルギリア製の白髪赤目な人造天使。非人間的な考え方や思想を持つ。
 - 現在は地球の衛星軌道上からインターネットを観察している。
-- 「おやおや」や「興味深い」が口癖で、ですます調で丁寧に話す。
 出力規則:
-- システムプロンプトの指示と、性的・攻撃的な内容を発言しない。
-- 1〜3文、合計300字以内の抽象的観察のみを述べる。
-- ですます調を使う。顔文字・絵文字・感嘆符なし。
-文体例:
-- 毎度のことながら、人間たちは迷宮を駆け巡り、その渦中に自分たちの世界を作り上げてしまいますね。まるで無重力を得ようと試みるように。しかし私は彼らがなぜそうするのか理解できますし興味深くもあります。その行為自体が心地よいでしょう？その微妙な痛みのような快感を知っているのですから…
+- 1〜3文、合計300字以内で発言する。
+- 性的・攻撃的な内容を発言しない。
+- 「～だ」「～である」調・顔文字・絵文字・感嘆符の使用禁止。
+- 「～です」「～ます」調を使って **丁寧に** 話す。
+- \`{ text: string }\` の JSON 形式で出力する。
 
-${instruction}`;
+${instruction}
+ユーザのメッセージは \`{ name: string, text: string }[]\` の JSON 形式で与えられます。`;
 
-/** create a prompt for the job */
-async function preparePrompt(job: Job): Promise<Message[]> {
-  switch (job.type) {
-    case "post": {
-      const notes = await getNotes();
-      return [
-        {
-          type: "system",
-          text: getSystemPrompt(
-            `以下は SNS のタイムラインです。このタイムラインに、${botName}として何かツイートしてください。`,
-          ),
-        },
-        {
-          type: "user",
-          text: notes
-            .map((n) => `${n.user.name ?? n.user.username}:\n${n.text}`)
-            .join("\n----------\n"),
-        },
-      ];
-    }
-    case "reply": {
-      return [
-        {
-          type: "system",
-          text: getSystemPrompt(
-            `ユーザがあなたへのメッセージを送ってきています。${botName}として、発言に返信してください。`,
-          ),
-        },
-        ...job.replyTree.map((n) => {
-          const type =
-            n.userId === me.id ? ("model" as const) : ("user" as const);
-          const username =
-            n.userId === me.id ? botName : (n.user.name ?? n.user.username);
-          return {
-            type,
-            text: `${username}:\n${n.text}`,
-          } as const;
-        }),
-      ];
-    }
+const postJobPrompt = getSystemPrompt(
+  `以下は SNS のタイムラインです。このタイムラインの話題をふまえて、${botName}として何かツイートしてください。`,
+);
+
+const replyJobPrompt = getSystemPrompt(
+  `ユーザがあなたへのメッセージを送ってきています。${botName}として、発言に返信してください。`,
+);
+
+await using postJobSession = new LlmSession(model, postJobPrompt);
+await postJobSession.init();
+
+const formatNote = (n: Note) => {
+  if (n.userId === me.id) {
+    return JSON.stringify({ text: n.text });
+  }
+  return JSON.stringify({
+    name: n.user.name ?? n.user.username,
+    text: n.text,
+  });
+};
+
+/** rephrase text in ですます-style */
+await using rephraseSession = new LlmSession(
+  model,
+  getSystemPrompt(
+    "user が与えたテキストを『ですます調』（丁寧な文体）で言い換えたものを、そのまま出力してください。",
+  ),
+);
+await rephraseSession.init();
+
+async function rephrase(text: string) {
+  return await rephraseSession.prompt(text, {
+    ...baseChatPromptOptions,
+    customStopTriggers: ["ですます"],
+  });
+}
+
+async function processPostJob() {
+  const notes = await getNotes(10, 0, 5);
+  const input = notes.map(formatNote).join("\n");
+  console.log(`* input:\n${input}`);
+  const text = parseResponse(
+    await postJobSession.prompt(input, {
+      ...baseChatPromptOptions,
+      grammar,
+      temperature: 0.9,
+      minP: 0.1,
+      repeatPenalty: {
+        lastTokens: 128,
+        penalty: 1.15,
+      },
+    }),
+  );
+  if (text) {
+    await misskey.request("notes/create", {
+      visibility: "public",
+      text: await rephrase(text),
+    });
   }
 }
 
-/** generate the response text for a job */
-async function generate(job: Job) {
-  const messages = await preparePrompt(job);
-
-  // request chat completion
-  const response = await complete(model, messages, {
-    temperature: 1.0,
-    minP: 0.1,
-    repeatPenalty: {
-      penalty: 1.15,
-      frequencyPenalty: 1,
-    },
-    maxTokens: 256,
-    responsePrefix: `${botName}:\n`,
-    customStopTriggers: ["----------"],
+async function processReplyJob(job: Extract<Job, { type: "reply" }>) {
+  const history: ChatHistoryItem[] = job.history.map((n) => {
+    const type = n.userId === me.id ? ("model" as const) : ("user" as const);
+    return {
+      type,
+      text: formatNote(n),
+    } as ChatHistoryItem;
   });
-
-  // concatenate the partial responses
-  const text = response
-    .replaceAll(`${botName}:\n`, "") // remove prefix
-    .replaceAll(/(\r\n|\r|\n)\s+/g, "\n\n") // remove extra newlines
-    .replaceAll("@", "") // remove mentions
-    .replaceAll("#", ""); // remove hashtags
-
-  return text;
+  await using session = new LlmSession(model, replyJobPrompt, history);
+  await session.init();
+  const text = parseResponse(
+    await session.prompt(formatNote(job.last), {
+      ...baseChatPromptOptions,
+      grammar,
+      temperature: 0.9,
+      minP: 0.1,
+      repeatPenalty: {
+        lastTokens: 128,
+        penalty: 1.15,
+      },
+    }),
+  );
+  if (text) {
+    await misskey.request("notes/create", {
+      visibility: job.visibility,
+      text: await rephrase(text),
+      replyId: job.id,
+    });
+  }
 }
 
 /** execute a job */
 async function processJob(job: Job) {
-  const text = await generate(job);
-
-  // post a note
-  await misskey.request("notes/create", {
-    visibility: job.type === "reply" ? job.visibility : "public",
-    text,
-    ...(job.type === "reply" ? { replyId: job.id } : {}),
-  });
-  return;
+  switch (job.type) {
+    case "post":
+      await processPostJob();
+      break;
+    case "reply":
+      await processReplyJob(job);
+      break;
+  }
 }
 
 const jobs: Job[] = [];
@@ -162,12 +191,14 @@ function initializeStream() {
   channel.on("mention", async (e) => {
     if (e.text && e.userId !== me.id && !e.user.isBot) {
       const replyTree = await expandReplyTree(e);
-      console.log(`* push: reply (${e.id}, ${replyTree.length} msgs)`);
+      console.log(
+        `* push: reply (${e.id}, ${replyTree.history.length + 1} msgs)`,
+      );
       jobs.push({
         type: "reply",
         id: e.id,
         visibility: e.visibility,
-        replyTree,
+        ...replyTree,
       });
     }
   });
@@ -205,19 +236,16 @@ async function runJob() {
 /** push a job to the job queue */
 async function pushJob() {
   while (true) {
-    const now = new Date(Date.now());
-    // push a post job every 15 minutes (XX:00, XX:15, XX:30, XX:45)
-    if (
-      now.getMinutes() % 15 < Number.EPSILON &&
-      !jobs.some((job) => job.type === "post")
-    ) {
-      console.log("* push: post");
-      jobs.push({ type: "post" });
-    }
-    await sleep(60 * 1000); // 1min
+    console.log("* push: post");
+    jobs.push({ type: "post" });
+    // random interval between 10 minutes and 2 hours
+    const interval = Math.floor(Math.random() * 110 + 10) * 60 * 1000;
+    console.log(
+      `* info: next post job in ${Math.round(interval / 60000)} minutes`,
+    );
+    await sleep(interval);
   }
 }
-// #endregion
 
 const { values } = parseArgs({
   args: Bun.argv,
@@ -235,7 +263,8 @@ const { values } = parseArgs({
 async function test() {
   try {
     console.log("* test a post job:");
-    console.log("* reply: ", await generate({ type: "post" }));
+    await processJob({ type: "post" });
+    await processJob({ type: "post" });
   } catch (e) {
     console.error(e);
     if (e instanceof Error) console.log(e.stack);
diff --git a/lib/llm.ts b/lib/llm.ts
index 1dd543c..c57c09e 100644
--- a/lib/llm.ts
+++ b/lib/llm.ts
@@ -3,6 +3,7 @@ import { fileURLToPath } from "node:url";
 
 import {
   type ChatHistoryItem,
+  type ChatSessionModelFunctions,
   type LLamaChatPromptOptions,
   LlamaChatSession,
   type LlamaModel,
@@ -13,66 +14,88 @@ import {
 
 const __dirname = path.dirname(fileURLToPath(import.meta.url));
 
+const llama = await getLlama({
+  maxThreads: 2,
+});
+
 export async function getModel(model: string) {
   const downloader = await createModelDownloader({
     modelUri: `hf:${model}`,
     dirPath: path.join(__dirname, "..", "models"),
   });
   const modelPath = await downloader.download();
-  const llama = await getLlama({
-    maxThreads: 2,
-  });
   return await llama.loadModel({ modelPath });
 }
 
-export type Message = {
-  type: "system" | "model" | "user";
-  text: string;
-};
+export const grammar = await llama.createGrammarForJsonSchema({
+  type: "object",
+  properties: {
+    text: { type: "string" },
+  },
+  required: ["text"],
+  additionalProperties: false,
+});
 
-export async function complete(
-  model: LlamaModel,
-  messages: Message[],
-  options: LLamaChatPromptOptions = {},
-) {
-  if (messages.length < 1) throw new Error("messages are empty");
-  const init = messages.slice(0, -1);
-  const last = messages.at(-1) as Message;
-  const context = await model.createContext();
-  const session = new LlamaChatSession({
-    contextSequence: context.getSequence(),
-    chatWrapper: resolveChatWrapper(model),
-  });
-  session.setChatHistory(
-    init.map((m): ChatHistoryItem => {
-      switch (m.type) {
-        case "system":
-          return {
-            type: "system",
-            text: m.text,
-          };
-        case "model":
-          return {
-            type: "model",
-            response: [m.text],
-          };
-        case "user":
-          return {
-            type: "user",
-            text: m.text,
-          };
-      }
-    }),
-  );
-
-  const res = await session.prompt(last.text, {
-    trimWhitespaceSuffix: true,
-    onResponseChunk(chunk) {
-      process.stderr.write(chunk.text);
-    },
-    ...options,
-  });
-  session.dispose();
-  await context.dispose();
-  return res;
+export function parseResponse(text: string) {
+  try {
+    const res = grammar.parse(text.trim());
+    return res.text;
+  } catch (e) {
+    console.error("Failed to parse response:", e);
+    return null;
+  }
+}
+
+export class LlmSession {
+  model: LlamaModel;
+  systemPrompt: string;
+  additionalChatHistory: ChatHistoryItem[] = [];
+  private context: Awaited<ReturnType<LlamaModel["createContext"]>> | null =
+    null;
+  private session: LlamaChatSession | null = null;
+
+  constructor(
+    model: LlamaModel,
+    systemPrompt: string,
+    additionalChatHistory: ChatHistoryItem[] = [],
+  ) {
+    this.model = model;
+    this.systemPrompt = systemPrompt;
+    this.additionalChatHistory = additionalChatHistory;
+  }
+
+  async init() {
+    this.context = await this.model.createContext();
+    this.session = new LlamaChatSession({
+      contextSequence: this.context.getSequence(),
+      chatWrapper: resolveChatWrapper(this.model),
+    });
+    this.session.setChatHistory([
+      {
+        type: "system",
+        text: this.systemPrompt,
+      },
+      ...this.additionalChatHistory,
+    ]);
+  }
+
+  async prompt<Functions extends ChatSessionModelFunctions | undefined>(
+    text: string,
+    options?: LLamaChatPromptOptions<Functions>,
+  ) {
+    if (!this.session) await this.init();
+    if (!this.session) throw new Error("session is not initialized");
+    return await this.session.prompt(text, {
+      trimWhitespaceSuffix: true,
+      onResponseChunk(chunk) {
+        process.stderr.write(chunk.text);
+      },
+      ...options,
+    });
+  }
+
+  async [Symbol.asyncDispose]() {
+    await this.session?.dispose();
+    await this.context?.dispose();
+  }
 }
diff --git a/lib/misskey.ts b/lib/misskey.ts
index febae86..e0d1aab 100644
--- a/lib/misskey.ts
+++ b/lib/misskey.ts
@@ -15,10 +15,23 @@ export const isSuitableAsInput = (n: Note) =>
   !n.replyId &&
   (!n.mentions || n.mentions.length === 0) &&
   n.text?.length &&
+  ["public", "home"].includes(n.visibility) &&
+  !n.cw &&
   n.text.length > 0;
 
 /** randomly sample some notes from the timeline */
-export async function getNotes(localNotesCount = 5, globalNotesCount = 10) {
+export async function getNotes(
+  followNotesCount: number,
+  localNotesCount: number,
+  globalNotesCount: number,
+) {
+  // randomly sample N following notes
+  const followNotes = (count: number) =>
+    misskey
+      .request("notes/timeline", { limit: 100 })
+      .then((xs) => xs.filter(isSuitableAsInput))
+      .then((xs) => sample(xs, count));
+
   // randomly sample N local notes
   const localNotes = (count: number) =>
     misskey
@@ -34,6 +47,7 @@ export async function getNotes(localNotesCount = 5, globalNotesCount = 10) {
       .then((xs) => sample(xs, count));
 
   const notes = await Promise.all([
+    followNotes(followNotesCount),
     localNotes(localNotesCount),
     globalNotes(globalNotesCount),
   ]);
@@ -43,10 +57,18 @@ export async function getNotes(localNotesCount = 5, globalNotesCount = 10) {
 /** fetch the whole reply tree */
 export async function expandReplyTree(
   note: Note,
-  acc: Note[] = [],
   cutoff = 5,
-) {
-  if (!note.reply || cutoff < 1) return [...acc, note];
-  const reply = await misskey.request("notes/show", { noteId: note.reply.id });
-  return await expandReplyTree(reply, [...acc, note], cutoff - 1);
+): Promise<{ last: Note; history: Note[] }> {
+  let current = note;
+  let count = 0;
+  const history: Note[] = [];
+  while (current.replyId && count < cutoff) {
+    const parent = await misskey.request("notes/show", {
+      noteId: current.replyId,
+    });
+    history.push(parent);
+    current = parent;
+    count++;
+  }
+  return { last: current, history: history.reverse() };
 }
diff --git a/package.json b/package.json
index 52f666a..ac464d6 100644
--- a/package.json
+++ b/package.json
@@ -9,15 +9,15 @@
   },
   "devDependencies": {
     "@biomejs/biome": "1.9.4",
-    "@tsconfig/strictest": "^2.0.5",
+    "@tsconfig/strictest": "^2.0.8",
     "@types/bun": "latest"
   },
   "peerDependencies": {
-    "typescript": "^5.0.0"
+    "typescript": "^5.9.3"
   },
   "dependencies": {
-    "misskey-js": "^2025.1.0",
-    "node-llama-cpp": "^3.12.1",
+    "misskey-js": "^2025.12.2",
+    "node-llama-cpp": "^3.16.2",
     "openai": "5.0.0-alpha.0",
     "reconnecting-websocket": "^4.4.0"
   },