From 0a600d8f46468ada3775926dc71470555bee4cb0 Mon Sep 17 00:00:00 2001
From: Eric Huang <ijbhxhu@gmail.com>
Date: Sat, 20 Jun 2026 16:50:01 +0800
Subject: [PATCH 1/2] feat: add opt-in LINE group context buffering

---
 docs/line.md                  |  15 +-
 gateway/src/adapters/line.rs  | 475 +++++++++++++++++++++++++++++++++-
 gateway/src/adapters/teams.rs |   2 +
 gateway/src/main.rs           |  91 ++++++-
 4 files changed, 572 insertions(+), 11 deletions(-)

diff --git a/docs/line.md b/docs/line.md
index c5890f2a6..5f6b1003f 100644
--- a/docs/line.md
+++ b/docs/line.md
@@ -83,7 +83,7 @@ In the LINE Developers Console → **Messaging API** tab → scan the QR code wi
 
 - **1:1 chat** — send a message to the bot, get an AI agent response
 - **Inbound voice messages in 1:1 chat** — LINE-hosted audio messages are downloaded through the LINE Content API and forwarded to OpenAB as `audio` attachments, so the existing STT flow can transcribe them. This requires `[stt] enabled = true` in OpenAB core. See [STT (Speech-to-Text)](stt.md).
-- **Group chat** — add the bot to a group; it responds only when @-mentioned (see @mention gating below)
+- **Group chat** — add the bot to a group; it responds when directly @-mentioned. Deployments can opt in to folding recent unmentioned text into the next direct-mention turn as short-term context (see @mention gating below)
 - **Inbound images** — user-sent LINE images are downloaded through the LINE Content API and forwarded to OpenAB as image attachments
 - **Webhook signature validation** — HMAC-SHA256 via `LINE_CHANNEL_SECRET`
 
@@ -96,11 +96,12 @@ In the LINE Developers Console → **Messaging API** tab → scan the QR code wi
 
 - **Threads** — LINE has no thread/topic concept. All messages in a chat share one agent session.
 - **Reactions** — LINE Bot API does not support message reactions.
-- **@mention gating** — Supported (zero-config). In group/room chats the gateway only forwards messages where the bot is explicitly @-mentioned (LINE's native `mentionees[].isSelf` signal). 1:1 DMs are always forwarded. No env var is needed.
-  - *Limitation — non-text messages*: LINE only attaches mention data to text messages. Images, videos, stickers, files, and location messages in groups are silently dropped because they cannot carry an @-mention.
-  - *Limitation — group voice messages*: LINE voice/audio messages in groups and rooms are also dropped today because audio messages do not carry mention metadata. This PR only enables inbound voice STT for 1:1 chats.
+- **@mention gating** — Supported (zero-config). In group/room chats the gateway only dispatches a visible bot reply when the bot is explicitly @-mentioned (LINE's native `mentionees[].isSelf` signal). 1:1 DMs are always forwarded. No env var is needed.
+  - *Optional short-term text buffering*: when `LINE_GROUP_CONTEXT_ENABLED=true`, unmentioned **text** messages in groups/rooms are buffered locally in gateway memory for up to `LINE_GROUP_CONTEXT_TTL_HOURS` hours (default 24) and injected into the next directly @-mentioned text turn for the same chat. The buffer is capped per chat by message count (`LINE_GROUP_CONTEXT_MAX_MESSAGES`) and total characters (`LINE_GROUP_CONTEXT_MAX_CHARS`); when a cap is exceeded, the oldest buffered messages are discarded first. This improves conversational continuity without making the bot reply to every group message.
+  - *Limitation — non-text messages*: LINE only attaches mention data to text messages. Images, videos, stickers, files, and location messages in groups are therefore still dropped: they cannot carry an @-mention, and they are never added to the short-term text buffer.
+  - *Limitation — group voice messages*: LINE voice/audio messages in groups and rooms are also dropped today because audio messages do not carry mention metadata. LINE inbound voice STT is currently for 1:1 chats.
   - *Limitation — `@All`*: A group-wide `@All` mention does **not** trigger the bot; only a direct `@BotName` mention does.
-  - *Breaking change*: This gating is always active. Deployments that previously relied on the bot responding to all group messages will need to @-mention the bot after upgrading.
+  - *Behavior note*: the short-term context buffer is local, bounded, temporary, and drained after injection. It is not a long-term chat archive or GBrain memory store.
 - **Markdown rendering** — LINE uses its own text formatting. Agent replies are sent as plain text.
 - **External-content images** — LINE image messages backed by `contentProvider.type = "external"` are not downloaded yet.
 - **External-content audio** — LINE audio messages backed by `contentProvider.type = "external"` are not downloaded yet.
@@ -111,6 +112,10 @@ In the LINE Developers Console → **Messaging API** tab → scan the QR code wi
 |---|---|---|
 | `LINE_CHANNEL_SECRET` | Yes | Channel secret for webhook signature validation |
 | `LINE_CHANNEL_ACCESS_TOKEN` | Yes | Channel access token for Reply/Push Message API and LINE-hosted image/audio downloads |
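+| `LINE_GROUP_CONTEXT_ENABLED` | No | Set to `true` (case-insensitive) or `1` to opt in to buffering unmentioned group/room text for the next direct mention; any other value leaves it off. Default: `false` |
+| `LINE_GROUP_CONTEXT_TTL_HOURS` | No | Hours to keep unmentioned group/room text eligible for the next direct mention. Must be a positive integer; invalid or zero values fall back to the default. Default: `24` |
+| `LINE_GROUP_CONTEXT_MAX_MESSAGES` | No | Maximum buffered unmentioned text messages per group/room. Must be a positive integer; invalid or zero values fall back to the default. Default: `100` |
+| `LINE_GROUP_CONTEXT_MAX_CHARS` | No | Maximum total buffered characters per group/room; each message counts its text plus its sender ID and a two-character separator. Must be a positive integer; invalid or zero values fall back to the default. Default: `8000` |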
 
 ## Troubleshooting
 
diff --git a/gateway/src/adapters/line.rs b/gateway/src/adapters/line.rs
index c0981f6c5..e5c4d594e 100644
--- a/gateway/src/adapters/line.rs
+++ b/gateway/src/adapters/line.rs
@@ -5,6 +5,7 @@ use crate::schema::*;
 use crate::store;
 use axum::extract::State;
 use serde::Deserialize;
+use std::collections::VecDeque;
 use std::sync::Arc;
 use tracing::{error, info, warn};
 
@@ -160,6 +161,8 @@ async fn process_line_webhook_events(
             &state.client,
             state.line_access_token.as_deref(),
             LINE_DATA_API_BASE,
+            &state.line_group_context_buffer,
+            &state.line_group_context_config,
         )
         .await
         else {
@@ -206,6 +209,8 @@ async fn build_gateway_event_from_line_event(
     client: &reqwest::Client,
     line_access_token: Option<&str>,
     data_api_base: &str,
+    line_group_context_buffer: &crate::LineGroupContextBuffer,
+    line_group_context_config: &crate::LineGroupContextConfig,
 ) -> Option<GatewayEvent> {
     if event.event_type != "message" {
         return None;
@@ -315,7 +320,7 @@ async fn build_gateway_event_from_line_event(
         }
     }
 
-    let event_text = text;
+    let mut event_text = text.to_string();
 
     if event_text.trim().is_empty() && attachments.is_empty() {
         return None;
@@ -369,7 +374,35 @@ async fn build_gateway_event_from_line_event(
     // LINE sets isSelf=true on the mentionee that is the bot itself — no env var needed.
     // 1:1 DMs always pass through.
     let is_group = channel_type == "group" || channel_type == "room";
-    if is_group && !mentionees.iter().any(|m| m.is_self) {
+    let bot_mentioned = mentionees.iter().any(|m| m.is_self);
+    if is_group && msg.message_type == "text" && line_group_context_config.enabled {
+        if !bot_mentioned {
+            buffer_line_group_context(
+                line_group_context_buffer,
+                line_group_context_config,
+                &channel_id,
+                user_id,
+                &event_text,
+            );
+            info!(
+                channel = %channel_id,
+                "line group text buffered (bot not mentioned)"
+            );
+            return None;
+        }
+        if let Some(buffered) = take_line_group_context(
+            line_group_context_buffer,
+            line_group_context_config,
+            &channel_id,
+        ) {
+            info!(
+                channel = %channel_id,
+                buffered_messages = buffered.len(),
+                "line group context injected into direct mention"
+            );
+            event_text = inject_buffered_group_context(&buffered, &event_text);
+        }
+    } else if is_group && !bot_mentioned {
         info!(
             channel = %channel_id,
             "line group message dropped (@mention gating: bot not mentioned)"
@@ -390,7 +423,7 @@ async fn build_gateway_event_from_line_event(
             display_name: user_id.into(),
             is_bot: false,
         },
-        event_text,
+        &event_text,
         &msg.id,
         mention_ids,
     );
@@ -398,6 +431,80 @@ async fn build_gateway_event_from_line_event(
     Some(gateway_event)
 }
 
+/// Buffers one unmentioned group/room text for `channel_id`, pruning expired entries first.
+fn buffer_line_group_context(
+    buffer: &crate::LineGroupContextBuffer,
+    config: &crate::LineGroupContextConfig,
+    channel_id: &str, // key of the per-chat queue inside `buffer`
+    sender_id: &str, // stored with the text and charged against the character budget
+    text: &str, // raw message text; trimmed and truncated before it is stored
+) {
+    // The budget charges sender id + text + 2 per entry, so reserve that overhead before
+    // truncating; otherwise one long message could exceed `max_chars` all by itself.
+    let text_budget = config.max_chars.saturating_sub(sender_id.chars().count() + 2);
+    let bounded_text: String = text.trim().chars().take(text_budget).collect();
+    if bounded_text.is_empty() {
+        return; // blank text, or a cap too small to hold any text for this sender
+    }
+
+    let mut guard = buffer.lock().unwrap_or_else(|e| e.into_inner()); // tolerate poisoning
+    let now = std::time::Instant::now();
+    let entry = guard.entry(channel_id.to_string()).or_default();
+    entry.retain(|m| now.duration_since(m.buffered_at).as_secs() < config.ttl_secs);
+    let sender_id = sender_id.to_string();
+    entry.push_back(crate::LineBufferedText { sender_id, text: bounded_text, buffered_at: now });
+    enforce_line_group_context_limits(entry, config);
+}
+
+fn enforce_line_group_context_limits(
+    entry: &mut VecDeque<crate::LineBufferedText>,
+    config: &crate::LineGroupContextConfig,
+) {
+    // Message cap first, then the character cap; eviction is always oldest-first.
+    let surplus = entry.len().saturating_sub(config.max_messages);
+    drop(entry.drain(..surplus));
+    while entry.len() > 1 && line_group_context_char_count(entry) > config.max_chars {
+        entry.pop_front(); // the `len() > 1` guard keeps the last remaining entry
+    }
+}
+
+fn line_group_context_char_count(entry: &VecDeque<crate::LineBufferedText>) -> usize {
+    // Each entry is charged its sender id length + its text length + 2 (in `char`s).
+    entry.iter().fold(0, |total, m| {
+        total + m.sender_id.chars().count() + m.text.chars().count() + 2
+    })
+}
+
+fn take_line_group_context(
+    buffer: &crate::LineGroupContextBuffer,
+    config: &crate::LineGroupContextConfig,
+    channel_id: &str,
+) -> Option<VecDeque<crate::LineBufferedText>> {
+    // Removing the map entry drains the chat, so buffered text is handed out at most once.
+    let taken = buffer
+        .lock()
+        .unwrap_or_else(|poisoned| poisoned.into_inner())
+        .remove(channel_id);
+    let now = std::time::Instant::now();
+    let mut fresh = taken?;
+    fresh.retain(|m| now.duration_since(m.buffered_at).as_secs() < config.ttl_secs);
+    (!fresh.is_empty()).then_some(fresh)
+}
+
+fn inject_buffered_group_context(
+    buffered: &VecDeque<crate::LineBufferedText>,
+    current_text: &str,
+) -> String {
+    // Layout: context header, one `sender: text` line per entry, current header, message.
+    let mut prompt = String::from("[Recent group context before this direct mention]\n");
+    for item in buffered {
+        prompt.push_str(&format!("{}: {}\n", item.sender_id, item.text));
+    }
+    prompt.push_str("[Current directly mentioned message]\n");
+    prompt.push_str(current_text);
+    prompt
+}
+
 pub async fn download_line_image(
     client: &reqwest::Client,
     access_token: &str,
@@ -739,6 +846,17 @@ mod tests {
     use wiremock::matchers::{header, method, path};
     use wiremock::{Mock, MockServer, ResponseTemplate};
 
+    fn test_line_group_context_config() -> crate::LineGroupContextConfig {
+        crate::LineGroupContextConfig::default() // defaults leave context buffering disabled
+    }
+
+    fn enabled_line_group_context_config() -> crate::LineGroupContextConfig {
+        crate::LineGroupContextConfig {
+            enabled: true, // opt in to buffering; every other knob keeps its default
+            ..crate::LineGroupContextConfig::default()
+        }
+    }
+
     #[tokio::test]
     async fn download_line_image_resizes_and_returns_attachment() {
         let server = MockServer::start().await;
@@ -814,6 +932,8 @@ mod tests {
             &reqwest::Client::new(),
             Some("line_token"),
             &server.uri(),
+            &Arc::new(std::sync::Mutex::new(HashMap::new())),
+            &test_line_group_context_config(),
         )
         .await
         .expect("image event should produce a gateway event");
@@ -1032,6 +1152,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
+            &Arc::new(std::sync::Mutex::new(HashMap::new())),
+            &test_line_group_context_config(),
         )
         .await;
 
@@ -1068,6 +1190,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
+            &Arc::new(std::sync::Mutex::new(HashMap::new())),
+            &test_line_group_context_config(),
         )
         .await;
 
@@ -1102,6 +1226,8 @@ mod tests {
             &reqwest::Client::new(),
             None, // no access token
             LINE_DATA_API_BASE,
+            &Arc::new(std::sync::Mutex::new(HashMap::new())),
+            &test_line_group_context_config(),
         )
         .await;
 
@@ -1161,6 +1287,8 @@ mod tests {
             event_tx,
             reply_token_cache: Arc::new(std::sync::Mutex::new(HashMap::new())),
             line_webhook_semaphore: Arc::new(Semaphore::new(crate::LINE_WEBHOOK_CONCURRENCY_MAX)),
+            line_group_context_buffer: Arc::new(std::sync::Mutex::new(HashMap::new())),
+            line_group_context_config: test_line_group_context_config(),
             client: reqwest::Client::new(),
         });
 
@@ -1228,6 +1356,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
+            &Arc::new(std::sync::Mutex::new(HashMap::new())),
+            &test_line_group_context_config(),
         )
         .await;
         assert!(result.is_some());
@@ -1236,20 +1366,52 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn group_message_dropped_when_bot_not_mentioned() {
+    async fn group_message_drops_without_buffer_when_context_disabled() {
+        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+        let event = make_group_text_event("hey everyone", false); // presumably `false` = no bot mention
+        let result = build_gateway_event_from_line_event(
+            &event,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &test_line_group_context_config(), // default config: buffering disabled
+        )
+        .await;
+        assert!(result.is_none()); // no gateway event is produced for this message
+        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
+        assert!(
+            guard.get("C001").is_none(), // nothing may be captured while the feature is off
+            "context disabled should preserve original drop behavior"
+        );
+    }
+
+    #[tokio::test]
+    async fn group_message_buffers_when_bot_not_mentioned_and_context_enabled() {
+        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new())); // kept to inspect afterwards
         let event = make_group_text_event("hey everyone", false);
         let result = build_gateway_event_from_line_event(
             &event,
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(), // buffering switched on
         )
         .await;
         assert!(result.is_none());
+        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
+        assert_eq!(
+            guard
+                .get("C001") // the queue is expected under chat id "C001"
+                .and_then(|entry| entry.front())
+                .map(|m| m.text.as_str()),
+            Some("hey everyone") // the text itself must have been captured
+        );
     }
 
     #[tokio::test]
-    async fn group_message_dropped_when_no_mention_at_all() {
+    async fn group_message_buffers_when_no_mention_at_all() {
         let event: LineEvent = serde_json::from_value(serde_json::json!({
             "type": "message",
             "source": {"type": "group", "groupId": "C001", "userId": "U_sender"},
@@ -1261,6 +1423,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
+            &Arc::new(std::sync::Mutex::new(HashMap::new())),
+            &enabled_line_group_context_config(),
         )
         .await;
         assert!(result.is_none());
@@ -1279,8 +1443,309 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
+            &Arc::new(std::sync::Mutex::new(HashMap::new())),
+            &test_line_group_context_config(),
         )
         .await;
         assert!(result.is_some());
     }
+
+    #[tokio::test]
+    async fn group_message_buffers_then_injects_context_on_later_mention() {
+        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new())); // shared by both calls
+
+        let first = make_group_text_event("今天下午兩點開會", false); // step 1: text without a bot mention
+        let first_result = build_gateway_event_from_line_event(
+            &first,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await;
+        assert!(
+            first_result.is_none(),
+            "unmentioned message should only be buffered"
+        );
+
+        let second = make_group_text_event("@Bot 幫我總結一下", true); // step 2: direct mention
+        let second_result = build_gateway_event_from_line_event(
+            &second,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await
+        .expect("mentioned message should produce an event");
+
+        assert!(second_result // context header is present
+            .content
+            .text
+            .contains("[Recent group context before this direct mention]"));
+        assert!(second_result // buffered line is rendered as `sender: text`
+            .content
+            .text
+            .contains("U_sender: 今天下午兩點開會"));
+        assert!(second_result // current-message header is present
+            .content
+            .text
+            .contains("[Current directly mentioned message]"));
+        assert!(second_result.content.text.contains("@Bot 幫我總結一下")); // original text kept
+        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
+        assert!(
+            guard.get("C001").is_none(), // the chat's queue is removed once injected
+            "buffer should drain after injection"
+        );
+    }
+
+    #[tokio::test]
+    async fn direct_mention_without_buffer_keeps_original_text() {
+        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new())); // empty: nothing buffered
+
+        let event = make_group_text_event("@Bot 現在狀況如何", true);
+        let result = build_gateway_event_from_line_event(
+            &event,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await
+        .expect("mentioned message should produce an event");
+
+        assert_eq!(result.content.text, "@Bot 現在狀況如何"); // no headers added without context
+    }
+
+    #[tokio::test]
+    async fn multiple_buffered_messages_preserve_order_on_injection() {
+        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+
+        let first: LineEvent = serde_json::from_value(serde_json::json!({
+            "type": "message",
+            "source": {"type": "group", "groupId": "C001", "userId": "U_alice"},
+            "message": {"id": "msg001", "type": "text", "text": "第一句前文"}
+        }))
+        .unwrap();
+        let second: LineEvent = serde_json::from_value(serde_json::json!({
+            "type": "message",
+            "source": {"type": "group", "groupId": "C001", "userId": "U_bob"},
+            "message": {"id": "msg002", "type": "text", "text": "第二句前文"}
+        }))
+        .unwrap();
+
+        assert!(build_gateway_event_from_line_event( // first unmentioned text: buffered only
+            &first,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await
+        .is_none());
+        assert!(build_gateway_event_from_line_event( // second unmentioned text, other sender
+            &second,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await
+        .is_none());
+
+        let mention = make_group_text_event("@Bot 幫我整理一下", true);
+        let result = build_gateway_event_from_line_event(
+            &mention,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await
+        .expect("mentioned message should produce an event");
+
+        let first_idx = result // byte offsets of each marker in the injected text
+            .content
+            .text
+            .find("U_alice: 第一句前文")
+            .expect("first buffered line present");
+        let second_idx = result
+            .content
+            .text
+            .find("U_bob: 第二句前文")
+            .expect("second buffered line present");
+        let current_idx = result
+            .content
+            .text
+            .find("[Current directly mentioned message]")
+            .expect("current message header present");
+
+        assert!(
+            first_idx < second_idx,
+            "buffered lines should preserve arrival order"
+        );
+        assert!(
+            second_idx < current_idx,
+            "buffered context should appear before current message"
+        );
+    }
+
+    #[test]
+    fn group_context_buffer_keeps_latest_messages_within_bounds() {
+        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+        let config = test_line_group_context_config(); // only the limits matter to the helper
+
+        for i in 0..(config.max_messages + 5) { // overfill the queue by five messages
+            buffer_line_group_context(
+                &buffer,
+                &config,
+                "C001",
+                "U_sender",
+                &format!("message {i}"),
+            );
+        }
+
+        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
+        let entry = guard.get("C001").expect("buffer should exist");
+
+        assert_eq!(entry.len(), config.max_messages);
+        assert_eq!(entry.front().unwrap().text, "message 5"); // messages 0..=4 were evicted
+        assert_eq!(
+            entry.back().unwrap().text,
+            format!("message {}", config.max_messages + 4) // the newest message is retained
+        );
+        assert!(
+            line_group_context_char_count(entry) <= config.max_chars,
+            "buffer should stay within character budget"
+        );
+    }
+
+    #[test]
+    fn group_context_buffer_enforces_total_character_budget() {
+        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+        let config = test_line_group_context_config();
+        let large = "x".repeat(config.max_chars / 2); // two such messages overflow the budget
+
+        buffer_line_group_context(
+            &buffer,
+            &config,
+            "C001",
+            "U_sender",
+            &format!("old {large}"),
+        );
+        buffer_line_group_context(
+            &buffer,
+            &config,
+            "C001",
+            "U_sender",
+            &format!("middle {large}"),
+        );
+        buffer_line_group_context(
+            &buffer,
+            &config,
+            "C001",
+            "U_sender",
+            &format!("latest {large}"),
+        );
+
+        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
+        let entry = guard.get("C001").expect("buffer should exist");
+
+        assert!(
+            line_group_context_char_count(entry) <= config.max_chars,
+            "buffer should stay within character budget"
+        );
+        assert!(
+            entry.back().unwrap().text.starts_with("latest "), // trimming removes from the front
+            "latest context should be retained when trimming old messages"
+        );
+    }
+
+    #[tokio::test]
+    async fn buffer_is_chat_local_and_not_reused_after_drain() {
+        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new())); // shared by all four calls
+
+        let buffered: LineEvent = serde_json::from_value(serde_json::json!({
+            "type": "message",
+            "source": {"type": "group", "groupId": "C001", "userId": "U_sender"},
+            "message": {"id": "msg001", "type": "text", "text": "只屬於 C001 的前文"}
+        }))
+        .unwrap();
+
+        assert!(build_gateway_event_from_line_event( // step 1: buffer a text in chat C001
+            &buffered,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await
+        .is_none());
+
+        let other_chat: LineEvent = serde_json::from_value(serde_json::json!({
+            "type": "message",
+            "source": {"type": "group", "groupId": "C002", "userId": "U_sender"},
+            "message": {
+                "id": "msg010",
+                "type": "text",
+                "text": "@Bot 另一個群組的 mention",
+                "mention": {"mentionees": [{"userId": "Ubot123", "type": "user", "isSelf": true}]}
+            }
+        }))
+        .unwrap();
+
+        let other_result = build_gateway_event_from_line_event( // step 2: mention in chat C002
+            &other_chat,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await
+        .expect("other chat mention should produce an event");
+        assert!(
+            !other_result.content.text.contains("只屬於 C001 的前文"),
+            "buffered context must not leak across chats"
+        );
+
+        let same_chat = make_group_text_event("@Bot C001 的 mention", true); // step 3: mention in C001
+        let same_result = build_gateway_event_from_line_event(
+            &same_chat,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await
+        .expect("same chat mention should produce an event");
+        assert!(same_result // C001's buffered line is injected here
+            .content
+            .text
+            .contains("U_sender: 只屬於 C001 的前文"));
+
+        let second_same_chat = make_group_text_event("@Bot 再問一次", true); // step 4: mention again
+        let drained_result = build_gateway_event_from_line_event(
+            &second_same_chat,
+            &reqwest::Client::new(),
+            None,
+            LINE_DATA_API_BASE,
+            &buffer,
+            &enabled_line_group_context_config(),
+        )
+        .await
+        .expect("second same-chat mention should produce an event");
+        assert!(
+            !drained_result.content.text.contains("只屬於 C001 的前文"),
+            "buffer should be one-shot and drain after injection"
+        );
+    }
 }
diff --git a/gateway/src/adapters/teams.rs b/gateway/src/adapters/teams.rs
index 09ac09df8..6043a460a 100644
--- a/gateway/src/adapters/teams.rs
+++ b/gateway/src/adapters/teams.rs
@@ -666,6 +666,8 @@ mod tests {
             event_tx,
             reply_token_cache: Arc::new(std::sync::Mutex::new(std::collections::HashMap::new())),
             line_webhook_semaphore: Arc::new(tokio::sync::Semaphore::new(crate::LINE_WEBHOOK_CONCURRENCY_MAX)),
+            line_group_context_buffer: Arc::new(std::sync::Mutex::new(std::collections::HashMap::new())),
+            line_group_context_config: crate::LineGroupContextConfig::default(),
             client: reqwest::Client::new(),
         })
     }
diff --git a/gateway/src/main.rs b/gateway/src/main.rs
index c5dfec24f..76a8927e8 100644
--- a/gateway/src/main.rs
+++ b/gateway/src/main.rs
@@ -12,7 +12,7 @@ use axum::{
 };
 use futures_util::{SinkExt, StreamExt};
 use schema::GatewayReply;
-use std::collections::HashMap;
+use std::collections::{HashMap, VecDeque};
 use std::sync::Arc;
 use std::time::Instant;
 use tokio::sync::{broadcast, Mutex, Semaphore};
@@ -38,6 +38,86 @@ pub const REPLY_TOKEN_CACHE_MAX: usize = 10_000;
 /// fast 200 OK response path.
 pub const LINE_WEBHOOK_CONCURRENCY_MAX: usize = 8;
 
+pub const LINE_GROUP_CONTEXT_DEFAULT_TTL_HOURS: u64 = 24; // hours; stored as seconds in the config
+pub const LINE_GROUP_CONTEXT_DEFAULT_MAX_MESSAGES: usize = 100; // buffered messages per group/room
+pub const LINE_GROUP_CONTEXT_DEFAULT_MAX_CHARS: usize = 8_000; // buffered characters per group/room
+
+#[derive(Clone, Debug)]
+pub struct LineGroupContextConfig { // tuning knobs for LINE group/room context buffering
+    /// Enables opt-in capture of unmentioned LINE group/room text (off by default).
+    pub enabled: bool,
+    /// Seconds that unmentioned LINE group text stays eligible for later prompt injection.
+    pub ttl_secs: u64,
+    /// Maximum buffered unmentioned LINE text messages per group/room (oldest dropped first).
+    pub max_messages: usize,
+    /// Maximum total buffered characters per LINE group/room (sender ids count toward it).
+    pub max_chars: usize,
+}
+
+impl Default for LineGroupContextConfig {
+    fn default() -> Self {
+        Self {
+            enabled: false, // buffering is opt-in
+            ttl_secs: LINE_GROUP_CONTEXT_DEFAULT_TTL_HOURS * 60 * 60, // hours -> seconds
+            max_messages: LINE_GROUP_CONTEXT_DEFAULT_MAX_MESSAGES,
+            max_chars: LINE_GROUP_CONTEXT_DEFAULT_MAX_CHARS,
+        }
+    }
+}
+
+impl LineGroupContextConfig {
+    fn from_env() -> Self {
+        // Start from the defaults; each knob is then overridden by its env var when valid.
+        let Self { enabled, max_messages, max_chars, .. } = Self::default();
+        let ttl_hours = read_positive_env_u64(
+            "LINE_GROUP_CONTEXT_TTL_HOURS",
+            LINE_GROUP_CONTEXT_DEFAULT_TTL_HOURS,
+        );
+        let max_messages =
+            read_positive_env_usize("LINE_GROUP_CONTEXT_MAX_MESSAGES", max_messages);
+        Self {
+            enabled: read_bool_env("LINE_GROUP_CONTEXT_ENABLED", enabled),
+            ttl_secs: ttl_hours.saturating_mul(60 * 60), // hours -> seconds, saturating
+            max_messages,
+            max_chars: read_positive_env_usize("LINE_GROUP_CONTEXT_MAX_CHARS", max_chars),
+        }
+    }
+}
+
+fn read_bool_env(name: &str, default: bool) -> bool {
+    std::env::var(name) // unset or non-Unicode -> `default`; unrecognised values -> false
+        .map(|v| v.trim() == "1" || v.trim().eq_ignore_ascii_case("true")) // tolerate padding
+        .unwrap_or(default)
+}
+
+fn read_positive_env_u64(name: &str, default: u64) -> u64 {
+    std::env::var(name) // unset, unparsable, or zero -> `default`
+        .ok()
+        .and_then(|v| v.trim().parse::<u64>().ok()) // tolerate surrounding whitespace
+        .filter(|v| *v > 0)
+        .unwrap_or(default)
+}
+
+fn read_positive_env_usize(name: &str, default: usize) -> usize {
+    std::env::var(name) // unset, unparsable, or zero -> `default`
+        .ok()
+        .and_then(|v| v.trim().parse::<usize>().ok()) // tolerate surrounding whitespace
+        .filter(|v| *v > 0)
+        .unwrap_or(default)
+}
+
+#[derive(Clone, Debug)]
+pub struct LineBufferedText { // one buffered, unmentioned LINE group/room text message
+    pub sender_id: String, // sender identifier supplied by the adapter when buffering
+    pub text: String, // message text as stored by the adapter (trimmed and length-capped)
+    pub buffered_at: Instant, // capture time; entries older than the TTL are pruned
+}
+
+/// Short-lived LINE group/room context captured from unmentioned text messages.
+/// Keyed by groupId/roomId; a chat's queue is removed when a later direct mention arrives.
+pub type LineGroupContextBuffer =
+    Arc<std::sync::Mutex<HashMap<String, VecDeque<LineBufferedText>>>>;
+
 // --- App state (shared across all adapters) ---
 
 pub struct AppState {
@@ -72,6 +152,10 @@ pub struct AppState {
     /// Limits concurrent post-ack LINE webhook processing so image bursts do not
     /// turn into unbounded download/decode work.
     pub line_webhook_semaphore: Arc<Semaphore>,
+    /// Short-lived unmentioned LINE group text, used to enrich the next direct-mention turn.
+    pub line_group_context_buffer: LineGroupContextBuffer,
+    /// Tuning knobs for LINE group context capture.
+    pub line_group_context_config: LineGroupContextConfig,
     /// Shared HTTP client for media downloads and API calls
     pub client: reqwest::Client,
 }
@@ -236,6 +320,9 @@ async fn main() -> Result<()> {
 
     let (event_tx, _) = broadcast::channel::<String>(256);
     let reply_token_cache: ReplyTokenCache = Arc::new(std::sync::Mutex::new(HashMap::new()));
+    let line_group_context_buffer: LineGroupContextBuffer =
+        Arc::new(std::sync::Mutex::new(HashMap::new()));
+    let line_group_context_config = LineGroupContextConfig::from_env();
 
     let mut app = Router::new()
         .route("/ws", get(ws_handler))
@@ -410,6 +497,8 @@ async fn main() -> Result<()> {
         event_tx,
         reply_token_cache,
         line_webhook_semaphore: Arc::new(Semaphore::new(LINE_WEBHOOK_CONCURRENCY_MAX)),
+        line_group_context_buffer,
+        line_group_context_config,
         client,
     });
 

From 51af031dae5c72a2c3bd5b0534df547cc3a16272 Mon Sep 17 00:00:00 2001
From: Eric Huang <ijbhxhu@gmail.com>
Date: Sun, 21 Jun 2026 00:25:49 +0800
Subject: [PATCH 2/2] feat: add gateway context provider abstraction

---
 docs/gateway-context.md          |  44 ++++
 docs/line.md                     |  17 +-
 gateway/Cargo.lock               |  13 ++
 gateway/Cargo.toml               |   1 +
 gateway/src/adapters/line.rs     | 377 ++++++++++++-------------------
 gateway/src/adapters/teams.rs    |   4 +-
 gateway/src/context/api_fetch.rs |  20 ++
 gateway/src/context/buffered.rs  | 243 ++++++++++++++++++++
 gateway/src/context/config.rs    |  98 ++++++++
 gateway/src/context/mod.rs       | 116 ++++++++++
 gateway/src/main.rs              | 119 +++-------
 11 files changed, 719 insertions(+), 333 deletions(-)
 create mode 100644 docs/gateway-context.md
 create mode 100644 gateway/src/context/api_fetch.rs
 create mode 100644 gateway/src/context/buffered.rs
 create mode 100644 gateway/src/context/config.rs
 create mode 100644 gateway/src/context/mod.rs

diff --git a/docs/gateway-context.md b/docs/gateway-context.md
new file mode 100644
index 000000000..62aab57b5
--- /dev/null
+++ b/docs/gateway-context.md
@@ -0,0 +1,44 @@
+# Gateway Context Providers
+
+OpenAB gateway adapters can optionally enrich an admitted user turn with recent chat context that the bot would otherwise miss because of mention gating or platform-specific admission rules.
+
+The gateway-level `ContextProvider` abstraction keeps this behavior shared across platforms:
+
+- `observe()` records a message that was seen by an adapter but not dispatched to the agent.
+- `fetch_context()` returns recent context for an admitted turn.
+- `inject_context()` prepends that context with a clear boundary before the current message.
+
+## Provider Types
+
+| Provider | Intended platforms | Data source |
+|---|---|---|
+| `BufferedContextProvider` | LINE, Telegram, WeChat/WeCom, Feishu fallback | webhook observe -> local bounded buffer |
+| `ApiFetchContextProvider` | Discord, Slack, Teams, Google Chat where available | platform history API |
+| Hybrid provider | Google Chat and other mixed-permission platforms | API fetch when possible, buffer fallback otherwise |
+
+The first implementation wires LINE group/room text to `BufferedContextProvider`. Future adapters can reuse the same trait without changing the prompt injection format.
+
+## Defaults
+
+Context capture is disabled by default.
+
+| Setting | Default |
+|---|---|
+| `enabled` | `false` |
+| `ttl` | `24h` |
+| `max_messages` | `50` |
+| `max_chars` | `8000` |
+
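+Gateway-wide environment variables use the `GATEWAY_CONTEXT_*` prefix (`GATEWAY_CONTEXT_ENABLED`, `GATEWAY_CONTEXT_TTL_HOURS`, `GATEWAY_CONTEXT_MAX_MESSAGES`, `GATEWAY_CONTEXT_MAX_CHARS`). Platform-specific settings take precedence when set; for example, LINE reads `LINE_GROUP_CONTEXT_*` first and falls back to the gateway-wide value.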
+
+## Scope And Storage
+
+Buffered context is:
+
+- scoped by platform, channel, optional thread, and bot id
+- in-memory only
+- drained when it is fetched for injection into an admitted turn, so each buffered message is injected at most once
+- bounded by TTL, message count, and total characters
+- not long-term memory, retrieval storage, or GBrain state
+
+This is intentionally short-term conversational continuity. Platforms with reliable history APIs can later implement API-backed or hybrid providers instead of relying only on local buffers.
diff --git a/docs/line.md b/docs/line.md
index 5f6b1003f..796724c45 100644
--- a/docs/line.md
+++ b/docs/line.md
@@ -83,7 +83,7 @@ In the LINE Developers Console → **Messaging API** tab → scan the QR code wi
 
 - **1:1 chat** — send a message to the bot, get an AI agent response
 - **Inbound voice messages in 1:1 chat** — LINE-hosted audio messages are downloaded through the LINE Content API and forwarded to OpenAB as `audio` attachments, so the existing STT flow can transcribe them. This requires `[stt] enabled = true` in OpenAB core. See [STT (Speech-to-Text)](stt.md).
-- **Group chat** — add the bot to a group; it responds when directly @-mentioned. Deployments can opt in to folding recent unmentioned text into the next direct-mention turn as short-term context (see @mention gating below)
+- **Group chat** — add the bot to a group; it responds when directly @-mentioned. Deployments can opt in to folding recent unmentioned text into the next direct-mention turn through the gateway ContextProvider buffer (see @mention gating below)
 - **Inbound images** — user-sent LINE images are downloaded through the LINE Content API and forwarded to OpenAB as image attachments
 - **Webhook signature validation** — HMAC-SHA256 via `LINE_CHANNEL_SECRET`
 
@@ -97,11 +97,11 @@ In the LINE Developers Console → **Messaging API** tab → scan the QR code wi
 - **Threads** — LINE has no thread/topic concept. All messages in a chat share one agent session.
 - **Reactions** — LINE Bot API does not support message reactions.
 - **@mention gating** — Supported (zero-config). In group/room chats the gateway only dispatches a visible bot reply when the bot is explicitly @-mentioned (LINE's native `mentionees[].isSelf` signal). 1:1 DMs are always forwarded. No env var is needed.
-  - *Optional short-term text buffering*: when `LINE_GROUP_CONTEXT_ENABLED=true`, unmentioned **text** messages in groups/rooms are buffered locally in the gateway for up to 24 hours and injected into the next directly @-mentioned text turn for the same chat. The buffer is capped per chat by message count and total characters. This improves conversational continuity without making the bot reply to every group message.
+  - *Optional short-term text buffering*: when `LINE_GROUP_CONTEXT_ENABLED=true`, unmentioned **text** messages in groups/rooms are observed by the gateway ContextProvider and buffered locally for up to 24 hours by default (configurable via `LINE_GROUP_CONTEXT_TTL_HOURS`). The next directly @-mentioned text turn for the same chat drains that buffer and prepends it as short-term context. The buffer is capped per chat by message count and total characters. This improves conversational continuity without making the bot reply to every group message.
   - *Limitation — non-text messages*: LINE only attaches mention data to text messages. Images, videos, stickers, files, and location messages in groups are still dropped when not directly @-mentioned because they do not enter the short-term text buffer.
   - *Limitation — group voice messages*: LINE voice/audio messages in groups and rooms are also dropped today because audio messages do not carry mention metadata. LINE inbound voice STT is currently for 1:1 chats.
   - *Limitation — `@All`*: A group-wide `@All` mention does **not** trigger the bot; only a direct `@BotName` mention does.
-  - *Behavior note*: the short-term context buffer is local, bounded, temporary, and drained after injection. It is not a long-term chat archive or GBrain memory store.
+  - *Behavior note*: the short-term context buffer is local, bounded, temporary, scoped by platform/chat/thread/bot, and drained after injection. It is not a long-term chat archive or GBrain memory store.
 - **Markdown rendering** — LINE uses its own text formatting. Agent replies are sent as plain text.
 - **External-content images** — LINE image messages backed by `contentProvider.type = "external"` are not downloaded yet.
 - **External-content audio** — LINE audio messages backed by `contentProvider.type = "external"` are not downloaded yet.
@@ -112,10 +112,13 @@ In the LINE Developers Console → **Messaging API** tab → scan the QR code wi
 |---|---|---|
 | `LINE_CHANNEL_SECRET` | Yes | Channel secret for webhook signature validation |
 | `LINE_CHANNEL_ACCESS_TOKEN` | Yes | Channel access token for Reply/Push Message API and LINE-hosted image/audio downloads |
-| `LINE_GROUP_CONTEXT_ENABLED` | No | Opt in to buffering unmentioned group/room text for the next direct mention. Default: `false` |
-| `LINE_GROUP_CONTEXT_TTL_HOURS` | No | Hours to keep unmentioned group/room text eligible for the next direct mention. Default: `24` |
-| `LINE_GROUP_CONTEXT_MAX_MESSAGES` | No | Maximum buffered unmentioned text messages per group/room. Default: `100` |
-| `LINE_GROUP_CONTEXT_MAX_CHARS` | No | Maximum total buffered text characters per group/room. Default: `8000` |
+| `LINE_GROUP_CONTEXT_ENABLED` | No | Opt in to buffering unmentioned group/room text for the next direct mention. Falls back to `GATEWAY_CONTEXT_ENABLED`. Default: `false` |
+| `LINE_GROUP_CONTEXT_TTL_HOURS` | No | Hours to keep unmentioned group/room text eligible for the next direct mention. Falls back to `GATEWAY_CONTEXT_TTL_HOURS`. Default: `24` |
+| `LINE_GROUP_CONTEXT_MAX_MESSAGES` | No | Maximum buffered unmentioned text messages per group/room. Falls back to `GATEWAY_CONTEXT_MAX_MESSAGES`. Default: `50` |
+| `LINE_GROUP_CONTEXT_MAX_CHARS` | No | Maximum total buffered text characters per group/room. Falls back to `GATEWAY_CONTEXT_MAX_CHARS`. Default: `8000` |
+| `LINE_CONTEXT_BOT_ID` | No | Stable bot identity used for ContextProvider isolation when multiple bots share a LINE group. Falls back to `LINE_BOT_ID`, then `line-default-bot` |
+
+See [Gateway Context Providers](./gateway-context.md) for the shared context buffering model and future API-fetch/hybrid provider direction.
 
 ## Troubleshooting
 
diff --git a/gateway/Cargo.lock b/gateway/Cargo.lock
index c1567f997..f84917a97 100644
--- a/gateway/Cargo.lock
+++ b/gateway/Cargo.lock
@@ -53,6 +53,17 @@ dependencies = [
  "serde_json",
 ]
 
+[[package]]
+name = "async-trait"
+version = "0.1.89"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9035ad2d096bed7955a320ee7e2230574d28fd3c3a0f186cbea1ff3c7eed5dbb"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn",
+]
+
 [[package]]
 name = "atomic-waker"
 version = "1.1.2"
@@ -1116,6 +1127,7 @@ version = "0.5.4"
 dependencies = [
  "aes",
  "anyhow",
+ "async-trait",
  "axum",
  "base64",
  "cbc",
@@ -1124,6 +1136,7 @@ dependencies = [
  "hmac",
  "image",
  "jsonwebtoken",
+ "parking_lot",
  "prost",
  "quick-xml",
  "reqwest",
diff --git a/gateway/Cargo.toml b/gateway/Cargo.toml
index e40160f8a..a9b1ce817 100644
--- a/gateway/Cargo.toml
+++ b/gateway/Cargo.toml
@@ -14,6 +14,7 @@ reqwest = { version = "0.12", default-features = false, features = ["rustls-tls"
 tracing = "0.1"
 tracing-subscriber = { version = "0.3", features = ["env-filter"] }
 anyhow = "1"
+async-trait = "0.1"
 uuid = { version = "1", features = ["v4"] }
 chrono = { version = "0.4", features = ["serde"] }
 hmac = "0.12"
diff --git a/gateway/src/adapters/line.rs b/gateway/src/adapters/line.rs
index e5c4d594e..c4432c871 100644
--- a/gateway/src/adapters/line.rs
+++ b/gateway/src/adapters/line.rs
@@ -1,3 +1,4 @@
+use crate::context::{inject_context, ContextFetchRequest, ContextObserveRequest, ContextScope};
 use crate::media::{
     audio_extension, format_bytes, resize_and_compress, AUDIO_MAX_DOWNLOAD, IMAGE_MAX_DOWNLOAD,
 };
@@ -5,7 +6,6 @@ use crate::schema::*;
 use crate::store;
 use axum::extract::State;
 use serde::Deserialize;
-use std::collections::VecDeque;
 use std::sync::Arc;
 use tracing::{error, info, warn};
 
@@ -155,14 +155,21 @@ async fn process_line_webhook_events(
     // - Guardrail: a shared semaphore bounds how many LINE payloads can enter the
     //   post-ack path concurrently. When saturated, new webhooks wait for capacity
     //   before spawning background work so bursts do not create unbounded backlog.
+    let line_context_provider = state.context_providers.get("line").cloned();
+    let line_context_bot_id = state
+        .context_bot_ids
+        .get("line")
+        .cloned()
+        .unwrap_or_else(|| "line-default-bot".into());
+
     for event in webhook_body.events {
         let Some(gateway_event) = build_gateway_event_from_line_event(
             &event,
             &state.client,
             state.line_access_token.as_deref(),
             LINE_DATA_API_BASE,
-            &state.line_group_context_buffer,
-            &state.line_group_context_config,
+            line_context_provider.clone(),
+            &line_context_bot_id,
         )
         .await
         else {
@@ -209,8 +216,8 @@ async fn build_gateway_event_from_line_event(
     client: &reqwest::Client,
     line_access_token: Option<&str>,
     data_api_base: &str,
-    line_group_context_buffer: &crate::LineGroupContextBuffer,
-    line_group_context_config: &crate::LineGroupContextConfig,
+    line_context_provider: Option<Arc<dyn crate::context::ContextProvider>>,
+    line_context_bot_id: &str,
 ) -> Option<GatewayEvent> {
     if event.event_type != "message" {
         return None;
@@ -375,32 +382,43 @@ async fn build_gateway_event_from_line_event(
     // 1:1 DMs always pass through.
     let is_group = channel_type == "group" || channel_type == "room";
     let bot_mentioned = mentionees.iter().any(|m| m.is_self);
-    if is_group && msg.message_type == "text" && line_group_context_config.enabled {
+    if is_group
+        && msg.message_type == "text"
+        && line_context_provider
+            .as_ref()
+            .is_some_and(|p| p.is_enabled())
+    {
+        let scope = ContextScope::new("line", &channel_id, None, line_context_bot_id);
         if !bot_mentioned {
-            buffer_line_group_context(
-                line_group_context_buffer,
-                line_group_context_config,
-                &channel_id,
-                user_id,
-                &event_text,
-            );
+            let observed = line_context_provider
+                .as_ref()
+                .expect("checked provider above")
+                .observe(ContextObserveRequest {
+                    scope,
+                    sender_id: user_id.to_string(),
+                    sender_label: user_id.to_string(),
+                    text: event_text.clone(),
+                })
+                .await;
             info!(
                 channel = %channel_id,
+                observed,
                 "line group text buffered (bot not mentioned)"
             );
             return None;
         }
-        if let Some(buffered) = take_line_group_context(
-            line_group_context_buffer,
-            line_group_context_config,
-            &channel_id,
-        ) {
+        if let Some(context) = line_context_provider
+            .as_ref()
+            .expect("checked provider above")
+            .fetch_context(ContextFetchRequest { scope, limit: None })
+            .await
+        {
             info!(
                 channel = %channel_id,
-                buffered_messages = buffered.len(),
+                buffered_messages = context.len(),
                 "line group context injected into direct mention"
             );
-            event_text = inject_buffered_group_context(&buffered, &event_text);
+            event_text = inject_context(&context, &event_text);
         }
     } else if is_group && !bot_mentioned {
         info!(
@@ -431,80 +449,6 @@ async fn build_gateway_event_from_line_event(
     Some(gateway_event)
 }
 
-fn buffer_line_group_context(
-    buffer: &crate::LineGroupContextBuffer,
-    config: &crate::LineGroupContextConfig,
-    channel_id: &str,
-    sender_id: &str,
-    text: &str,
-) {
-    let trimmed = text.trim();
-    if trimmed.is_empty() {
-        return;
-    }
-
-    let mut guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
-    let now = std::time::Instant::now();
-    let entry = guard.entry(channel_id.to_string()).or_default();
-    entry.retain(|m| now.duration_since(m.buffered_at).as_secs() < config.ttl_secs);
-    let bounded_text: String = trimmed.chars().take(config.max_chars).collect();
-    entry.push_back(crate::LineBufferedText {
-        sender_id: sender_id.to_string(),
-        text: bounded_text,
-        buffered_at: now,
-    });
-    enforce_line_group_context_limits(entry, config);
-}
-
-fn enforce_line_group_context_limits(
-    entry: &mut VecDeque<crate::LineBufferedText>,
-    config: &crate::LineGroupContextConfig,
-) {
-    while entry.len() > config.max_messages {
-        entry.pop_front();
-    }
-    while entry.len() > 1 && line_group_context_char_count(entry) > config.max_chars {
-        entry.pop_front();
-    }
-}
-
-fn line_group_context_char_count(entry: &VecDeque<crate::LineBufferedText>) -> usize {
-    entry
-        .iter()
-        .map(|m| m.sender_id.chars().count() + m.text.chars().count() + 2)
-        .sum()
-}
-
-fn take_line_group_context(
-    buffer: &crate::LineGroupContextBuffer,
-    config: &crate::LineGroupContextConfig,
-    channel_id: &str,
-) -> Option<VecDeque<crate::LineBufferedText>> {
-    let mut guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
-    let now = std::time::Instant::now();
-    let mut entry = guard.remove(channel_id)?;
-    entry.retain(|m| now.duration_since(m.buffered_at).as_secs() < config.ttl_secs);
-    if entry.is_empty() {
-        None
-    } else {
-        Some(entry)
-    }
-}
-
-fn inject_buffered_group_context(
-    buffered: &VecDeque<crate::LineBufferedText>,
-    current_text: &str,
-) -> String {
-    let mut lines = Vec::with_capacity(buffered.len() + 3);
-    lines.push("[Recent group context before this direct mention]".to_string());
-    for entry in buffered {
-        lines.push(format!("{}: {}", entry.sender_id, entry.text));
-    }
-    lines.push("[Current directly mentioned message]".to_string());
-    lines.push(current_text.to_string());
-    lines.join("\n")
-}
-
 pub async fn download_line_image(
     client: &reqwest::Client,
     access_token: &str,
@@ -846,17 +790,55 @@ mod tests {
     use wiremock::matchers::{header, method, path};
     use wiremock::{Mock, MockServer, ResponseTemplate};
 
-    fn test_line_group_context_config() -> crate::LineGroupContextConfig {
-        crate::LineGroupContextConfig::default()
+    const TEST_LINE_CONTEXT_BOT_ID: &str = "line-default-bot";
+
+    fn test_line_context_config() -> crate::context::ContextConfig {
+        crate::context::ContextConfig::default()
     }
 
-    fn enabled_line_group_context_config() -> crate::LineGroupContextConfig {
-        crate::LineGroupContextConfig {
+    fn enabled_line_context_config() -> crate::context::ContextConfig {
+        crate::context::ContextConfig {
             enabled: true,
-            ..crate::LineGroupContextConfig::default()
+            ..crate::context::ContextConfig::default()
         }
     }
 
+    fn disabled_line_context_provider() -> Arc<crate::context::BufferedContextProvider> {
+        Arc::new(crate::context::BufferedContextProvider::new(
+            test_line_context_config(),
+        ))
+    }
+
+    fn enabled_line_context_provider() -> Arc<crate::context::BufferedContextProvider> {
+        Arc::new(crate::context::BufferedContextProvider::new(
+            enabled_line_context_config(),
+        ))
+    }
+
+    fn as_context_provider(
+        provider: &Arc<crate::context::BufferedContextProvider>,
+    ) -> Arc<dyn crate::context::ContextProvider> {
+        provider.clone()
+    }
+
+    fn line_context_scope(channel_id: &str) -> crate::context::ContextScope {
+        crate::context::ContextScope::new("line", channel_id, None, TEST_LINE_CONTEXT_BOT_ID)
+    }
+
+    fn context_provider_registry(
+        provider: Arc<dyn crate::context::ContextProvider>,
+    ) -> crate::ContextProviderRegistry {
+        let mut providers = HashMap::new();
+        providers.insert("line".into(), provider);
+        Arc::new(providers)
+    }
+
+    fn context_bot_id_registry() -> crate::ContextBotIdRegistry {
+        let mut bot_ids = HashMap::new();
+        bot_ids.insert("line".into(), TEST_LINE_CONTEXT_BOT_ID.into());
+        Arc::new(bot_ids)
+    }
+
     #[tokio::test]
     async fn download_line_image_resizes_and_returns_attachment() {
         let server = MockServer::start().await;
@@ -932,8 +914,8 @@ mod tests {
             &reqwest::Client::new(),
             Some("line_token"),
             &server.uri(),
-            &Arc::new(std::sync::Mutex::new(HashMap::new())),
-            &test_line_group_context_config(),
+            None,
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .expect("image event should produce a gateway event");
@@ -984,6 +966,8 @@ mod tests {
             &reqwest::Client::new(),
             Some("line_token"),
             &server.uri(),
+            None,
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .expect("audio event should produce a gateway event");
@@ -1039,6 +1023,8 @@ mod tests {
             &reqwest::Client::new(),
             Some("line_token"),
             &server.uri(),
+            None,
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .expect("audio event should produce a gateway event");
@@ -1152,8 +1138,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &Arc::new(std::sync::Mutex::new(HashMap::new())),
-            &test_line_group_context_config(),
+            None,
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
 
@@ -1190,8 +1176,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &Arc::new(std::sync::Mutex::new(HashMap::new())),
-            &test_line_group_context_config(),
+            None,
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
 
@@ -1226,8 +1212,8 @@ mod tests {
             &reqwest::Client::new(),
             None, // no access token
             LINE_DATA_API_BASE,
-            &Arc::new(std::sync::Mutex::new(HashMap::new())),
-            &test_line_group_context_config(),
+            None,
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
 
@@ -1257,6 +1243,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
+            None,
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
 
@@ -1287,8 +1275,10 @@ mod tests {
             event_tx,
             reply_token_cache: Arc::new(std::sync::Mutex::new(HashMap::new())),
             line_webhook_semaphore: Arc::new(Semaphore::new(crate::LINE_WEBHOOK_CONCURRENCY_MAX)),
-            line_group_context_buffer: Arc::new(std::sync::Mutex::new(HashMap::new())),
-            line_group_context_config: test_line_group_context_config(),
+            context_providers: context_provider_registry(as_context_provider(
+                &disabled_line_context_provider(),
+            )),
+            context_bot_ids: context_bot_id_registry(),
             client: reqwest::Client::new(),
         });
 
@@ -1356,8 +1346,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &Arc::new(std::sync::Mutex::new(HashMap::new())),
-            &test_line_group_context_config(),
+            None,
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
         assert!(result.is_some());
@@ -1367,46 +1357,38 @@ mod tests {
 
     #[tokio::test]
     async fn group_message_drops_without_buffer_when_context_disabled() {
-        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+        let provider = disabled_line_context_provider();
         let event = make_group_text_event("hey everyone", false);
         let result = build_gateway_event_from_line_event(
             &event,
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &test_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
         assert!(result.is_none());
-        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
-        assert!(
-            guard.get("C001").is_none(),
-            "context disabled should preserve original drop behavior"
-        );
+        assert_eq!(provider.buffered_len(&line_context_scope("C001")), 0);
     }
 
     #[tokio::test]
     async fn group_message_buffers_when_bot_not_mentioned_and_context_enabled() {
-        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+        let provider = enabled_line_context_provider();
         let event = make_group_text_event("hey everyone", false);
         let result = build_gateway_event_from_line_event(
             &event,
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
         assert!(result.is_none());
-        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
         assert_eq!(
-            guard
-                .get("C001")
-                .and_then(|entry| entry.front())
-                .map(|m| m.text.as_str()),
-            Some("hey everyone")
+            provider.buffered_texts(&line_context_scope("C001")),
+            vec!["hey everyone"]
         );
     }
 
@@ -1423,8 +1405,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &Arc::new(std::sync::Mutex::new(HashMap::new())),
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&enabled_line_context_provider())),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
         assert!(result.is_none());
@@ -1443,8 +1425,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &Arc::new(std::sync::Mutex::new(HashMap::new())),
-            &test_line_group_context_config(),
+            None,
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
         assert!(result.is_some());
@@ -1452,7 +1434,7 @@ mod tests {
 
     #[tokio::test]
     async fn group_message_buffers_then_injects_context_on_later_mention() {
-        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+        let provider = enabled_line_context_provider();
 
         let first = make_group_text_event("今天下午兩點開會", false);
         let first_result = build_gateway_event_from_line_event(
@@ -1460,8 +1442,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await;
         assert!(
@@ -1475,8 +1457,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .expect("mentioned message should produce an event");
@@ -1484,7 +1466,7 @@ mod tests {
         assert!(second_result
             .content
             .text
-            .contains("[Recent group context before this direct mention]"));
+            .contains("[Recent conversation context before this trigger]"));
         assert!(second_result
             .content
             .text
@@ -1492,18 +1474,14 @@ mod tests {
         assert!(second_result
             .content
             .text
-            .contains("[Current directly mentioned message]"));
+            .contains("[Current message - respond to this]"));
         assert!(second_result.content.text.contains("@Bot 幫我總結一下"));
-        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
-        assert!(
-            guard.get("C001").is_none(),
-            "buffer should drain after injection"
-        );
+        assert_eq!(provider.buffered_len(&line_context_scope("C001")), 0);
     }
 
     #[tokio::test]
     async fn direct_mention_without_buffer_keeps_original_text() {
-        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+        let provider = enabled_line_context_provider();
 
         let event = make_group_text_event("@Bot 現在狀況如何", true);
         let result = build_gateway_event_from_line_event(
@@ -1511,8 +1489,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .expect("mentioned message should produce an event");
@@ -1522,7 +1500,7 @@ mod tests {
 
     #[tokio::test]
     async fn multiple_buffered_messages_preserve_order_on_injection() {
-        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+        let provider = enabled_line_context_provider();
 
         let first: LineEvent = serde_json::from_value(serde_json::json!({
             "type": "message",
@@ -1542,8 +1520,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .is_none());
@@ -1552,8 +1530,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .is_none());
@@ -1564,8 +1542,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .expect("mentioned message should produce an event");
@@ -1583,7 +1561,7 @@ mod tests {
         let current_idx = result
             .content
             .text
-            .find("[Current directly mentioned message]")
+            .find("[Current message - respond to this]")
             .expect("current message header present");
 
         assert!(
@@ -1596,80 +1574,9 @@ mod tests {
         );
     }
 
-    #[test]
-    fn group_context_buffer_keeps_latest_messages_within_bounds() {
-        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
-        let config = test_line_group_context_config();
-
-        for i in 0..(config.max_messages + 5) {
-            buffer_line_group_context(
-                &buffer,
-                &config,
-                "C001",
-                "U_sender",
-                &format!("message {i}"),
-            );
-        }
-
-        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
-        let entry = guard.get("C001").expect("buffer should exist");
-
-        assert_eq!(entry.len(), config.max_messages);
-        assert_eq!(entry.front().unwrap().text, "message 5");
-        assert_eq!(
-            entry.back().unwrap().text,
-            format!("message {}", config.max_messages + 4)
-        );
-        assert!(
-            line_group_context_char_count(entry) <= config.max_chars,
-            "buffer should stay within character budget"
-        );
-    }
-
-    #[test]
-    fn group_context_buffer_enforces_total_character_budget() {
-        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
-        let config = test_line_group_context_config();
-        let large = "x".repeat(config.max_chars / 2);
-
-        buffer_line_group_context(
-            &buffer,
-            &config,
-            "C001",
-            "U_sender",
-            &format!("old {large}"),
-        );
-        buffer_line_group_context(
-            &buffer,
-            &config,
-            "C001",
-            "U_sender",
-            &format!("middle {large}"),
-        );
-        buffer_line_group_context(
-            &buffer,
-            &config,
-            "C001",
-            "U_sender",
-            &format!("latest {large}"),
-        );
-
-        let guard = buffer.lock().unwrap_or_else(|e| e.into_inner());
-        let entry = guard.get("C001").expect("buffer should exist");
-
-        assert!(
-            line_group_context_char_count(entry) <= config.max_chars,
-            "buffer should stay within character budget"
-        );
-        assert!(
-            entry.back().unwrap().text.starts_with("latest "),
-            "latest context should be retained when trimming old messages"
-        );
-    }
-
     #[tokio::test]
     async fn buffer_is_chat_local_and_not_reused_after_drain() {
-        let buffer = Arc::new(std::sync::Mutex::new(HashMap::new()));
+        let provider = enabled_line_context_provider();
 
         let buffered: LineEvent = serde_json::from_value(serde_json::json!({
             "type": "message",
@@ -1683,8 +1590,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .is_none());
@@ -1706,8 +1613,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .expect("other chat mention should produce an event");
@@ -1722,8 +1629,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .expect("same chat mention should produce an event");
@@ -1738,8 +1645,8 @@ mod tests {
             &reqwest::Client::new(),
             None,
             LINE_DATA_API_BASE,
-            &buffer,
-            &enabled_line_group_context_config(),
+            Some(as_context_provider(&provider)),
+            TEST_LINE_CONTEXT_BOT_ID,
         )
         .await
         .expect("second same-chat mention should produce an event");
diff --git a/gateway/src/adapters/teams.rs b/gateway/src/adapters/teams.rs
index 6043a460a..d70d6c6e2 100644
--- a/gateway/src/adapters/teams.rs
+++ b/gateway/src/adapters/teams.rs
@@ -666,8 +666,8 @@ mod tests {
             event_tx,
             reply_token_cache: Arc::new(std::sync::Mutex::new(std::collections::HashMap::new())),
             line_webhook_semaphore: Arc::new(tokio::sync::Semaphore::new(crate::LINE_WEBHOOK_CONCURRENCY_MAX)),
-            line_group_context_buffer: Arc::new(std::sync::Mutex::new(std::collections::HashMap::new())),
-            line_group_context_config: crate::LineGroupContextConfig::default(),
+            context_providers: Arc::new(std::collections::HashMap::new()),
+            context_bot_ids: Arc::new(std::collections::HashMap::new()),
             client: reqwest::Client::new(),
         })
     }
diff --git a/gateway/src/context/api_fetch.rs b/gateway/src/context/api_fetch.rs
new file mode 100644
index 000000000..fce4ead80
--- /dev/null
+++ b/gateway/src/context/api_fetch.rs
@@ -0,0 +1,20 @@
+use super::{ContextFetchRequest, ContextMessage, ContextObserveRequest, ContextProvider};
+
+#[derive(Clone, Debug, Default)]
+#[allow(dead_code)]
+pub struct ApiFetchContextProvider;
+
+#[async_trait::async_trait]
+impl ContextProvider for ApiFetchContextProvider {
+    fn is_enabled(&self) -> bool {
+        false
+    }
+
+    async fn observe(&self, _request: ContextObserveRequest) -> bool {
+        false
+    }
+
+    async fn fetch_context(&self, _request: ContextFetchRequest) -> Option<Vec<ContextMessage>> {
+        None
+    }
+}
diff --git a/gateway/src/context/buffered.rs b/gateway/src/context/buffered.rs
new file mode 100644
index 000000000..19b802e5a
--- /dev/null
+++ b/gateway/src/context/buffered.rs
@@ -0,0 +1,243 @@
+use super::{
+    ContextConfig, ContextFetchRequest, ContextMessage, ContextObserveRequest, ContextProvider,
+    ContextScope,
+};
+use std::collections::{HashMap, VecDeque};
+use std::sync::Arc;
+use std::time::Instant;
+
+#[derive(Clone, Debug)]
+struct BufferedContextMessage {
+    message: ContextMessage,
+    observed_at: Instant,
+}
+
+#[derive(Clone, Debug)]
+pub struct BufferedContextProvider {
+    config: ContextConfig,
+    buffers: Arc<std::sync::Mutex<HashMap<ContextScope, VecDeque<BufferedContextMessage>>>>,
+}
+
+impl BufferedContextProvider {
+    pub fn new(config: ContextConfig) -> Self {
+        Self {
+            config,
+            buffers: Arc::new(std::sync::Mutex::new(HashMap::new())),
+        }
+    }
+
+    #[cfg(test)]
+    pub fn buffered_texts(&self, scope: &ContextScope) -> Vec<String> {
+        let guard = self.buffers.lock().unwrap_or_else(|e| e.into_inner());
+        guard
+            .get(scope)
+            .map(|entry| {
+                entry
+                    .iter()
+                    .map(|message| message.message.text.clone())
+                    .collect()
+            })
+            .unwrap_or_default()
+    }
+
+    #[cfg(test)]
+    pub fn buffered_len(&self, scope: &ContextScope) -> usize {
+        let guard = self.buffers.lock().unwrap_or_else(|e| e.into_inner());
+        guard.get(scope).map(VecDeque::len).unwrap_or_default()
+    }
+
+    fn prune_expired(&self, entry: &mut VecDeque<BufferedContextMessage>) {
+        let now = Instant::now();
+        entry.retain(|m| now.duration_since(m.observed_at).as_secs() < self.config.ttl_secs);
+    }
+
+    /// Evicts the oldest messages until `entry` fits `max_messages` and the character budget.
+    fn enforce_limits(&self, entry: &mut VecDeque<BufferedContextMessage>, max_messages: usize) {
+        entry.drain(..entry.len().saturating_sub(max_messages));
+        // The newest message is always kept, even if it alone exceeds `max_chars`.
+        while entry.len() > 1 && context_char_count(entry) > self.config.max_chars {
+            entry.pop_front();
+        }
+    }
+}
+
+#[async_trait::async_trait]
+impl ContextProvider for BufferedContextProvider {
+    fn is_enabled(&self) -> bool {
+        self.config.enabled
+    }
+
+    async fn observe(&self, request: ContextObserveRequest) -> bool {
+        let trimmed = request.text.trim();
+        if !self.config.enabled
+            || self.config.max_messages == 0
+            || self.config.max_chars == 0
+            || trimmed.is_empty()
+        {
+            return false;
+        }
+
+        let mut guard = self.buffers.lock().unwrap_or_else(|e| e.into_inner());
+        let entry = guard.entry(request.scope).or_default();
+        self.prune_expired(entry);
+
+        let bounded_text: String = trimmed.chars().take(self.config.max_chars).collect();
+        entry.push_back(BufferedContextMessage {
+            message: ContextMessage {
+                sender_id: request.sender_id,
+                sender_label: request.sender_label,
+                text: bounded_text,
+            },
+            observed_at: Instant::now(),
+        });
+        self.enforce_limits(entry, self.config.max_messages);
+        true
+    }
+
+    async fn fetch_context(&self, request: ContextFetchRequest) -> Option<Vec<ContextMessage>> {
+        if !self.config.enabled || self.config.max_messages == 0 || self.config.max_chars == 0 {
+            return None;
+        }
+
+        let mut guard = self.buffers.lock().unwrap_or_else(|e| e.into_inner());
+        let mut entry = guard.remove(&request.scope)?;
+        self.prune_expired(&mut entry);
+
+        let max_messages = request
+            .limit
+            .unwrap_or(self.config.max_messages)
+            .min(self.config.max_messages);
+        self.enforce_limits(&mut entry, max_messages);
+
+        if entry.is_empty() {
+            None
+        } else {
+            Some(entry.into_iter().map(|message| message.message).collect())
+        }
+    }
+}
+
+/// Total budget cost of `entry`, counted in Unicode scalar values rather than bytes.
+fn context_char_count(entry: &VecDeque<BufferedContextMessage>) -> usize {
+    let mut total = 0;
+    for buffered in entry {
+        let msg = &buffered.message;
+        // Each message costs its label, id and text, plus 2 extra characters.
+        let fields = [&msg.sender_label, &msg.sender_id, &msg.text];
+        total += fields.iter().map(|s| s.chars().count()).sum::<usize>() + 2;
+    }
+    total
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    fn enabled_provider(max_messages: usize, max_chars: usize) -> BufferedContextProvider {
+        BufferedContextProvider::new(ContextConfig {
+            enabled: true,
+            ttl_secs: 24 * 60 * 60,
+            max_messages,
+            max_chars,
+        })
+    }
+
+    fn scope(channel: &str) -> ContextScope {
+        ContextScope::new("line", channel, None, "line-default-bot")
+    }
+
+    async fn observe(provider: &BufferedContextProvider, scope: ContextScope, text: &str) {
+        provider
+            .observe(ContextObserveRequest {
+                scope,
+                sender_id: "U_sender".into(),
+                sender_label: "U_sender".into(),
+                text: text.into(),
+            })
+            .await;
+    }
+
+    #[tokio::test]
+    async fn observe_fetches_and_drains_context() {
+        let provider = enabled_provider(50, 8_000);
+        let scope = scope("C001");
+
+        observe(&provider, scope.clone(), "hello").await;
+        let context = provider
+            .fetch_context(ContextFetchRequest {
+                scope: scope.clone(),
+                limit: None,
+            })
+            .await
+            .expect("context should be returned");
+
+        assert_eq!(context.len(), 1);
+        assert_eq!(context[0].text, "hello");
+        assert!(provider
+            .fetch_context(ContextFetchRequest { scope, limit: None })
+            .await
+            .is_none());
+    }
+
+    #[tokio::test]
+    async fn observe_is_noop_when_disabled() {
+        let provider = BufferedContextProvider::new(ContextConfig::default());
+        let scope = scope("C001");
+
+        observe(&provider, scope.clone(), "hello").await;
+
+        assert_eq!(provider.buffered_len(&scope), 0);
+    }
+
+    #[tokio::test]
+    async fn max_messages_keeps_latest_context() {
+        let provider = enabled_provider(2, 8_000);
+        let scope = scope("C001");
+
+        observe(&provider, scope.clone(), "first").await;
+        observe(&provider, scope.clone(), "second").await;
+        observe(&provider, scope.clone(), "third").await;
+
+        assert_eq!(provider.buffered_texts(&scope), vec!["second", "third"]);
+    }
+
+    #[tokio::test]
+    async fn max_chars_trims_old_context() {
+        let provider = enabled_provider(10, 20);
+        let scope = scope("C001");
+
+        observe(&provider, scope.clone(), "first long message").await;
+        observe(&provider, scope.clone(), "second long message").await;
+        // Each message alone already exceeds the 20-char budget, so only the newest survives.
+        let texts = provider.buffered_texts(&scope);
+        assert_eq!(texts.len(), 1, "older message should be evicted");
+        assert_eq!(
+            texts.last().map(String::as_str),
+            Some("second long message")
+        );
+    }
+
+    #[tokio::test]
+    async fn scope_isolation_prevents_cross_chat_leakage() {
+        let provider = enabled_provider(50, 8_000);
+        let first = scope("C001");
+        let second = scope("C002");
+
+        observe(&provider, first.clone(), "first chat").await;
+
+        assert!(provider
+            .fetch_context(ContextFetchRequest {
+                scope: second,
+                limit: None,
+            })
+            .await
+            .is_none());
+        assert!(provider
+            .fetch_context(ContextFetchRequest {
+                scope: first,
+                limit: None,
+            })
+            .await
+            .is_some());
+    }
+}
diff --git a/gateway/src/context/config.rs b/gateway/src/context/config.rs
new file mode 100644
index 000000000..a9f27bcc0
--- /dev/null
+++ b/gateway/src/context/config.rs
@@ -0,0 +1,98 @@
+pub const DEFAULT_CONTEXT_TTL_HOURS: u64 = 24;
+pub const DEFAULT_CONTEXT_MAX_MESSAGES: usize = 50;
+pub const DEFAULT_CONTEXT_MAX_CHARS: usize = 8_000;
+
+#[derive(Clone, Debug)]
+pub struct ContextConfig {
+    pub enabled: bool,
+    pub ttl_secs: u64,
+    pub max_messages: usize,
+    pub max_chars: usize,
+}
+
+impl Default for ContextConfig {
+    fn default() -> Self {
+        Self {
+            enabled: false,
+            ttl_secs: DEFAULT_CONTEXT_TTL_HOURS * 60 * 60,
+            max_messages: DEFAULT_CONTEXT_MAX_MESSAGES,
+            max_chars: DEFAULT_CONTEXT_MAX_CHARS,
+        }
+    }
+}
+
+impl ContextConfig {
+    pub fn from_env_with_prefixes(prefixes: &[&str]) -> Self {
+        let defaults = Self::default();
+        let ttl_hours =
+            read_positive_env_u64(prefixes, "CONTEXT_TTL_HOURS", DEFAULT_CONTEXT_TTL_HOURS);
+
+        Self {
+            enabled: read_bool_env(prefixes, "CONTEXT_ENABLED", defaults.enabled),
+            ttl_secs: ttl_hours.saturating_mul(60 * 60),
+            max_messages: read_positive_env_usize(
+                prefixes,
+                "CONTEXT_MAX_MESSAGES",
+                defaults.max_messages,
+            ),
+            max_chars: read_positive_env_usize(prefixes, "CONTEXT_MAX_CHARS", defaults.max_chars),
+        }
+    }
+}
+
+fn read_bool_env(prefixes: &[&str], suffix: &str, default: bool) -> bool {
+    env_names(prefixes, suffix)
+        .into_iter()
+        .find_map(|name| {
+            std::env::var(name)
+                .ok()
+                .map(|v| v == "1" || v.eq_ignore_ascii_case("true"))
+        })
+        .unwrap_or(default)
+}
+
+fn read_positive_env_u64(prefixes: &[&str], suffix: &str, default: u64) -> u64 {
+    env_names(prefixes, suffix)
+        .into_iter()
+        .find_map(|name| {
+            std::env::var(name)
+                .ok()
+                .and_then(|v| v.parse::<u64>().ok())
+                .filter(|v| *v > 0)
+        })
+        .unwrap_or(default)
+}
+
+fn read_positive_env_usize(prefixes: &[&str], suffix: &str, default: usize) -> usize {
+    env_names(prefixes, suffix)
+        .into_iter()
+        .find_map(|name| {
+            std::env::var(name)
+                .ok()
+                .and_then(|v| v.parse::<usize>().ok())
+                .filter(|v| *v > 0)
+        })
+        .unwrap_or(default)
+}
+
+fn env_names(prefixes: &[&str], suffix: &str) -> Vec<String> {
+    prefixes
+        .iter()
+        .map(|prefix| format!("{prefix}_{suffix}"))
+        .collect()
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn default_context_config_is_disabled_and_bounded() {
+        let config = ContextConfig::default();
+
+        assert!(!config.enabled);
+        assert_eq!(config.ttl_secs, 24 * 60 * 60);
+        assert_eq!(config.max_messages, 50);
+        assert_eq!(config.max_chars, 8_000);
+    }
+}
diff --git a/gateway/src/context/mod.rs b/gateway/src/context/mod.rs
new file mode 100644
index 000000000..d728745a4
--- /dev/null
+++ b/gateway/src/context/mod.rs
@@ -0,0 +1,116 @@
+pub mod api_fetch;
+pub mod buffered;
+pub mod config;
+
+pub use buffered::BufferedContextProvider;
+pub use config::ContextConfig;
+
+#[derive(Clone, Debug, Eq, PartialEq, Hash)]
+pub struct ContextScope {
+    pub platform: String,
+    pub channel_id: String,
+    pub thread_id: Option<String>,
+    pub bot_id: String,
+}
+
+impl ContextScope {
+    pub fn new(
+        platform: impl Into<String>,
+        channel_id: impl Into<String>,
+        thread_id: Option<String>,
+        bot_id: impl Into<String>,
+    ) -> Self {
+        Self {
+            platform: platform.into(),
+            channel_id: channel_id.into(),
+            thread_id,
+            bot_id: bot_id.into(),
+        }
+    }
+}
+
+#[derive(Clone, Debug)]
+pub struct ContextMessage {
+    pub sender_id: String,
+    pub sender_label: String,
+    pub text: String,
+}
+
+#[derive(Clone, Debug)]
+pub struct ContextObserveRequest {
+    pub scope: ContextScope,
+    pub sender_id: String,
+    pub sender_label: String,
+    pub text: String,
+}
+
+#[derive(Clone, Debug)]
+pub struct ContextFetchRequest {
+    pub scope: ContextScope,
+    pub limit: Option<usize>,
+}
+
+#[async_trait::async_trait]
+pub trait ContextProvider: Send + Sync {
+    fn is_enabled(&self) -> bool;
+
+    async fn observe(&self, request: ContextObserveRequest) -> bool;
+
+    async fn fetch_context(&self, request: ContextFetchRequest) -> Option<Vec<ContextMessage>>;
+}
+
+pub fn inject_context(context: &[ContextMessage], current_text: &str) -> String {
+    if context.is_empty() {
+        return current_text.to_string();
+    }
+    // Reserve for: header + one line per message + blank separator + marker + current text.
+    let mut lines = Vec::with_capacity(context.len() + 4);
+    lines.push("[Recent conversation context before this trigger]".to_string());
+    for message in context {
+        let label = if message.sender_label.trim().is_empty() {
+            message.sender_id.as_str()
+        } else {
+            message.sender_label.as_str()
+        };
+        lines.push(format!("{}: {}", label, message.text));
+    }
+    lines.push(String::new());
+    lines.push("[Current message - respond to this]".to_string());
+    lines.push(current_text.to_string());
+    lines.join("\n")
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn inject_context_wraps_history_and_current_message() {
+        let text = inject_context(
+            &[
+                ContextMessage {
+                    sender_id: "U1".into(),
+                    sender_label: "Alice".into(),
+                    text: "first".into(),
+                },
+                ContextMessage {
+                    sender_id: "U2".into(),
+                    sender_label: "Bob".into(),
+                    text: "second".into(),
+                },
+            ],
+            "@Bot summarize",
+        );
+
+        assert!(text.contains("[Recent conversation context before this trigger]"));
+        assert!(text.contains("Alice: first"));
+        assert!(text.contains("Bob: second"));
+        assert!(text.contains("[Current message - respond to this]"));
+        assert!(text.contains("@Bot summarize"));
+    }
+
+    #[test]
+    fn inject_context_keeps_current_message_when_history_empty() {
+        assert_eq!(inject_context(&[], "hello"), "hello");
+    }
+}
diff --git a/gateway/src/main.rs b/gateway/src/main.rs
index 76a8927e8..8aba99f61 100644
--- a/gateway/src/main.rs
+++ b/gateway/src/main.rs
@@ -1,4 +1,5 @@
 mod adapters;
+mod context;
 mod media;
 mod schema;
 pub mod store;
@@ -12,7 +13,7 @@ use axum::{
 };
 use futures_util::{SinkExt, StreamExt};
 use schema::GatewayReply;
-use std::collections::{HashMap, VecDeque};
+use std::collections::HashMap;
 use std::sync::Arc;
 use std::time::Instant;
 use tokio::sync::{broadcast, Mutex, Semaphore};
@@ -38,85 +39,8 @@ pub const REPLY_TOKEN_CACHE_MAX: usize = 10_000;
 /// fast 200 OK response path.
 pub const LINE_WEBHOOK_CONCURRENCY_MAX: usize = 8;
 
-pub const LINE_GROUP_CONTEXT_DEFAULT_TTL_HOURS: u64 = 24;
-pub const LINE_GROUP_CONTEXT_DEFAULT_MAX_MESSAGES: usize = 100;
-pub const LINE_GROUP_CONTEXT_DEFAULT_MAX_CHARS: usize = 8_000;
-
-#[derive(Clone, Debug)]
-pub struct LineGroupContextConfig {
-    /// Enables opt-in capture of unmentioned LINE group text.
-    pub enabled: bool,
-    /// How long unmentioned LINE group text stays eligible for later prompt injection.
-    pub ttl_secs: u64,
-    /// Maximum buffered unmentioned LINE text messages per group/room.
-    pub max_messages: usize,
-    /// Maximum total buffered text characters per LINE group/room.
-    pub max_chars: usize,
-}
-
-impl Default for LineGroupContextConfig {
-    fn default() -> Self {
-        Self {
-            enabled: false,
-            ttl_secs: LINE_GROUP_CONTEXT_DEFAULT_TTL_HOURS * 60 * 60,
-            max_messages: LINE_GROUP_CONTEXT_DEFAULT_MAX_MESSAGES,
-            max_chars: LINE_GROUP_CONTEXT_DEFAULT_MAX_CHARS,
-        }
-    }
-}
-
-impl LineGroupContextConfig {
-    fn from_env() -> Self {
-        let defaults = Self::default();
-        let ttl_hours = read_positive_env_u64(
-            "LINE_GROUP_CONTEXT_TTL_HOURS",
-            LINE_GROUP_CONTEXT_DEFAULT_TTL_HOURS,
-        );
-        Self {
-            enabled: read_bool_env("LINE_GROUP_CONTEXT_ENABLED", defaults.enabled),
-            ttl_secs: ttl_hours.saturating_mul(60 * 60),
-            max_messages: read_positive_env_usize(
-                "LINE_GROUP_CONTEXT_MAX_MESSAGES",
-                defaults.max_messages,
-            ),
-            max_chars: read_positive_env_usize("LINE_GROUP_CONTEXT_MAX_CHARS", defaults.max_chars),
-        }
-    }
-}
-
-fn read_bool_env(name: &str, default: bool) -> bool {
-    std::env::var(name)
-        .map(|v| v == "1" || v.eq_ignore_ascii_case("true"))
-        .unwrap_or(default)
-}
-
-fn read_positive_env_u64(name: &str, default: u64) -> u64 {
-    std::env::var(name)
-        .ok()
-        .and_then(|v| v.parse::<u64>().ok())
-        .filter(|v| *v > 0)
-        .unwrap_or(default)
-}
-
-fn read_positive_env_usize(name: &str, default: usize) -> usize {
-    std::env::var(name)
-        .ok()
-        .and_then(|v| v.parse::<usize>().ok())
-        .filter(|v| *v > 0)
-        .unwrap_or(default)
-}
-
-#[derive(Clone, Debug)]
-pub struct LineBufferedText {
-    pub sender_id: String,
-    pub text: String,
-    pub buffered_at: Instant,
-}
-
-/// Short-lived LINE group/room context captured from unmentioned text messages.
-/// Keyed by groupId/roomId. Drained when a later direct mention arrives.
-pub type LineGroupContextBuffer =
-    Arc<std::sync::Mutex<HashMap<String, VecDeque<LineBufferedText>>>>;
+pub type ContextProviderRegistry = Arc<HashMap<String, Arc<dyn context::ContextProvider>>>;
+pub type ContextBotIdRegistry = Arc<HashMap<String, String>>;
 
 // --- App state (shared across all adapters) ---
 
@@ -152,10 +76,10 @@ pub struct AppState {
     /// Limits concurrent post-ack LINE webhook processing so image bursts do not
     /// turn into unbounded download/decode work.
     pub line_webhook_semaphore: Arc<Semaphore>,
-    /// Short-lived unmentioned LINE group text, used to enrich the next direct-mention turn.
-    pub line_group_context_buffer: LineGroupContextBuffer,
-    /// Tuning knobs for LINE group context capture.
-    pub line_group_context_config: LineGroupContextConfig,
+    /// Gateway-level context providers keyed by platform name.
+    pub context_providers: ContextProviderRegistry,
+    /// Stable bot identity per platform for context isolation in shared chats.
+    pub context_bot_ids: ContextBotIdRegistry,
     /// Shared HTTP client for media downloads and API calls
     pub client: reqwest::Client,
 }
@@ -320,9 +244,26 @@ async fn main() -> Result<()> {
 
     let (event_tx, _) = broadcast::channel::<String>(256);
     let reply_token_cache: ReplyTokenCache = Arc::new(std::sync::Mutex::new(HashMap::new()));
-    let line_group_context_buffer: LineGroupContextBuffer =
-        Arc::new(std::sync::Mutex::new(HashMap::new()));
-    let line_group_context_config = LineGroupContextConfig::from_env();
+    let line_context_config =
+        context::ContextConfig::from_env_with_prefixes(&["LINE_GROUP", "GATEWAY"]);
+    let line_context_bot_id = std::env::var("LINE_CONTEXT_BOT_ID")
+        .or_else(|_| std::env::var("LINE_BOT_ID"))
+        .unwrap_or_else(|_| "line-default-bot".into());
+    if line_context_config.enabled {
+        info!(
+            ttl_secs = line_context_config.ttl_secs,
+            max_messages = line_context_config.max_messages,
+            max_chars = line_context_config.max_chars,
+            "line buffered context provider enabled"
+        );
+    }
+    let mut context_providers = HashMap::<String, Arc<dyn context::ContextProvider>>::new();
+    context_providers.insert(
+        "line".into(),
+        Arc::new(context::BufferedContextProvider::new(line_context_config)),
+    );
+    let mut context_bot_ids = HashMap::new();
+    context_bot_ids.insert("line".into(), line_context_bot_id);
 
     let mut app = Router::new()
         .route("/ws", get(ws_handler))
@@ -497,8 +438,8 @@ async fn main() -> Result<()> {
         event_tx,
         reply_token_cache,
         line_webhook_semaphore: Arc::new(Semaphore::new(LINE_WEBHOOK_CONCURRENCY_MAX)),
-        line_group_context_buffer,
-        line_group_context_config,
+        context_providers: Arc::new(context_providers),
+        context_bot_ids: Arc::new(context_bot_ids),
         client,
     });