Initial release: VARS - personalized LLM with RAG and user vector learning

author: YurenHao0426 <Blackhao0426@gmail.com> 2026-03-18 18:25:09 -0500
committer: YurenHao0426 <Blackhao0426@gmail.com> 2026-03-18 18:25:09 -0500
commit: b6c3e4e51eeab703b40284459c6e9fff2151216c (patch)
tree: 221410886f23214575f93b9ef44fa8431c9a6dfc /src/personalization/models/llm/base.py
1 files changed, 29 insertions, 0 deletions
diff --git a/src/personalization/models/llm/base.py b/src/personalization/models/llm/base.py
new file mode 100644
index 0000000..72b6ca8
--- /dev/null
+++ b/src/personalization/models/llm/base.py
@@ -0,0 +1,29 @@
+from typing import List, Protocol, Optional
+from personalization.types import ChatTurn
+
+class ChatModel(Protocol):
+    def answer(
+        self,
+        history: List[ChatTurn],
+        memory_notes: List[str],
+        max_new_tokens: int = 512,
+        temperature: float = 0.7,
+        top_p: float = 0.9,
+        top_k: Optional[int] = None,
+    ) -> str:
+        """
+        Generate an assistant response given conversation history and memory notes.
+
+        Args:
+            history: The conversation history ending with the current user turn.
+            memory_notes: List of retrieved memory content strings.
+            max_new_tokens: Max tokens to generate.
+            temperature: Sampling temperature.
+            top_p: Top-p sampling.
+            top_k: Top-k sampling.
+
+        Returns:
+            The generated assistant response text.
+        """
+        ...
+
author	YurenHao0426 <Blackhao0426@gmail.com>	2026-03-18 18:25:09 -0500
committer	YurenHao0426 <Blackhao0426@gmail.com>	2026-03-18 18:25:09 -0500
commit	b6c3e4e51eeab703b40284459c6e9fff2151216c (patch)
tree	221410886f23214575f93b9ef44fa8431c9a6dfc /src/personalization/models/llm/base.py