WIP: memory system improvements (in progress)
Adds interview/chat prompt layers, a reply planner, style profiles, memory injection, an interview meta store, and related tests. The work is not finished yet. Made-with: Cursor
This commit is contained in:
@@ -59,23 +59,29 @@ EMBEDDING_MODEL=embedding-3
|
||||
# Chat 访谈:每轮根据用户内容判定主人生阶段(关闭时仅用关键词判定,可省一次 LLM 调用)
|
||||
# CHAT_STAGE_DETECTION_ENABLED=true
|
||||
# CHAT_STAGE_DETECTION_MAX_TOKENS=128
|
||||
# 访谈性格(InterviewAgent):default | warm_listener | curious_guide
|
||||
# 年代/流行文化联想块(config 默认 true;若减少「文艺硬接」可设 false)
|
||||
# CHAT_ERA_CONTEXT_ENABLED=true
|
||||
# 访谈性格(InterviewAgent):default | warm_listener | curious_guide(config 默认 default)
|
||||
# CHAT_INTERVIEW_PERSONA=default
|
||||
# 访谈回复长度档位(brief / standard / expanded),依次对应:极短输入 / 默认 / 长段且含新细节(若与当前代码不一致,以 config 为准)
|
||||
# CHAT_INTERVIEW_BRIEF_MAX_TOKENS=240
|
||||
# CHAT_INTERVIEW_BRIEF_MAX_CHARS_PER_SEGMENT=180
|
||||
# CHAT_INTERVIEW_EXPANDED_MAX_TOKENS=400
|
||||
# CHAT_INTERVIEW_EXPANDED_MAX_CHARS_PER_SEGMENT=300
|
||||
# 访谈/开场采样温度(略高于 LLM_TEMPERATURE 时口语更活)
|
||||
# 访谈/开场采样温度(config 默认 0.93;偏「好访谈者」体验时可试 0.60~0.70)
|
||||
# CHAT_INTERVIEW_TEMPERATURE=0.93
|
||||
# 访谈主回复:统一 max_tokens / 单段字数(代码截断)
|
||||
# CHAT_INTERVIEW_MAX_TOKENS=380
|
||||
# CHAT_INTERVIEW_MAX_CHARS_PER_SEGMENT=260
|
||||
# CHAT_INTERVIEW_MAX_TOKENS=512
|
||||
# CHAT_INTERVIEW_MAX_CHARS_PER_SEGMENT=380
|
||||
# CHAT_INTERVIEW_MAX_SEGMENTS=2
|
||||
# 访谈:是否按本轮用户话检索记忆并注入提示词(关则不调 retrieve)
|
||||
# CHAT_MEMORY_RETRIEVAL_ENABLED=true
|
||||
# CHAT_MEMORY_TOP_K=8
|
||||
# CHAT_MEMORY_EVIDENCE_MAX_CHARS=4096
|
||||
# 规则 TurnPlan 之后再调一轮 JSON focus planner(config 默认 false;设为 true 才开启,开启后每轮多一次 LLM 调用)
|
||||
# CHAT_REPLY_PLANNER_LLM_ENABLED=true
|
||||
# CHAT_REPLY_PLANNER_MAX_TOKENS=256
|
||||
# CHAT_REPLY_PLANNER_TEMPERATURE=0.2
|
||||
|
||||
# Memoir:批处理/抽取更新 slot 时是否允许改写 MemoirState.current_stage(默认 false,访谈 switch_stage 仍可推进)
|
||||
# True 时仅当 proposed 与 existing 在同一 chat_bucket 才对齐 current_stage
|
||||
|
||||
Reference in New Issue
Block a user