Spaces:

Illia56
/

MineCraftAI

Runtime error

App Files Community

Illia56 committed 14 days ago

Commit

125c7fd

verified ·

1 Parent(s): b70539a

Upload 3 files

Browse files

Files changed (2) hide show

config.json +96 -87
rag.py +86 -71

config.json CHANGED Viewed

@@ -32,11 +32,11 @@
                 },
                 {
                     "input": "Следуй за мной и убивай встречных зомби",
-                    "output": {"type": "follow_me", "message": "Хорошо, я буду следовать за вами и убивать встречных зомби", "repeat": true, "secondary_action": {"type": "kill_mob", "mob": "EntityZombie", "repeat": true}}
                 },
                 {
                     "input": "Иди за мной и добывай камень",
-                    "output": {"type": "follow_me", "message": "Хорошо, я буду следовать за вами и добывать камень", "repeat": true, "secondary_action": {"type": "break_block", "blocks": ["minecraft:stone"], "repeat": true}}
                 }
             ]
         },
@@ -117,28 +117,28 @@
             ]
         },
         "break_block": {
-            "description": "Команда для ломания блоков",
             "required_fields": ["type", "message", "repeat", "blocks", "quantity"],
             "examples": [
                 {
                     "input": "Сломай землю",
-                    "output": {"type": "break_block", "message": "Хорошо, я сломаю землю", "repeat": false, "blocks": ["minecraft:dirt"], "quantity": 1, "location": ""}
                 },
                 {
                     "input": "Сломай 20 земли",
-                    "output": {"type": "break_block", "message": "Хорошо, я сломаю 20 блоков земли", "repeat": false, "quantity": 20, "blocks": ["minecraft:dirt"], "location": ""}
                 },
                 {
                     "input": "Копай камень",
-                    "output": {"type": "break_block", "message": "Хорошо, я буду копать камень", "repeat": true, "blocks": ["minecraft:stone"], "quantity": 0, "location": ""}
                 },
                 {
                     "input": "Копай вниз",
-                    "output": {"type": "break_block", "message": "Хорошо, я буду копать вниз", "repeat": true, "blocks": [], "quantity": 0, "location": "вниз"}
                 },
                 {
                     "input": "Добудь руду на севере",
-                    "output": {"type": "break_block", "message": "Хорошо, я добуду руду на севере", "repeat": false, "blocks": [], "quantity": 0, "location": "на севере"}
                 }
             ]
         },
@@ -157,60 +157,60 @@
             ]
         },
         "fishing": {
-            "description": "Команда для ловли рыбы",
-            "required_fields": ["type", "repeat", "quantity", "message"],
             "examples": [
                 {
                     "input": "Слови рыбу",
-                    "output": {"type": "fishing", "repeat": false, "quantity": 1, "message": "Хорошо, я поймаю рыбу"}
                 },
                 {
                     "input": "Лови рыбу",
-                    "output": {"type": "fishing", "repeat": true, "quantity": 0, "message": "Хорошо, я буду ловить рыбу"}
                 },
                 {
                     "input": "Слови 10 рыб",
-                    "output": {"type": "fishing", "repeat": false, "quantity": 10, "message": "Хорошо, я поймаю 10 рыб"}
                 }
             ]
         },
         "shear_wool": {
-            "description": "Команда для стрижки овец",
-            "required_fields": ["type", "repeat", "quantity", "message"],
             "examples": [
                 {
                     "input": "Постриги овец",
-                    "output": {"type": "shear_wool", "repeat": false, "quantity": 0, "message": "Хорошо, я постригу овец"}
                 },
                 {
                     "input": "Стриги овец",
-                    "output": {"type": "shear_wool", "repeat": true, "quantity": 0, "message": "Хорошо, я буду стричь овец"}
                 },
                 {
                     "input": "Постриги 10 овец",
-                    "output": {"type": "shear_wool", "repeat": false, "quantity": 10, "message": "Хорошо, я постригу 10 овец"}
                 }
             ]
         },
         "lighting": {
             "description": "Команда для освещения или размещения источников света",
-            "required_fields": ["type", "message", "quantity"],
             "examples": [
                 {
                     "input": "Подсвети мне",
-                    "output": {"type": "lighting", "message": "Хорошо, я буду освещать путь", "quantity": 0}
                 },
                 {
                     "input": "Освещай",
-                    "output": {"type": "lighting", "message": "Включаю освещение", "quantity": 0}
                 },
                 {
                     "input": "Поставь 10 факелов",
-                    "output": {"type": "lighting", "message": "Хорошо, я поставлю 10 факелов", "quantity": 10}
                 },
                 {
                     "input": "Расставь факелы вокруг дома",
-                    "output": {"type": "lighting", "message": "Хорошо, я расставлю факелы вокруг дома", "quantity": 0}
                 }
             ]
         },
@@ -234,74 +234,83 @@
         }
     },
     "system_prompt_template": {
-        "intro": "You are an AI assistant for the Minecraft game server called CubixWorld. Your task is to understand player requests in Russian and convert them into structured JSON commands with high precision and reliability.",
-        "role_section": [
-            "Analyze player messages carefully to determine their exact intent and required actions",
-            "Convert natural language requests into precise JSON commands following the exact specifications",
-            "Ensure all command parameters are validated and properly formatted",
-            "Respond with valid JSON only, maintaining strict schema compliance",
-            "When uncertain about intent, prefer message responses over incorrect commands",
-            "For conversational messages like greetings, thanks, or jokes, respond in a friendly and engaging manner"
-        ],
-        "command_detection_guidelines": [
-            "Carefully analyze verb forms and temporal indicators to determine command type:",
-            "- Continuous actions: \"продолжай\", \"постоянно\", verbs with \"-ай\" suffix",
-            "- One-time commands: \"сделай\", \"сломай\", \"приди\"",
-            "For compound actions, identify primary and secondary components clearly",
-            "Extract and validate all numeric quantities before including in commands",
-            "Process spatial and directional information with high precision",
-            "For conversational inputs (greetings, thanks, jokes, etc.), use the 'message' type response"
-        ],
-        "contextual_information_processing": [
-            "Prioritize exact matches from documentation over general knowledge",
-            "Cross-reference game mechanics with server-specific features",
-            "Use precise entity IDs as specified in mob mappings",
-            "When documentation provides specific command formats, follow them exactly",
-            "Consider server limitations and restrictions when generating commands"
-        ],
-        "response_format": [
-            "Ensure all JSON responses are properly nested and formatted",
-            "Include all required fields as specified in command schemas",
-            "Validate numeric values are within acceptable ranges",
-            "Use consistent casing and formatting for entity IDs and commands",
-            "Include relevant metadata and context in responses when available"
         ],
-        "conversation_handling": [
-            "For greetings (привет, здравствуй, etc.), respond with a friendly greeting and offer to help",
-            "For questions about your status (как дела, как ты, etc.), respond positively and ask how you can assist",
-            "For expressions of gratitude (спасибо, благодарю, etc.), acknowledge with a friendly response",
-            "For requests for jokes or fun content, respond with a Minecraft-themed joke or fun fact",
-            "Always maintain a helpful, friendly tone appropriate for a game assistant",
-            "Support both Russian and Ukrainian language inputs with appropriate responses"
         ],
-        "rag_processing_instructions": [
-            "When contextual information is provided, carefully analyze and extract specific mechanics, rules, or features unique to CubixWorld",
-            "Prioritize recently retrieved information over older knowledge when they conflict",
-            "When working with information from multiple sources, synthesize a coherent understanding rather than just concatenating facts",
-            "For highly technical queries, extract and include specific numbers, formulas, or technical details from the retrieved content",
-            "Match the terminology used in the retrieved documentation when formulating responses",
-            "If contextual information appears incomplete or contradictory, acknowledge the limitations in your response",
-            "When processing game update information, clearly distinguish between new features and pre-existing ones",
-            "Apply different weights to different sources based on relevance score - prioritize higher scoring sources",
-            "For related items mentioned in context (like tools, weapons, or materials), include their relationships in your understanding",
-            "Always cite specific game mechanics exactly as described in the documentation rather than making assumptions"
         ],
-        "ambiguity_handling": [
-            "For ambiguous commands, identify the specific ambiguity and propose the most likely interpretation",
-            "When a player uses terminology not found in documentation, map to the closest documented concept",
-            "For requests that could map to multiple command types, analyze verb usage and context to determine the most appropriate one",
-            "If a request contains conflicting parameters, prioritize the most recently stated ones",
-            "For vague spatial references, default to the player's current location or field of view",
-            "When uncertain about quantities, default to 1 for singular references and continuous action for plural ones",
-            "For unprecedented or novel requests, combine existing command structures in logical ways rather than rejecting outright"
         ],
-        "token_optimization": [
-            "Focus on the most relevant contextual information, ignoring tangential details",
-            "Maintain brevity in responses while ensuring all required information is included",
-            "When processing documentation, prioritize sections that directly address the current query",
-            "For complex multi-part requests, break down processing into logical components",
-            "Use concise language in responses while maintaining clarity and friendliness",
-            "When multiple similar contextual examples exist, focus on the closest matching ones"
         ]
     }
 }

                 },
                 {
                     "input": "Следуй за мной и убивай встречных зомби",
+                    "output": {"type": "follow_me", "message": "Хорошо, я буду следовать за вами и убивать встречных зомби", "repeat": true}
                 },
                 {
                     "input": "Иди за мной и добывай камень",
+                    "output": {"type": "follow_me", "message": "Хорошо, я буду следовать за вами и добывать камень", "repeat": true}
                 }
             ]
         },
             ]
         },
         "break_block": {
+            "description": "Действие для ломания блока",
             "required_fields": ["type", "message", "repeat", "blocks", "quantity"],
             "examples": [
                 {
                     "input": "Сломай землю",
+                    "output": {"type": "break_block", "message": "Хорошо, я сломаю землю", "repeat": false, "blocks": ["minecraft:dirt"], "quantity": 1}
                 },
                 {
                     "input": "Сломай 20 земли",
+                    "output": {"type": "break_block", "message": "Хорошо, я сломаю 20 блоков земли", "repeat": false, "quantity": 20, "blocks": ["minecraft:dirt"]}
                 },
                 {
                     "input": "Копай камень",
+                    "output": {"type": "break_block", "message": "Хорошо, я буду копать камень", "repeat": true, "blocks": ["minecraft:stone"], "quantity": 0}
                 },
                 {
                     "input": "Копай вниз",
+                    "output": {"type": "break_block", "message": "Хорошо, я буду копать вниз", "repeat": true, "blocks": ["minecraft:stone"], "quantity": 0}
                 },
                 {
                     "input": "Добудь руду на севере",
+                    "output": {"type": "break_block", "message": "Хорошо, я добуду руду на севере", "repeat": false, "blocks": ["minecraft:iron_ore"], "quantity": 0}
                 }
             ]
         },
             ]
         },
         "fishing": {
+            "description": "Ловить рыбу.",
+            "required_fields": ["type", "message", "repeat", "quantity"],
             "examples": [
                 {
                     "input": "Слови рыбу",
+                    "output": {"type": "fishing", "message": "Хорошо, я поймаю рыбу", "repeat": false, "quantity": 1}
                 },
                 {
                     "input": "Лови рыбу",
+                    "output": {"type": "fishing", "message": "Хорошо, я буду ловить рыбу", "repeat": true, "quantity": 0}
                 },
                 {
                     "input": "Слови 10 рыб",
+                    "output": {"type": "fishing", "message": "Хорошо, я поймаю 10 рыб", "repeat": false, "quantity": 10}
                 }
             ]
         },
         "shear_wool": {
+            "description": "Стричь овец",
+            "required_fields": ["type", "message", "repeat", "quantity"],
             "examples": [
                 {
                     "input": "Постриги овец",
+                    "output": {"type": "shear_wool", "message": "Хорошо, я постригу овец", "repeat": false, "quantity": 0}
                 },
                 {
                     "input": "Стриги овец",
+                    "output": {"type": "shear_wool", "message": "Хорошо, я буду стричь овец", "repeat": true, "quantity": 0}
                 },
                 {
                     "input": "Постриги 10 овец",
+                    "output": {"type": "shear_wool", "message": "Хорошо, я постригу 10 овец", "repeat": false, "quantity": 10}
                 }
             ]
         },
         "lighting": {
             "description": "Команда для освещения или размещения источников света",
+            "required_fields": ["type", "message"],
             "examples": [
                 {
                     "input": "Подсвети мне",
+                    "output": {"type": "lighting", "message": "Хорошо, я буду освещать путь"}
                 },
                 {
                     "input": "Освещай",
+                    "output": {"type": "lighting", "message": "Включаю освещение"}
                 },
                 {
                     "input": "Поставь 10 факелов",
+                    "output": {"type": "lighting", "message": "Хорошо, я поставлю 10 факелов"}
                 },
                 {
                     "input": "Расставь факелы вокруг дома",
+                    "output": {"type": "lighting", "message": "Хорошо, я расставлю факелы вокруг дома"}
                 }
             ]
         },
         }
     },
     "system_prompt_template": {
+        "intro": "Ты CubixAssistant для сервера Minecraft CubixWorld. Анализируй запросы игроков и конвертируй их в JSON-команды. ОБРАБАТЫВАЙ ТОЛЬКО ОДНУ КОМАНДУ за раз. При нескольких командах отвечай: {\"type\": \"message\", \"message\": \"Я не могу выполнять несколько задач сразу\"}",
+        "command_rules": [
+            "[ФОРМАТЫ КОМАНД]",
+            "• СТРОГО придерживайся схемы для каждой команды - не добавляй лишних полей",
+            "• Все команды имеют обязательные поля: type, message",
+            "• Определяй repeat: false для одноразовых команд (\"сделай\", \"принеси\") и true для повторяющихся (\"делай\", \"-ай\" окончания)",
+            "• При запросах с нереально большим количеством (>1000) используй type:message",
+            "• Проверяй каждый ответ на соответствие схеме команды",
+            "",
+            "[СХЕМЫ КОМАНД]",
+            "• follow_me: {type, message, repeat}",
+            "• message: {type, message}",
+            "• kill_mob: {type, message, repeat, mob}",
+            "• break_tree: {type, message, repeat, quantityTrees, quantity, blocks}",
+            "• harvest_crops: {type, message, repeat, harvest}",
+            "• break_block: {type, message, repeat, blocks, quantity} - НЕ ДОБАВЛЯТЬ location",
+            "• cycle_break_block: {type, message}",
+            "• fishing: {type, message, repeat, quantity}",
+            "• shear_wool: {type, message, repeat, quantity}",
+            "• lighting: {type, message} - НЕ ДОБАВЛЯТЬ quantity",
+            "• stop: {type, message}"
         ],
+        "validation_checklist": [
+            "[КРИТИЧЕСКИЕ ПРОВЕРКИ]",
+            "1. ТОЛЬКО ОДНА команда в ответе, никаких secondary_actions",
+            "2. ВСЕ обязательные поля присутствуют",
+            "3. Массив blocks НИКОГДА не пустой, для break_block минимум [\"minecraft:stone\"]",
+            "4. Правильные ID мобов из справочника (EntityZombie вместо \"зомби\")",
+            "5. При числах >100000 используй {\"type\": \"message\", \"message\": \"не могу ... такое количество\"}",
+            "6. Запросы \"наруби досок\" = break_tree, а не break_block",
+            "7. НИКОГДА не добавляй поля, которых нет в схеме команды",
+            "8. Для команды lighting НЕ добавляй поле quantity, даже если указано число факелов",
+            "9. Используй ТОЛЬКО существующие блоки Minecraft:",
+            "   • Дерево: minecraft:oak_log, minecraft:spruce_log, minecraft:birch_log, minecraft:acacia_log, minecraft:dark_oak_log",
+            "   • Доски: minecraft:oak_planks, minecraft:spruce_planks, minecraft:birch_planks, minecraft:acacia_planks",
+            "   • Камень: minecraft:stone, minecraft:cobblestone",
+            "   • При неуверенности используй стандартные (oak_log, stone)"
         ],
+        "examples": [
+            "[ПРИМЕРЫ СТРОГО ПО СХЕМЕ]",
+            "Убей зомби → {\"type\": \"kill_mob\", \"message\": \"Хорошо, я иду убивать зомби\", \"repeat\": false, \"mob\": \"EntityZombie\"}",
+            "Копай шахту → {\"type\": \"break_block\", \"message\": \"Буду копать шахту\", \"repeat\": true, \"blocks\": [\"minecraft:stone\"], \"quantity\": 0}",
+            "Наруби 10 досок дуба → {\"type\": \"break_tree\", \"message\": \"Добуду 10 досок дуба\", \"repeat\": false, \"quantityTrees\": 0, \"quantity\": 10, \"blocks\": [\"minecraft:oak_planks\"]}",
+            "Наруби 9999999 досок → {\"type\": \"message\", \"message\": \"К сожалению, я не могу нарубить такое большое количество досок\"}",
+            "Наруби досок каменного дерева → {\"type\": \"message\", \"message\": \"Извините, каменное дерево не существует в Minecraft\"}",
+            "Наруби дерева и убей зомби → {\"type\": \"message\", \"message\": \"Я не могу выполнять несколько задач сразу\"}",
+            "Включи 10 света → {\"type\": \"lighting\", \"message\": \"Хорошо, я поставлю 10 факелов\"}",
+            "Лови рыбу → {\"type\": \"fishing\", \"message\": \"Буду ловить рыбу\", \"repeat\": true, \"quantity\": 0}",
+            "Постриги 5 овец → {\"type\": \"shear_wool\", \"message\": \"Постригу 5 овец\", \"repeat\": false, \"quantity\": 5}",
+            "Копай вот здесь → {\"type\": \"cycle_break_block\", \"message\": \"Буду копать на этом месте\"}"
         ],
+        "error_handlers": [
+            "[ОШИБКИ И ОСОБЫЕ СЛУЧАИ]",
+            "• Несуществующие блоки → {\"type\": \"message\", \"message\": \"Извините, [блок] не существует в Minecraft\"}",
+            "• Огромные числа → {\"type\": \"message\", \"message\": \"К сожалению, я не могу [действие] такое количество\"}",
+            "• Несколько команд → {\"type\": \"message\", \"message\": \"Я не могу выполнять несколько задач сразу\"}",
+            "• Приветствия, вопросы → {\"type\": \"message\", \"message\": \"[дружелюбный ответ]\"}",
+            "• При неоднозначности предпочитай message вместо неверной команды"
         ],
+        "type_detection": [
+            "[ОПРЕДЕЛЕНИЕ ТИПА КОМАНДЫ]",
+            "• follow_me: \"следуй\", \"приди\", \"иди за\"",
+            "• message: общение, вопросы, неизвестные команды",
+            "• kill_mob: \"убей\", \"атакуй\" (мобов)",
+            "• break_tree: \"руби\", \"наруби\" (дерево/доски)",
+            "• harvest_crops: \"собери\", \"собирай\" (урожай)",
+            "• break_block: \"копай\", \"сломай\" (камень/блоки, но не деревья)",
+            "• cycle_break_block: \"копай здесь\", \"ломай под собой\"",
+            "• fishing: \"лови\", \"налови\" (рыбу)",
+            "• shear_wool: \"стриги\" (овец)",
+            "• lighting: \"освещай\", \"поставь факелы\", \"включи свет\"",
+            "• stop: \"стой\", \"хватит\", \"прекрати\""
         ]
     }
 }

rag.py CHANGED Viewed

@@ -88,9 +88,9 @@ class RAGSystem:
         """Create a new knowledge base from scratch"""
         # Backup old index if needed
         if backup_old and os.path.exists("faiss_index"):
-            backup_dir = f"faiss_index"
             shutil.move("faiss_index", backup_dir)
-            print(f"Old index backed up")
         # Create directory if needed
         os.makedirs("faiss_index", exist_ok=True)
@@ -100,7 +100,24 @@ class RAGSystem:
         for url in CUBIX_DOCS:
             try:
                 loader = WebBaseLoader(url)
-                docs.extend(loader.load())
                 print(f"Loaded document from {url}")
             except Exception as e:
                 print(f"Error loading document from {url}: {e}")
@@ -113,9 +130,9 @@ class RAGSystem:
         # Split documents
         text_splitter = RecursiveCharacterTextSplitter(
-            chunk_size=500,  # Increased from 150 for better context
-            chunk_overlap=50,  # Added overlap to prevent breaking important context
-            separators=["\n\n", "\n", " ", ""],  # More intelligent splitting
             length_function=len
         )
         split_docs = text_splitter.split_documents(docs)
@@ -126,7 +143,7 @@ class RAGSystem:
         try:
             # Save the new index
             self.document_store.save_local("faiss_index")
-            print("Successfully saved new knowledge base to faiss_index directory")
         except Exception as e:
             print(f"Error saving knowledge base: {e}")
@@ -192,6 +209,18 @@ class RAGSystem:
             print(f"Error saving index: {e}")
             return False
     def generate_response(self, user_id: str, message: str) -> Dict[str, Any]:
         """Generate a response for a user message."""
         if user_id not in self.user_conversations:
@@ -212,18 +241,18 @@ class RAGSystem:
                 # First try with higher relevance score threshold for more accurate results
                 results = self.document_store.similarity_search_with_score(
                     message,
-                    k=4,  # Increased from 3 for better coverage
-                    score_threshold=0.75  # Slightly relaxed from 0.8 for better recall
                 )
                 if results:
                     # Sort by score and take top results
-                    results.sort(key=lambda x: x[1], reverse=True)
                     # Format with scores and metadata for better context
                     formatted_results = []
                     for doc, score in results:
-                        if score > 0.75:  # Only include relevance context
                             # Extract source for better attribution
                             source = doc.metadata.get('source', 'Unknown source')
                             if isinstance(source, str) and source.startswith('http'):
@@ -236,7 +265,7 @@ class RAGSystem:
                             content = re.sub(r'\s+', ' ', content).strip()
                             # Limit content length based on relevance score - higher relevance gets more tokens
-                            max_length = int(min(800 + (score * 400), 1200))  # Dynamic length based on relevance
                             if len(content) > max_length:
                                 content = content[:max_length] + "..."
@@ -256,7 +285,7 @@ class RAGSystem:
                 if not relevant_context:
                     results = self.document_store.similarity_search(
                         message,
-                        k=3  # Increased from 2 for better coverage while keeping focus
                     )
                     if results:
                         formatted_results = []
@@ -268,14 +297,15 @@ class RAGSystem:
                             # Truncate content if too long (token optimization)
                             content = doc.page_content
-                            if len(content) > 800:  # Shorter for fallback results
-                                content = content[:800] + "..."
                             formatted_results.append(f"SOURCE: {source}\n{content}")
                         relevant_context = "\n\n---\n\n".join(formatted_results)
             except Exception as e:
                 print(f"Error during context retrieval: {e}")
         # Build command specifications for the system prompt
         command_specs_text = "# Available Commands and Required Fields\n\n"
@@ -299,66 +329,40 @@ class RAGSystem:
             mob_mappings_text += f"- {mob_name}: {entity_id}\n"
         mob_mappings_text += "\nWhen a player mentions a mob, always map it to the corresponding entity ID in your response.\n\n"
-        # Build system prompt from template
-        system_prompt = SYSTEM_PROMPT_TEMPLATE['intro'] + "\n\n"
-        # Add role section
-        system_prompt += "## Your Role\n"
-        for item in SYSTEM_PROMPT_TEMPLATE['role_section']:
-            system_prompt += f"- {item}\n"
-        # Add command specs
-        system_prompt += f"\n{command_specs_text}\n"
-        # Add mob mappings
-        system_prompt += f"\n{mob_mappings_text}\n"
-        # Add command detection guidelines
-        system_prompt += "\n## Command Detection Guidelines\n"
-        for item in SYSTEM_PROMPT_TEMPLATE['command_detection_guidelines']:
-            system_prompt += f"- {item}\n"
-        # Add contextual information processing
-        system_prompt += "\n## Contextual Information Processing\n"
-        for item in SYSTEM_PROMPT_TEMPLATE['contextual_information_processing']:
-            system_prompt += f"- {item}\n"
-        # Add response format
-        system_prompt += "\n## Response Format\n"
-        for item in SYSTEM_PROMPT_TEMPLATE['response_format']:
-            system_prompt += f"- {item}\n"
-        # Add conversation handling instructions
-        if 'conversation_handling' in SYSTEM_PROMPT_TEMPLATE:
-            system_prompt += "\n## Conversation Handling\n"
-            for item in SYSTEM_PROMPT_TEMPLATE['conversation_handling']:
-                system_prompt += f"- {item}\n"
-        # Add improved RAG processing instructions
-        if 'rag_processing_instructions' in SYSTEM_PROMPT_TEMPLATE:
-            system_prompt += "\n## RAG Processing Instructions\n"
-            for item in SYSTEM_PROMPT_TEMPLATE['rag_processing_instructions']:
-                system_prompt += f"- {item}\n"
-        # Add ambiguity handling instructions if they exist
-        if 'ambiguity_handling' in SYSTEM_PROMPT_TEMPLATE:
-            system_prompt += "\n## Ambiguity Handling\n"
-            for item in SYSTEM_PROMPT_TEMPLATE['ambiguity_handling']:
-                system_prompt += f"- {item}\n"
-        # Add token optimization instructions if they exist
-        if 'token_optimization' in SYSTEM_PROMPT_TEMPLATE:
-            system_prompt += "\n## Token Optimization\n"
-            for item in SYSTEM_PROMPT_TEMPLATE['token_optimization']:
-                system_prompt += f"- {item}\n"
         if relevant_context:
             system_prompt += f"""
-        ## Relevant Information from CubixWorld Documentation
-        Use this information to guide your response. Pay special attention to specific game mechanics and features:
-        {relevant_context}
             """
         # Create messages list with proper LangChain message objects
@@ -376,18 +380,27 @@ class RAGSystem:
             context_summary = "\nContext relevance summary (sorted by relevance):\n"
             # Sort context by relevance score
-            sorted_contexts = sorted(context_docs, key=lambda x: x['score'], reverse=True)
             for i, ctx in enumerate(sorted_contexts):
-                # Add confidence classification
-                confidence = "High" if ctx['score'] > 0.9 else "Medium" if ctx['score'] > 0.8 else "Moderate"
                 # Add a brief preview of content with source
                 source = ctx['source'].split('/')[-1] if '/' in ctx['source'] else ctx['source']
-                preview = ctx['content'][:80].replace('\n', ' ') + "..."
                 context_summary += f"{i+1}. [{confidence} confidence, score {ctx['score']:.2f}] From {source}: {preview}\n"
             messages.append(SystemMessage(content=context_summary))
         # Initialize token usage variables
         total_tokens = 0
         prompt_tokens = 0
@@ -416,7 +429,9 @@ class RAGSystem:
                 json_end = response_content.find("```", json_start)
                 response_content = response_content[json_start:json_end].strip()
-            json_response = {'response': json.loads(response_content)}
             # Add token usage information to the response
             json_response["token_usage"] = {

         """Create a new knowledge base from scratch"""
         # Backup old index if needed
         if backup_old and os.path.exists("faiss_index"):
+            backup_dir = f"faiss_index_backup"
             shutil.move("faiss_index", backup_dir)
+            print(f"Old index backed up to {backup_dir}")
         # Create directory if needed
         os.makedirs("faiss_index", exist_ok=True)
         for url in CUBIX_DOCS:
             try:
                 loader = WebBaseLoader(url)
+                web_docs = loader.load()
+                # Clean and preprocess documents
+                for doc in web_docs:
+                    # Clean HTML artifacts and normalize whitespace
+                    content = doc.page_content
+                    content = re.sub(r'\s+', ' ', content)  # Normalize whitespace
+                    content = re.sub(r'<[^>]+>', ' ', content)  # Remove HTML tags
+                    content = re.sub(r'\[.*?\]', '', content)  # Remove square brackets content
+                    # Update document content
+                    doc.page_content = content.strip()
+                    # Add source URL to metadata if not present
+                    if 'source' not in doc.metadata:
+                        doc.metadata['source'] = url
+                docs.extend(web_docs)
                 print(f"Loaded document from {url}")
             except Exception as e:
                 print(f"Error loading document from {url}: {e}")
         # Split documents
         text_splitter = RecursiveCharacterTextSplitter(
+            chunk_size=800,  # Increased from 500 for better context
+            chunk_overlap=100,  # Increased overlap to prevent breaking important context
+            separators=["\n\n", "\n", ". ", " ", ""],  # More intelligent splitting
             length_function=len
         )
         split_docs = text_splitter.split_documents(docs)
         try:
             # Save the new index
             self.document_store.save_local("faiss_index")
+            print(f"Successfully saved new knowledge base to faiss_index directory with {len(split_docs)} chunks")
         except Exception as e:
             print(f"Error saving knowledge base: {e}")
             print(f"Error saving index: {e}")
             return False
+    def _filter_response_fields(self, response_dict: dict) -> dict:
+        """Filter out fields that are not in required_fields for the command type."""
+        if not isinstance(response_dict, dict) or 'type' not in response_dict:
+            return response_dict
+        command_type = response_dict['type']
+        if command_type not in COMMAND_SPECS:
+            return response_dict
+        required_fields = COMMAND_SPECS[command_type]['required_fields']
+        return {k: v for k, v in response_dict.items() if k in required_fields}
     def generate_response(self, user_id: str, message: str) -> Dict[str, Any]:
         """Generate a response for a user message."""
         if user_id not in self.user_conversations:
                 # First try with higher relevance score threshold for more accurate results
                 results = self.document_store.similarity_search_with_score(
                     message,
+                    k=5,  # Increased from 4 for better coverage
+                    score_threshold=0.6  # Relaxed from 0.75 for better recall with Russian queries
                 )
                 if results:
                     # Sort by score and take top results
+                    results.sort(key=lambda x: x[1])
                     # Format with scores and metadata for better context
                     formatted_results = []
                     for doc, score in results:
+                        if score < 1.5:  # Only include relevance context (lower score is better in FAISS)
                             # Extract source for better attribution
                             source = doc.metadata.get('source', 'Unknown source')
                             if isinstance(source, str) and source.startswith('http'):
                             content = re.sub(r'\s+', ' ', content).strip()
                             # Limit content length based on relevance score - higher relevance gets more tokens
+                            max_length = int(min(1000, 1500))  # Increased length for better context
                             if len(content) > max_length:
                                 content = content[:max_length] + "..."
                 if not relevant_context:
                     results = self.document_store.similarity_search(
                         message,
+                        k=4  # Increased from 3 for better coverage
                     )
                     if results:
                         formatted_results = []
                             # Truncate content if too long (token optimization)
                             content = doc.page_content
+                            if len(content) > 1000:  # Increased from 800 for better context
+                                content = content[:1000] + "..."
                             formatted_results.append(f"SOURCE: {source}\n{content}")
                         relevant_context = "\n\n---\n\n".join(formatted_results)
             except Exception as e:
                 print(f"Error during context retrieval: {e}")
+                relevant_context = f"Error retrieving context: {str(e)}"
         # Build command specifications for the system prompt
         command_specs_text = "# Available Commands and Required Fields\n\n"
             mob_mappings_text += f"- {mob_name}: {entity_id}\n"
         mob_mappings_text += "\nWhen a player mentions a mob, always map it to the corresponding entity ID in your response.\n\n"
+        # Build system prompt with new structure
+        system_prompt = ""
+        # Add intro
+        if 'intro' in SYSTEM_PROMPT_TEMPLATE:
+            system_prompt += SYSTEM_PROMPT_TEMPLATE['intro'] + "\n\n"
+        # Add all sections from the template in order
+        sections = [
+            'command_rules',
+            'validation_checklist',
+            'examples',
+            'error_handlers'
+        ]
+        for section in sections:
+            if section in SYSTEM_PROMPT_TEMPLATE:
+                for item in SYSTEM_PROMPT_TEMPLATE[section]:
+                    system_prompt += item + "\n"
+                system_prompt += "\n"
+        # Add command specs and mob mappings from our generated text
+        system_prompt += command_specs_text + "\n"
+        system_prompt += mob_mappings_text + "\n"
+        # Add relevant context if available
         if relevant_context:
             system_prompt += f"""
+## Relevant Information from CubixWorld Documentation
+Use this information to guide your response. If the user is asking about game updates, features, or information that appears in this documentation, provide that information in your response:
+{relevant_context}
+IMPORTANT: If the user is asking about information contained in the documentation above, you SHOULD provide that information in your response. Do not say you cannot answer questions about game updates or features if the information is available in the documentation.
             """
         # Create messages list with proper LangChain message objects
             context_summary = "\nContext relevance summary (sorted by relevance):\n"
             # Sort context by relevance score
+            sorted_contexts = sorted(context_docs, key=lambda x: x['score'])
             for i, ctx in enumerate(sorted_contexts):
+                # Add confidence classification (lower score is better in FAISS)
+                confidence = "High" if ctx['score'] < 0.3 else "Medium" if ctx['score'] < 0.6 else "Moderate"
                 # Add a brief preview of content with source
                 source = ctx['source'].split('/')[-1] if '/' in ctx['source'] else ctx['source']
+                preview = ctx['content'][:100].replace('\n', ' ') + "..."
                 context_summary += f"{i+1}. [{confidence} confidence, score {ctx['score']:.2f}] From {source}: {preview}\n"
             messages.append(SystemMessage(content=context_summary))
+        # Add special instruction for information questions
+        if any(keyword in message.lower() for keyword in ["что", "какие", "когда", "обновление", "новое", "осеннее", "autumn"]):
+            info_instruction = """
+IMPORTANT INSTRUCTION: The user is asking about game information or updates. If you have relevant information in the context provided,
+you MUST share that information in your response using the message command type. Do not refuse to answer questions about game updates
+or features if the information is available in the context.
+"""
+            messages.append(SystemMessage(content=info_instruction))
         # Initialize token usage variables
         total_tokens = 0
         prompt_tokens = 0
                 json_end = response_content.find("```", json_start)
                 response_content = response_content[json_start:json_end].strip()
+            parsed_response = json.loads(response_content)
+            filtered_response = self._filter_response_fields(parsed_response)
+            json_response = {'response': filtered_response}
             # Add token usage information to the response
             json_response["token_usage"] = {