Spaces:

Smilyai-labs
/

Code-agent-team

Sleeping

App Files Files Community

Keeby-smilyai committed on Sep 20

Commit

1c29bb4

verified ·

1 Parent(s): 8fca3fa

Update backend.py

Browse files

Files changed (1) hide show

backend.py +59 -48

backend.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# backend.py — FINAL HARDENED VERSION v1.2
 import sqlite3
 import os
 import json
@@ -11,7 +11,7 @@ from typing import Optional, Dict, Any
 import torch
 import psutil
-from transformers import AutoTokenizer, AutoModelForCausalLM
 # --- CONFIGURATION ---
 DB_PATH = "code_agents_pro.db"
@@ -27,7 +27,6 @@ def init_db():
             CREATE TABLE IF NOT EXISTS projects (id INTEGER PRIMARY KEY, user_id INTEGER, title TEXT, description TEXT, status TEXT DEFAULT 'queued', zip_path TEXT, logs TEXT DEFAULT '', created_at DATETIME DEFAULT CURRENT_TIMESTAMP, FOREIGN KEY (user_id) REFERENCES users(id));
             CREATE INDEX IF NOT EXISTS idx_user_status ON projects(user_id, status);
         """)
 init_db()
 def _db_execute(query, params=(), fetchone=False, fetchall=False, commit=False):
@@ -47,12 +46,10 @@ def _db_execute(query, params=(), fetchone=False, fetchall=False, commit=False):
 def hash_password(password): return hashlib.sha256(password.encode()).hexdigest()
 def verify_password(password, stored_hash): return hash_password(password) == stored_hash
 def create_user(username, password):
     try:
         return _db_execute("INSERT INTO users (username, password_hash) VALUES (?, ?)", (username, hash_password(password)), commit=True)
     except sqlite3.IntegrityError: return None
 def get_user_by_username(username): return _db_execute("SELECT * FROM users WHERE username = ?", (username,), fetchone=True)
 def get_user_projects(user_id, limit=20): return _db_execute("SELECT * FROM projects WHERE user_id = ? ORDER BY created_at DESC LIMIT ?", (user_id, limit), fetchall=True)
 def create_project(user_id, title, description): return _db_execute("INSERT INTO projects (user_id, title, description) VALUES (?, ?, ?)", (user_id, title, description), commit=True)
@@ -62,37 +59,56 @@ def get_project(project_id): return _db_execute("SELECT * FROM projects WHERE id
 # ------------------------------ MODEL LOADING & CACHING ------------------------------
 MODEL_REGISTRY = {
     "planner": "microsoft/Phi-3-mini-4k-instruct",
-    "architect": "Qwen/Qwen2.5-Coder-0.6B-Instruct",
-    "coder": "Qwen/Qwen2.5-Coder-0.6B-Instruct",
     "reviewer": "microsoft/Phi-3-mini-4k-instruct",
-    "tester": "Qwen/Qwen2.5-Coder-0.6B-Instruct",
     "publisher": "microsoft/Phi-3-mini-4k-instruct",
 }
 _MODEL_CACHE = {}
 def load_model(model_name):
-    if model_name in _MODEL_CACHE: return _MODEL_CACHE[model_name]
-    print(f"Loading model: {model_name}...")
     tokenizer = AutoTokenizer.from_pretrained(model_name)
-    model = AutoModelForCausalLM.from_pretrained(model_name, dtype="auto", device_map="auto", trust_remote_code=True, attn_implementation="eager")
     _MODEL_CACHE[model_name] = (tokenizer, model)
     print(f"Model {model_name} loaded and cached.")
     return tokenizer, model
-# ------------------------------ AGENT PROMPTS (SIMPLIFIED & ROBUST) ------------------------------
 ROLE_PROMPTS = {
-    "planner": """You are an expert file planner. Based on the user's request, determine the necessary file structure.
-    Output ONLY a single JSON object with a single key: "files".
-    The "files" key MUST be an array of strings representing complete file paths (e.g., ["src/main.py", "tests/test_main.py", "requirements.txt"]).""",
-    "architect": """You are a software architect. Create initial placeholder content for a list of files.
-    Output ONLY a single JSON object where keys are file paths and values are the initial content (e.g., a comment like '# Main application logic here').""",
     "coder": "You are a professional programmer. Your ONLY job is to write the complete, clean, and functional code for the single file requested. Do NOT add any explanations, introductions, or markdown formatting. Output ONLY the raw source code.",
-    "reviewer": """You are a meticulous code reviewer. Analyze the given code for bugs, style issues, and security vulnerabilities.
-    Output ONLY a single JSON object with two keys: "has_issues" (boolean) and "suggestions" (a string containing a bulleted list of required changes).""",
     "tester": "You are a QA engineer. Write a complete pytest test file for the given source code. Cover main functionality and edge cases. Output ONLY the raw source code for the test file.",
-    "publisher": """You are a release manager. Create final documentation and configuration files.
-    Output ONLY a single JSON object where keys are the filenames ("README.md", ".gitignore", "Dockerfile") and values are their complete string content."""
 }
 # ------------------------------ FILE SYSTEM & AI TOOLS ------------------------------
 def get_project_dir(user_id, project_id):
     path = os.path.join(PROJECT_ROOT, str(user_id), str(project_id))
@@ -102,20 +118,26 @@ def get_project_dir(user_id, project_id):
 def create_file(project_dir, path, content):
     full_path = os.path.join(project_dir, path)
     os.makedirs(os.path.dirname(full_path), exist_ok=True)
-    with open(full_path, 'w', encoding='utf-8') as f: f.write(content)
 def read_file(project_dir, path):
     full_path = os.path.join(project_dir, path)
     try:
-        with open(full_path, 'r', encoding='utf-8') as f: return f.read()
-    except FileNotFoundError: return None
 def zip_project(project_dir, project_id):
     zip_filename = f"project_{project_id}.zip"
     zip_path = os.path.join(os.path.dirname(project_dir), zip_filename)
     with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zf:
         for root, _, files in os.walk(project_dir):
-            for file in files: zf.write(os.path.join(root, file), os.path.relpath(os.path.join(root, file), project_dir))
     return zip_path
 def _extract_json(text: str) -> Optional[Dict[str, Any]]:
@@ -135,7 +157,7 @@ def generate_with_model(role: str, prompt: str) -> str:
         input_text = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
         inputs = tokenizer(input_text, return_tensors="pt").to(model.device)
-        outputs = model.generate(**inputs, max_new_tokens=2048, pad_token_id=tokenizer.eos_token_id, use_cache=False)
         return tokenizer.decode(outputs[0][len(inputs.input_ids[0]):], skip_special_tokens=True).strip()
     except Exception as e:
@@ -156,24 +178,20 @@ def run_agent_chain(project_id, user_id, initial_prompt):
     try:
         log_step("SYSTEM", "Initializing project...")
-        # 1. PLANNER
-        log_step("PLANNER", "Determining file structure from user request...")
         plan_response = generate_with_model("planner", initial_prompt)
         plan_data = _extract_json(plan_response)
-        if not plan_data or "files" not in plan_data: raise ValueError("Planner failed to create a valid JSON plan with a 'files' key.")
         log_step("PLANNER", "File structure plan created.", json.dumps(plan_data, indent=2))
-        # 2. ARCHITECT
         log_step("ARCHITECT", "Creating initial file skeletons...")
         arch_prompt = f"Create initial content for these files:\n{json.dumps(plan_data['files'])}"
         arch_response = generate_with_model("architect", arch_prompt)
         arch_data = _extract_json(arch_response)
-        if not arch_data: raise ValueError("Architect failed to create valid JSON file structures.")
         for path, content in arch_data.items(): create_file(project_dir, path, content)
         log_step("ARCHITECT", "File skeletons created.", "\n".join(arch_data.keys()))
-        # 3. CODER
         source_files = [f for f in plan_data['files'] if f.startswith('src/') and f.endswith('.py')]
         for file_path in source_files:
             log_step("CODER", f"Writing complete code for `{file_path}`...")
@@ -182,37 +200,30 @@ def run_agent_chain(project_id, user_id, initial_prompt):
             create_file(project_dir, file_path, code)
             log_step("CODER", f"Finished writing `{file_path}`.", code)
-        # 4. REVIEWER
-        log_step("REVIEWER", "Reviewing all generated source code...")
         for file_path in source_files:
             code_content = read_file(project_dir, file_path)
             if not code_content: continue
-            review_prompt = f"Review this code from `{file_path}`:\n\n{code_content}"
-            review_response = generate_with_model("reviewer", review_prompt)
             log_step("REVIEWER", f"Review of `{file_path}` complete.", review_response)
-        # 5. TESTER
-        log_step("TESTER", "Writing unit tests...")
         for file_path in source_files:
             code_content = read_file(project_dir, file_path)
             if not code_content: continue
             test_file_path = os.path.join("tests", f"test_{os.path.basename(file_path)}")
-            tester_prompt = f"Write a pytest test file (`{test_file_path}`) for this code from `{file_path}`:\n\n{code_content}"
-            test_code = generate_with_model("tester", tester_prompt)
             create_file(project_dir, test_file_path, test_code)
             log_step("TESTER", f"Generated test `{test_file_path}`.", test_code)
-        # 6. PUBLISHER
         log_step("PUBLISHER", "Generating final documentation and configuration...")
-        all_files = [os.path.join(r, f).replace(project_dir, '', 1) for r, d, fs in os.walk(project_dir) for f in fs]
-        pub_prompt = f"Project file structure: {json.dumps(all_files)}. Generate README.md, .gitignore, and Dockerfile."
-        pub_response = generate_with_model("publisher", pub_prompt)
         pub_data = _extract_json(pub_response)
         if not pub_data: raise ValueError("Publisher failed to create valid final assets.")
         for path, content in pub_data.items(): create_file(project_dir, path, content)
         log_step("PUBLISHER", "Final assets created.", json.dumps(pub_data, indent=2))
-        # 7. FINALIZATION
         log_step("SYSTEM", "Packaging project into a ZIP file...")
         zip_path = zip_project(project_dir, project_id)
         update_project_status(project_id, "completed", logs="".join(log_entries), zip_path=zip_path)
@@ -228,5 +239,5 @@ def run_agent_chain(project_id, user_id, initial_prompt):
 executor = concurrent.futures.ThreadPoolExecutor(max_workers=1)
 def queue_job(project_id, user_id, prompt):
-    print(f"Queuing job for project_id: {project_id}, user_id: {user_id}")
     executor.submit(run_agent_chain, project_id, user_id, prompt)

+# backend.py — FINAL, STABLE & OPTIMIZED VERSION v1.6
 import sqlite3
 import os
 import json
 import torch
 import psutil
+from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
 # --- CONFIGURATION ---
 DB_PATH = "code_agents_pro.db"
             CREATE TABLE IF NOT EXISTS projects (id INTEGER PRIMARY KEY, user_id INTEGER, title TEXT, description TEXT, status TEXT DEFAULT 'queued', zip_path TEXT, logs TEXT DEFAULT '', created_at DATETIME DEFAULT CURRENT_TIMESTAMP, FOREIGN KEY (user_id) REFERENCES users(id));
             CREATE INDEX IF NOT EXISTS idx_user_status ON projects(user_id, status);
         """)
 init_db()
 def _db_execute(query, params=(), fetchone=False, fetchall=False, commit=False):
 def hash_password(password):
     """Return the hex-encoded SHA-256 digest of ``password``.

     The password is encoded with ``str.encode()`` (UTF-8 by default) before
     hashing.

     NOTE(review): this is a plain, unsalted digest. A dedicated password KDF
     would be stronger, but switching schemes would invalidate every hash
     already stored, so the format is left unchanged here.
     """
     digest = hashlib.sha256()
     digest.update(password.encode())
     return digest.hexdigest()
 def verify_password(password, stored_hash):
     """Return True when ``password`` hashes to ``stored_hash``.

     The candidate digest is produced by ``hash_password`` and compared with
     ``hmac.compare_digest`` so the comparison time does not depend on how
     many leading characters match.

     Args:
         password: Plain-text password supplied by the user.
         stored_hash: Hex digest previously produced by ``hash_password``.

     Returns:
         bool: True on a match. A ``stored_hash`` that is not a string
         (for example ``None``) never matches, as with the previous ``==``
         comparison.
     """
     import hmac  # local import: keeps this block self-contained

     candidate = hash_password(password)
     if not isinstance(stored_hash, str):
         return False
     # Compare as bytes: compare_digest rejects non-ASCII str arguments.
     return hmac.compare_digest(candidate.encode("utf-8"), stored_hash.encode("utf-8"))
 def create_user(username, password):
     """Insert a new row into ``users`` and return the result of ``_db_execute``.

     The password is stored as the digest produced by ``hash_password``.

     Returns:
         Whatever ``_db_execute`` returns for a committed INSERT, or ``None``
         when the insert raises ``sqlite3.IntegrityError`` (presumably a
         duplicate username; the ``users`` schema is not visible here).
     """
     insert_sql = "INSERT INTO users (username, password_hash) VALUES (?, ?)"
     try:
         row_values = (username, hash_password(password))
         outcome = _db_execute(insert_sql, row_values, commit=True)
     except sqlite3.IntegrityError:
         return None
     return outcome
 def get_user_by_username(username):
     """Look up one ``users`` row by exact ``username`` via ``_db_execute``."""
     lookup_sql = "SELECT * FROM users WHERE username = ?"
     return _db_execute(lookup_sql, (username,), fetchone=True)
 def get_user_projects(user_id, limit=20):
     """Return up to ``limit`` projects owned by ``user_id``, newest first.

     Ordering is by the ``created_at`` column, descending; the rows come back
     in whatever shape ``_db_execute(..., fetchall=True)`` produces.
     """
     listing_sql = "SELECT * FROM projects WHERE user_id = ? ORDER BY created_at DESC LIMIT ?"
     bind_values = (user_id, limit)
     return _db_execute(listing_sql, bind_values, fetchall=True)
 def create_project(user_id, title, description):
     """Insert a new ``projects`` row and return the result of ``_db_execute``.

     Only ``user_id``, ``title`` and ``description`` are supplied; the other
     columns are left to their table defaults.
     """
     insert_sql = "INSERT INTO projects (user_id, title, description) VALUES (?, ?, ?)"
     bind_values = (user_id, title, description)
     return _db_execute(insert_sql, bind_values, commit=True)
 # ------------------------------ MODEL LOADING & CACHING ------------------------------
 # Maps each agent role to the Hugging Face model identifier loaded for it.
 MODEL_REGISTRY = {
     "planner": "microsoft/Phi-3-mini-4k-instruct",
+    # The code-producing roles (architect, coder, tester) share the 0.5B Qwen2.5-Coder instruct checkpoint.
+    "architect": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
+    "coder": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
     "reviewer": "microsoft/Phi-3-mini-4k-instruct",
+    "tester": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
     "publisher": "microsoft/Phi-3-mini-4k-instruct",
 }
 _MODEL_CACHE = {}
 def load_model(model_name):
     """Load the tokenizer and causal LM for ``model_name``, caching the pair.

     On a CUDA machine the model is loaded with 4-bit NF4 quantization through
     ``BitsAndBytesConfig``; without CUDA it is loaded unquantized with the
     library's default precision.

     Args:
         model_name: Hugging Face model identifier.

     Returns:
         tuple: ``(tokenizer, model)``. Repeated calls with the same name
         return the cached pair from ``_MODEL_CACHE``.
     """
     cached = _MODEL_CACHE.get(model_name)
     if cached is not None:
         return cached

     model_kwargs = {
         "device_map": "auto",
         # NOTE(security): this runs Python code shipped in the model repo;
         # only point the registry at repositories you trust.
         "trust_remote_code": True,
         "attn_implementation": "eager",
     }
     if torch.cuda.is_available():
         print(f"CUDA is available. Loading model '{model_name}' in 4-bit for GPU acceleration.")
         # Not every CUDA GPU supports bfloat16; fall back to float16 there
         # instead of hard-coding bf16 as the compute dtype.
         compute_dtype = torch.bfloat16 if torch.cuda.is_bf16_supported() else torch.float16
         model_kwargs["quantization_config"] = BitsAndBytesConfig(
             load_in_4bit=True,
             bnb_4bit_use_double_quant=True,
             bnb_4bit_quant_type="nf4",
             bnb_4bit_compute_dtype=compute_dtype,
         )
     else:
         # No quantization config is passed on CPU.
         print(f"CUDA not available. Loading model '{model_name}' on CPU in default precision.")

     tokenizer = AutoTokenizer.from_pretrained(model_name)
     model = AutoModelForCausalLM.from_pretrained(model_name, **model_kwargs)
     _MODEL_CACHE[model_name] = (tokenizer, model)
     print(f"Model {model_name} loaded and cached.")
     return tokenizer, model
+# ------------------------------ AGENT PROMPTS ------------------------------
 # Prompt text for each agent role, keyed by the same role names as MODEL_REGISTRY.
 # The planner, architect, reviewer and publisher prompts demand a single JSON
 # object as output; the coder and tester prompts demand raw source code only.
 ROLE_PROMPTS = {
+    "planner": """You are an expert file planner. Based on the user's request, determine the necessary file structure. Output ONLY a single JSON object with a single key: "files". The "files" key MUST be an array of strings representing complete file paths (e.g., ["src/main.py", "tests/test_main.py", "requirements.txt"]).""",
+    "architect": """You are a software architect. Create initial placeholder content for a list of files. Output ONLY a single JSON object where keys are file paths and values are the initial content (e.g., a comment like '# Main application logic here').""",
     "coder": "You are a professional programmer. Your ONLY job is to write the complete, clean, and functional code for the single file requested. Do NOT add any explanations, introductions, or markdown formatting. Output ONLY the raw source code.",
+    "reviewer": """You are a meticulous code reviewer. Analyze the given code for bugs, style issues, and security vulnerabilities. Output ONLY a single JSON object with two keys: "has_issues" (boolean) and "suggestions" (a string containing a bulleted list of required changes).""",
     "tester": "You are a QA engineer. Write a complete pytest test file for the given source code. Cover main functionality and edge cases. Output ONLY the raw source code for the test file.",
+    "publisher": """You are a release manager. Create final documentation and configuration files. Output ONLY a single JSON object where keys are the filenames ("README.md", ".gitignore", "Dockerfile") and values are their complete string content."""
 }
 # ------------------------------ FILE SYSTEM & AI TOOLS ------------------------------
 def get_project_dir(user_id, project_id):
     path = os.path.join(PROJECT_ROOT, str(user_id), str(project_id))
 def create_file(project_dir, path, content):
     """Write ``content`` to ``path`` inside ``project_dir`` as UTF-8 text.

     Missing parent directories are created. ``path`` originates from
     model-generated JSON, so it is treated as untrusted: after resolving
     symlinks and ``..`` segments the target must still lie inside
     ``project_dir``.

     Args:
         project_dir: Root directory of the project.
         path: File path relative to ``project_dir``.
         content: Text to write.

     Raises:
         ValueError: If ``path`` resolves to a location outside
             ``project_dir`` (for example ``../x`` or an absolute path).
     """
     root = os.path.realpath(project_dir)
     # os.path.join discards ``root`` when ``path`` is absolute, so the
     # containment check must run on the fully resolved result.
     full_path = os.path.realpath(os.path.join(root, path))
     if os.path.commonpath([root, full_path]) != root:
         raise ValueError(f"Refusing to write outside the project directory: {path!r}")
     os.makedirs(os.path.dirname(full_path), exist_ok=True)
     with open(full_path, 'w', encoding='utf-8') as f:
         f.write(content)
 def read_file(project_dir, path):
     """Return the UTF-8 text of ``path`` inside ``project_dir``, or ``None``.

     ``path`` can originate from model-generated JSON, so reads are confined
     to ``project_dir``: a path that resolves outside it is treated like a
     missing file.

     Args:
         project_dir: Root directory of the project.
         path: File path relative to ``project_dir``.

     Returns:
         str | None: The file's contents, or ``None`` when the file does not
         exist or the path escapes ``project_dir``.
     """
     root = os.path.realpath(project_dir)
     full_path = os.path.realpath(os.path.join(root, path))
     try:
         inside_project = os.path.commonpath([root, full_path]) == root
     except ValueError:
         # commonpath raises when the two paths cannot be compared
         # (e.g. different drives), which also means "not inside".
         inside_project = False
     if not inside_project:
         return None
     try:
         with open(full_path, 'r', encoding='utf-8') as f:
             return f.read()
     except FileNotFoundError:
         return None
 def zip_project(project_dir, project_id):
     """Archive every file under ``project_dir`` into ``project_<id>.zip``.

     The archive is written next to ``project_dir`` (in its parent directory)
     and entries are stored relative to ``project_dir``.

     Args:
         project_dir: Directory whose files are archived.
         project_id: Identifier used in the archive file name.

     Returns:
         str: Path of the created zip file.
     """
     # A trailing separator would make dirname() return project_dir itself,
     # placing the archive inside the tree being walked.
     separators = os.sep + (os.altsep or "")
     source_dir = project_dir.rstrip(separators) or project_dir
     zip_filename = f"project_{project_id}.zip"
     zip_path = os.path.join(os.path.dirname(source_dir), zip_filename)
     with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zf:
         for root, dirs, files in os.walk(source_dir):
             # Sort in place so both traversal and entry order are deterministic.
             dirs.sort()
             for file in sorted(files):
                 full_path = os.path.join(root, file)
                 arcname = os.path.relpath(full_path, source_dir)
                 zf.write(full_path, arcname)
     return zip_path
 def _extract_json(text: str) -> Optional[Dict[str, Any]]:
         input_text = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
         inputs = tokenizer(input_text, return_tensors="pt").to(model.device)
+        outputs = model.generate(**inputs, max_new_tokens=2048, pad_token_id=tokenizer.eos_token_id, use_cache=True)
         return tokenizer.decode(outputs[0][len(inputs.input_ids[0]):], skip_special_tokens=True).strip()
     except Exception as e:
     try:
         log_step("SYSTEM", "Initializing project...")
+        log_step("PLANNER", "Determining file structure...")
         plan_response = generate_with_model("planner", initial_prompt)
         plan_data = _extract_json(plan_response)
+        if not plan_data or "files" not in plan_data: raise ValueError("Planner failed to create a valid JSON plan.")
         log_step("PLANNER", "File structure plan created.", json.dumps(plan_data, indent=2))
         log_step("ARCHITECT", "Creating initial file skeletons...")
         arch_prompt = f"Create initial content for these files:\n{json.dumps(plan_data['files'])}"
         arch_response = generate_with_model("architect", arch_prompt)
         arch_data = _extract_json(arch_response)
+        if not arch_data: raise ValueError("Architect failed to create valid JSON skeletons.")
         for path, content in arch_data.items(): create_file(project_dir, path, content)
         log_step("ARCHITECT", "File skeletons created.", "\n".join(arch_data.keys()))
         source_files = [f for f in plan_data['files'] if f.startswith('src/') and f.endswith('.py')]
         for file_path in source_files:
             log_step("CODER", f"Writing complete code for `{file_path}`...")
             create_file(project_dir, file_path, code)
             log_step("CODER", f"Finished writing `{file_path}`.", code)
         for file_path in source_files:
             code_content = read_file(project_dir, file_path)
             if not code_content: continue
+            log_step("REVIEWER", f"Reviewing `{file_path}`...")
+            review_response = generate_with_model("reviewer", f"Review this code from `{file_path}`:\n\n{code_content}")
             log_step("REVIEWER", f"Review of `{file_path}` complete.", review_response)
         for file_path in source_files:
             code_content = read_file(project_dir, file_path)
             if not code_content: continue
             test_file_path = os.path.join("tests", f"test_{os.path.basename(file_path)}")
+            log_step("TESTER", f"Writing test for `{file_path}`...")
+            test_code = generate_with_model("tester", f"Write a pytest test file (`{test_file_path}`) for this code from `{file_path}`:\n\n{code_content}")
             create_file(project_dir, test_file_path, test_code)
             log_step("TESTER", f"Generated test `{test_file_path}`.", test_code)
+        all_files = [os.path.join(r, f).replace(project_dir, '', 1) for r, _, fs in os.walk(project_dir) for f in fs]
         log_step("PUBLISHER", "Generating final documentation and configuration...")
+        pub_response = generate_with_model("publisher", f"Project file structure: {json.dumps(all_files)}. Generate README.md, .gitignore, and Dockerfile.")
         pub_data = _extract_json(pub_response)
         if not pub_data: raise ValueError("Publisher failed to create valid final assets.")
         for path, content in pub_data.items(): create_file(project_dir, path, content)
         log_step("PUBLISHER", "Final assets created.", json.dumps(pub_data, indent=2))
         log_step("SYSTEM", "Packaging project into a ZIP file...")
         zip_path = zip_project(project_dir, project_id)
         update_project_status(project_id, "completed", logs="".join(log_entries), zip_path=zip_path)
 executor = concurrent.futures.ThreadPoolExecutor(max_workers=1)
 def queue_job(project_id, user_id, prompt):
     """Schedule ``run_agent_chain`` for a project on the module-level executor.

     Args:
         project_id: Project to build.
         user_id: Owner of the project.
         prompt: Initial user prompt handed to the agent chain.

     Returns:
         concurrent.futures.Future: Handle for the submitted job. Earlier
         versions returned ``None``; callers that ignore the return value
         are unaffected.
     """
     print(f"Queuing job for project: {project_id}")

     def _report_failure(done):
         # An exception raised in the worker is otherwise stored on the
         # Future and silently lost, since nobody calls .result() on it.
         if done.cancelled():
             return
         error = done.exception()
         if error is not None:
             print(f"Job for project {project_id} failed: {error!r}")

     future = executor.submit(run_agent_chain, project_id, user_id, prompt)
     future.add_done_callback(_report_failure)
     return future