
Commit ea85624

2.1.0 (#5)
1 parent 359f49c commit ea85624

File tree

5 files changed: +373 -159 lines changed

Diff for: .vscode/settings.json (+1 -1)

@@ -1,3 +1,3 @@
 {
-  "CodeGPT.apiKey": "OpenAI",
+  "CodeGPT.apiKey": "Anthropic",
 }

Diff for: README.md (+13 -30)
@@ -15,12 +15,13 @@ https://github.com/user-attachments/assets/51cf6ad1-196c-44ab-99ba-0035365f1bbd
 * Generates Python project structures automatically using `uv`
 * Writes Python code based on task descriptions
 * Executes development tasks using AI-generated commands
-* Utilizes the `mistral-nemo` or `OpenAI` language models for intelligent code generation
+* Utilizes the `Ollama`, `OpenAI`, or `Claude` language models for intelligent code generation
 * Implements best practices in Python development automatically
 * Writes and runs passing tests using `pytest` up to 80%+ test coverage
 * Automatically fixes and styles code using `pylint` up to 7+/10
 * Calculates and improves the complexity score using `complexipy` to be under 15
 * Auto-formats the code with `autopep8`
+* Shows the token count used for the responses
 
 ## Community
 * Join our community - [Nemo Agent Telegram Group](https://t.me/+f-6nu2mUpgtiOGUx)
@@ -31,27 +32,28 @@ https://github.com/user-attachments/assets/51cf6ad1-196c-44ab-99ba-0035365f1bbd
 * `flask` web apps (app works - tests pass)
 * `streamlit` apps (app works - tests fail)
 * `tkinter` apps (app works - tests fail)
-* Note: `OpenAI` succeeds more often the `mistral-nemo` in their runs
+* Note: `OpenAI` or `Claude` succeed more often than `mistral-nemo` in their runs
 * Note: Not all runs will be successful
 
 ## Install
 
-### OpenAI Local Install
+### OpenAI or Claude Install
 
 #### Requirements
 * Python 3.9 or higher
-* OpenAI API KEY
+* OpenAI or Claude API KEY
 * Mac or Linux
 
 #### Requirements Installation
-* Install OpenAI API KEY for `zsh` shell
-* `echo 'export OPENAI_API_KEY="YOUR_API_KEY"' >> ~/.zshrc`
+* Install OpenAI or Claude API KEY for `zsh` shell
+* `echo 'export OPENAI_API_KEY="YOUR_API_KEY"' >> ~/.zshrc` or
+* `echo 'export ANTHROPIC_API_KEY="YOUR_API_KEY"' >> ~/.zshrc`
 * `pip install nemo-agent`
 * You are ready to use `nemo-agent`
 
 ### OR
 
-### Mistral-Nemo Local Install
+### Mistral-Nemo Install
 
 #### Requirements
 * Python 3.9 or higher
@@ -65,43 +67,24 @@ https://github.com/user-attachments/assets/51cf6ad1-196c-44ab-99ba-0035365f1bbd
 * `pip install nemo-agent`
 * You are ready to use `nemo-agent`
 
-### OR
-
-### Mistral-Nemo Cloud Install
-
-#### Requirements
-* [RunPod](https://runpod.io) account setup with your SSH and billing information
-
-#### RunPod Setup
-* Make sure you have setup your SSH keys
-* Select a `4090` pod
-* Select the `RunPod Pytorch 2.1.1` template
-* Edit the template:
-* Set `Container Disk` to 60 GB
-* Set `Expose HTTP Ports` to `8888, 11434`
-* Add `environment variables` with `OLLAMA_HOST` key and `0.0.0.0` value
-* Deploy your pod
-* After deploying then login via SSH
-* Run on the pod: `(curl -fsSL https://ollama.com/install.sh | sh && ollama serve > ollama.log 2>&1) &` and then press CTRL+C to exit
-* Run on the pod: `ollama pull mistral-nemo`
-* Run on the pod: `pip install nemo-agent`
-* You are ready to use `nemo-agent`
-
 ## Usage
 
 ### Prompt
 * `mistral-nemo`: `nemo-agent "create a fizzbuzz script"`
 * `openai`: `nemo-agent "create a fizzbuzz script" --provider openai`
+* `claude`: `nemo-agent "create a fizzbuzz script" --provider claude`
 
 ### Markdown File
 * `mistral-nemo`: `nemo-agent --file example.md`
 * `openai`: `nemo-agent --file example.md --provider openai`
+* `claude`: `nemo-agent --file example.md --provider claude`
 
 ## Model overrides
 
 * You can pass the `--model` flag to override the default model for the provider.
-* The default model for `openai` is `gpt-4o-2024-08-06`
 * The default model for `ollama` is `mistral-nemo`
+* The default model for `openai` is `gpt-4o-2024-08-06`
+* The default model for `claude` is `claude-3-5-sonnet-20240620`
 
 ## Contributing
 Contributions to Nemo Agent are welcome! Please feel free to submit a Pull Request.

Diff for: nemo_agent/main.py (+103 -14)
@@ -15,13 +15,19 @@
 import requests
 import openai
 from anthropic import Anthropic
+import tiktoken
 
 
 class OllamaAPI:
     def __init__(self, model):
         self.model = model
         self.base_url = "http://localhost:11434/api"
+        self.token_count = 0
 
+    def count_tokens(self, text):
+        # Ollama doesn't provide a built-in token counter, so we'll use tiktoken as an approximation
+        return len(tiktoken.encoding_for_model("gpt-4o").encode(text))
+
     def generate(self, prompt):
         url = f"{self.base_url}/generate"
         data = {"model": self.model, "prompt": prompt, "stream": True}
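The new `count_tokens` helpers approximate token usage with `tiktoken`, mirroring the commit's own comment that no built-in counter is used for the Ollama (and, below, Claude) responses. A minimal standalone sketch of that approximation; the `cl100k_base` fallback is an added assumption for `tiktoken` versions that do not recognize the `gpt-4o` model name:

```python
import tiktoken

def approx_token_count(text: str, model: str = "gpt-4o") -> int:
    """Approximate a token count with tiktoken, as the commit does."""
    try:
        encoding = tiktoken.encoding_for_model(model)
    except KeyError:
        # Assumption: fall back to a known encoding if the model name is unmapped
        encoding = tiktoken.get_encoding("cl100k_base")
    return len(encoding.encode(text))

print(approx_token_count("def fizzbuzz(n): ..."))  # prints a small integer
```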
@@ -39,6 +45,18 @@ def generate(self, prompt):
                 except json.JSONDecodeError:
                     print(f"Error decoding JSON: {decoded_line}")
             print()  # Print a newline at the end
+
+            # Extract content between markers
+            start_marker = "^^^start^^^"
+            end_marker = "^^^end^^^"
+            start_index = full_response.find(start_marker)
+            end_index = full_response.find(end_marker)
+            if start_index != -1 and end_index != -1:
+                full_response = full_response[start_index + len(start_marker):end_index].strip()
+
+            self.token_count = self.count_tokens(full_response)
+            print(f"Token count: {self.token_count}")
+
             return full_response
         else:
             raise Exception(f"Ollama API error: {response.text}")
@@ -53,6 +71,10 @@ def __init__(self, model):
         if not self.api_key:
             raise ValueError("OPENAI_API_KEY environment variable is not set")
         openai.api_key = self.api_key
+        self.token_count = 0
+
+    def count_tokens(self, text):
+        return len(tiktoken.encoding_for_model(self.model).encode(text))
 
     def generate(self, prompt):
         try:
@@ -68,11 +90,24 @@ def generate(self, prompt):
                 full_response += chunk_text
                 print(chunk_text, end="", flush=True)
             print()  # Print a newline at the end
+
+            # Extract content between markers
+            start_marker = "^^^start^^^"
+            end_marker = "^^^end^^^"
+            start_index = full_response.find(start_marker)
+            end_index = full_response.find(end_marker)
+            if start_index != -1 and end_index != -1:
+                full_response = full_response[start_index + len(start_marker):end_index].strip()
+
+            self.token_count = self.count_tokens(full_response)
+            print(f"Token count: {self.token_count}")
+
             return full_response
         except Exception as e:
             raise Exception(f"OpenAI API error: {str(e)}")
 
 
+
 class ClaudeAPI:
     def __init__(self, model):
         if model == "mistral-nemo":
@@ -82,22 +117,53 @@ def __init__(self, model):
         if not self.api_key:
             raise ValueError("ANTHROPIC_API_KEY environment variable is not set")
         self.client = Anthropic(api_key=self.api_key)
+        self.token_count = 0
+
+    def count_tokens(self, text):
+        # Approximation: reuse the tiktoken-based counter rather than Anthropic's own tokenizer
+        return len(tiktoken.encoding_for_model("gpt-4o").encode(text))
 
     def generate(self, prompt):
         try:
-            response = self.client.messages.create(
-                model=self.model,
-                messages=[{"role": "user", "content": prompt}],
-                stream=True,
-                max_tokens=1000,
-            )
             full_response = ""
-            for completion in response:
-                if completion.type == "content_block_delta":
-                    chunk_text = completion.delta.text
-                    full_response += chunk_text
-                    print(chunk_text, end="", flush=True)
+            max_iterations = 5  # Adjust this value as needed
+            continuation_prompt = prompt
+
+            for iteration in range(max_iterations):
+                response = self.client.messages.create(
+                    model=self.model,
+                    messages=[{"role": "user", "content": continuation_prompt}],
+                    stream=True,
+                    max_tokens=1000,
+                )
+
+                chunk_response = ""
+                for completion in response:
+                    if completion.type == "content_block_delta":
+                        chunk_text = completion.delta.text
+                        chunk_response += chunk_text
+                        print(chunk_text, end="", flush=True)
+
+                full_response += chunk_response
+
+                if "^^^end^^^" in chunk_response:
+                    break
+
+                continuation_prompt = f"Continue from where you left off. Previous response: {chunk_response}"
+
             print()  # Print a newline at the end
+
+            # Extract content between markers
+            start_marker = "^^^start^^^"
+            end_marker = "^^^end^^^"
+            start_index = full_response.find(start_marker)
+            end_index = full_response.find(end_marker)
+            if start_index != -1 and end_index != -1:
+                full_response = full_response[start_index + len(start_marker):end_index].strip()
+
+            self.token_count = self.count_tokens(full_response)
+            print(f"Token count: {self.token_count}")
+
             return full_response
         except Exception as e:
             raise Exception(f"Claude API error: {str(e)}")
@@ -119,6 +185,11 @@ def __init__(
         self.pwd = os.getcwd() + "/" + self.project_name
         self.llm = self.setup_llm()
         self.previous_suggestions = set()
+        self.token_counts = {}
+
+    def count_tokens(self, text):
+        encoding = tiktoken.encoding_for_model("gpt-3.5-turbo")
+        return len(encoding.encode(text))
 
     def setup_llm(self):
         if self.provider == "ollama":
@@ -169,6 +240,9 @@ def run_task(self):
                 break
             test_check_attempts += 1
 
+        total_tokens = sum(self.token_counts.values())
+        print(f"\nTotal tokens used: {total_tokens}")
+
         print(
             "Task completed. Please review the output and make any necessary manual adjustments."
         )
@@ -303,7 +377,7 @@ def implement_solution(self, max_attempts=3):
         prompt = f"""
         Create a comprehensive implementation for the task: {self.task}.
         You must follow these rules strictly:
-        1, IMPORTANT: Never use pass statements in your code or tests. Always provide a meaningful implementation.
+        1. IMPORTANT: Never use pass statements in your code or tests. Always provide a meaningful implementation.
         2. CRITICAL: Use the following code block format for specifying file content:
             For code files, use:
             <<<main.py>>>
@@ -332,6 +406,7 @@ def implement_solution(self, max_attempts=3):
         13. IMPORTANT: Always pytest parameterize tests for different cases.
         14. CRITICAL: Always use `import main` to import the main.py file in the test file.
         15. IMPORTANT: Only mock external services or APIs in tests.
+        16. IMPORTANT: Enclose your entire response between ^^^start^^^ and ^^^end^^^ markers.
         Working directory: {self.pwd}
         """
 
@@ -340,6 +415,14 @@ def implement_solution(self, max_attempts=3):
             solution = self.get_response(prompt)
             self.logger.info(f"Received solution:\n{solution}")
 
+            # Extract content between markers
+            start_marker = "^^^start^^^"
+            end_marker = "^^^end^^^"
+            start_index = solution.find(start_marker)
+            end_index = solution.find(end_marker)
+            if start_index != -1 and end_index != -1:
+                solution = solution[start_index + len(start_marker):end_index].strip()
+
             # Parse and execute any uv add commands
             uv_commands = [
                 line.strip()
@@ -392,11 +475,14 @@ def extract_file_contents_direct(self, solution):
 
     def get_response(self, prompt):
         try:
-            return self.llm.generate(prompt)
+            response = self.llm.generate(prompt)
+            prompt_key = prompt[:50]  # Use first 50 characters as a key
+            self.token_counts[prompt_key] = self.llm.token_count
+            return response
         except Exception as e:
             self.logger.error(f"Error getting response from {self.provider}: {str(e)}")
             return ""
-
+
     def code_check(self, file_path):
         try:
             # Run autopep8 to automatically fix style issues
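`get_response` now records each call's token count keyed by the first 50 characters of the prompt, and `run_task` sums the values for the final total. One caveat worth noting: prompts that share a 50-character prefix (for example, repeated improvement prompts built from the same template) overwrite each other's entry, so the printed total can under-report. A small illustrative sketch; the prompts and numbers are invented for the example:

```python
token_counts = {}

def record(prompt: str, tokens: int) -> None:
    # Same keying scheme as the commit: first 50 characters of the prompt
    token_counts[prompt[:50]] = tokens

template = "Improve the test file based on the following pytest output:\n"
record(template + "AssertionError in test_one", 900)
record(template + "AssertionError in test_two", 700)

print(sum(token_counts.values()))  # 700 -- the first 900-token entry was overwritten
```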
@@ -498,6 +584,7 @@ def improve_test_file(self, test_output):
         8. IMPORTANT: Always pytest parameterize tests for different cases.
         9. CRITICAL: Always use `import main` to import the main.py file in the test file.
         10. IMPORTANT: Only mock external services or APIs in tests.
+        11. IMPORTANT: Enclose your entire response between ^^^start^^^ and ^^^end^^^ markers.
         Working directory: {self.pwd}
         """
         proposed_improvements = self.get_response(prompt)
@@ -522,6 +609,7 @@ def validate_implementation(self, proposed_improvements):
         If the implementation is correct or mostly correct, respond with 'VALID'.
         If the implementation is completely unrelated or fundamentally flawed, respond with 'INVALID'.
         Do not provide any additional information or explanations.
+        IMPORTANT: Enclose your entire response between ^^^start^^^ and ^^^end^^^ markers.
         """
         response = self.get_response(prompt)
 
@@ -567,6 +655,7 @@ def improve_code(
             # File content here
             <<<end>>>
         7. CRITICAL: Do not explain the task only implement the required functionality in the code blocks.
+        8. IMPORTANT: Enclose your entire response between ^^^start^^^ and ^^^end^^^ markers.
         Working directory: {self.pwd}
         """
         proposed_improvements = self.get_response(prompt)
