
Commit 32e9cc0

Jason Xie (Arcadia822) authored and committed
yeah
1 parent 433781c commit 32e9cc0

19 files changed: +7208 -5 lines

README.md

+39
@@ -13,6 +13,12 @@ Codedog leverages Large Language Models (LLMs) like GPT to automatically review
 * **Code Review Suggestions**: Provides feedback and suggestions on code changes (experimental).
 * **Multi-language Support**: Includes templates for English and Chinese reports.
 * **Platform Support**: Works with GitHub and GitLab.
+* **Automated Code Review**: Uses LLMs to analyze code changes, provide feedback, and suggest improvements.
+* **Scoring System**: Evaluates code across multiple dimensions, including correctness, readability, and maintainability.
+* **Multiple LLM Support**: Works with OpenAI, Azure OpenAI, DeepSeek, and MindConnect R1 models.
+* **Email Notifications**: Sends code review reports via email.
+* **Commit-Triggered Reviews**: Automatically reviews code when commits are made.
+* **Developer Evaluation**: Evaluates a developer's code over a specific time period.

 ## Prerequisites

@@ -68,6 +74,13 @@ Codedog uses environment variables for configuration. You can set these directly
 * `AZURE_OPENAI_DEPLOYMENT_ID="your_gpt_35_turbo_deployment_name"` (Used for code summaries/reviews)
 * `AZURE_OPENAI_GPT4_DEPLOYMENT_ID="your_gpt_4_deployment_name"` (Used for PR summary)
 * *(Optional)* `AZURE_OPENAI_API_VERSION="YYYY-MM-DD"` (Defaults to a recent preview version if not set)
+* **DeepSeek Models**: Set the following for DeepSeek models:
+    * `DEEPSEEK_API_KEY="your_deepseek_api_key"`
+    * *(Optional)* `DEEPSEEK_MODEL="deepseek-chat"` (Default model; options include "deepseek-chat", "deepseek-coder", etc.)
+    * *(Optional)* `DEEPSEEK_API_BASE="https://api.deepseek.com"` (Default API endpoint)
+    * For the **DeepSeek R1 model** specifically:
+        * Set `DEEPSEEK_MODEL="deepseek-r1"`
+        * *(Optional)* `DEEPSEEK_R1_API_BASE="https://your-r1-endpoint"` (If different from the standard DeepSeek endpoint)

 **Example `.env` file:**

@@ -84,6 +97,32 @@ OPENAI_API_KEY="sk-xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx"
 # AZURE_OPENAI_API_BASE="https://your-instance.openai.azure.com/"
 # AZURE_OPENAI_DEPLOYMENT_ID="gpt-35-turbo-16k"
 # AZURE_OPENAI_GPT4_DEPLOYMENT_ID="gpt-4-turbo"
+
+# LLM (DeepSeek example)
+# DEEPSEEK_API_KEY="your_deepseek_api_key"
+# DEEPSEEK_MODEL="deepseek-chat"
+# DEEPSEEK_API_BASE="https://api.deepseek.com"
+
+# LLM (DeepSeek R1 example)
+# DEEPSEEK_API_KEY="your_deepseek_api_key"
+# DEEPSEEK_MODEL="deepseek-r1"
+# DEEPSEEK_R1_API_BASE="https://your-r1-endpoint"
+
+# LLM (MindConnect R1 example)
+# MINDCONNECT_API_KEY="your_mindconnect_api_key"
+
+# Model selection (optional)
+CODE_SUMMARY_MODEL="gpt-3.5"
+PR_SUMMARY_MODEL="gpt-4"
+CODE_REVIEW_MODEL="deepseek" # Can use "deepseek" or "deepseek-r1" here
+
+# Email notification (optional)
+EMAIL_ENABLED="true"
+NOTIFICATION_EMAILS="your_email@example.com,another_email@example.com"
+SMTP_SERVER="smtp.gmail.com"
+SMTP_PORT="587"
+SMTP_USERNAME="your_email@gmail.com"
+SMTP_PASSWORD="your_app_password"
 ```

 ## Running the Example (Quickstart)
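
For orientation, here is a minimal sketch of how the DeepSeek settings above could be exercised. It is not codedog's internal wiring: only the environment variable names come from the `.env` example; the client call relies on DeepSeek's OpenAI-compatible API and the `openai` Python package.

```python
# Hypothetical standalone check of the DeepSeek configuration above.
# Assumes DeepSeek's OpenAI-compatible endpoint and the `openai` Python package.
import os

from openai import OpenAI

client = OpenAI(
    api_key=os.environ["DEEPSEEK_API_KEY"],
    base_url=os.getenv("DEEPSEEK_API_BASE", "https://api.deepseek.com"),
)

response = client.chat.completions.create(
    model=os.getenv("DEEPSEEK_MODEL", "deepseek-chat"),
    messages=[{"role": "user", "content": "Say hello in one short sentence."}],
)
print(response.choices[0].message.content)
```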
+161 -4
@@ -1,3 +1,7 @@
+import json
+import re
+from typing import Dict, List, Tuple, Any
+
 from codedog.actors.reporters.base import Reporter
 from codedog.localization import Localization
 from codedog.models.code_review import CodeReview
@@ -7,6 +11,7 @@ class CodeReviewMarkdownReporter(Reporter, Localization):
     def __init__(self, code_reviews: list[CodeReview], language="en"):
         self._code_reviews: list[CodeReview] = code_reviews
         self._markdown: str = ""
+        self._scores: List[Dict] = []

         super().__init__(language=language)

@@ -16,17 +21,169 @@ def report(self) -> str:

         return self._markdown

+    def _extract_scores(self, review_text: str, file_name: str) -> Dict[str, Any]:
+        """Extract scores from the review text using a simple format."""
+        # Default empty score data
+        default_scores = {
+            "file": file_name,
+            "scores": {
+                "correctness": 0,
+                "readability": 0,
+                "maintainability": 0,
+                "standards_compliance": 0,
+                "performance": 0,
+                "security": 0,
+                "overall": 0
+            }
+        }
+
+        try:
+            # Look for the scores section
+            scores_section = re.search(r'#{1,3}\s*SCORES:\s*([\s\S]*?)(?=#{1,3}|$)', review_text)
+            if not scores_section:
+                print(f"No scores section found for {file_name}")
+                return default_scores
+
+            scores_text = scores_section.group(1)
+
+            # Extract individual scores
+            correctness = self._extract_score(scores_text, "Correctness")
+            readability = self._extract_score(scores_text, "Readability")
+            maintainability = self._extract_score(scores_text, "Maintainability")
+            standards = self._extract_score(scores_text, "Standards Compliance")
+            performance = self._extract_score(scores_text, "Performance")
+            security = self._extract_score(scores_text, "Security")
+            overall = self._extract_score(scores_text, "Overall")
+
+            # Update scores if found
+            if any([correctness, readability, maintainability, standards, performance, security, overall]):
+                return {
+                    "file": file_name,
+                    "scores": {
+                        "correctness": correctness or 0,
+                        "readability": readability or 0,
+                        "maintainability": maintainability or 0,
+                        "standards_compliance": standards or 0,
+                        "performance": performance or 0,
+                        "security": security or 0,
+                        "overall": overall or 0
+                    }
+                }
+
+        except Exception as e:
+            print(f"Error extracting scores from review for {file_name}: {e}")
+
+        return default_scores
+
+    def _extract_score(self, text: str, dimension: str) -> float:
+        """Extract a score for a specific dimension from text."""
+        try:
+            # Find patterns like "Correctness: 4.5 /5" or "- Readability: 3.8/5"
+            pattern = rf'[-\s]*{dimension}:\s*(\d+(?:\.\d+)?)\s*\/?5'
+            match = re.search(pattern, text, re.IGNORECASE)
+            if match:
+                return float(match.group(1))
+        except Exception as e:
+            print(f"Error extracting {dimension} score: {e}")
+        return 0
+
+    def _calculate_average_scores(self) -> Dict:
+        """Calculate the average scores across all files."""
+        if not self._scores:
+            return {
+                "avg_correctness": 0,
+                "avg_readability": 0,
+                "avg_maintainability": 0,
+                "avg_standards": 0,
+                "avg_performance": 0,
+                "avg_security": 0,
+                "avg_overall": 0
+            }
+
+        total_files = len(self._scores)
+        avg_scores = {
+            "avg_correctness": sum(s["scores"]["correctness"] for s in self._scores) / total_files,
+            "avg_readability": sum(s["scores"]["readability"] for s in self._scores) / total_files,
+            "avg_maintainability": sum(s["scores"]["maintainability"] for s in self._scores) / total_files,
+            "avg_standards": sum(s["scores"]["standards_compliance"] for s in self._scores) / total_files,
+            "avg_performance": sum(s["scores"]["performance"] for s in self._scores) / total_files,
+            "avg_security": sum(s["scores"]["security"] for s in self._scores) / total_files,
+            "avg_overall": sum(s["scores"]["overall"] for s in self._scores) / total_files
+        }
+
+        return avg_scores
+
+    def _get_quality_assessment(self, avg_overall: float) -> str:
+        """Generate a quality assessment based on the average overall score."""
+        if avg_overall >= 4.5:
+            return "Excellent code quality. The PR demonstrates outstanding adherence to best practices and coding standards."
+        elif avg_overall >= 4.0:
+            return "Very good code quality. The PR shows strong adherence to standards with only minor improvement opportunities."
+        elif avg_overall >= 3.5:
+            return "Good code quality. The PR meets most standards but has some areas for improvement."
+        elif avg_overall >= 3.0:
+            return "Satisfactory code quality. The PR is acceptable but has several areas that could be improved."
+        elif avg_overall >= 2.0:
+            return "Needs improvement. The PR has significant issues that should be addressed before merging."
+        else:
+            return "Poor code quality. The PR has major issues that must be fixed before it can be accepted."
+
+    def _generate_summary_table(self) -> str:
+        """Generate a summary table of all file scores."""
+        if not self._scores:
+            return ""
+
+        file_score_rows = []
+        for score in self._scores:
+            file_name = score["file"]
+            s = score["scores"]
+            file_score_rows.append(
+                f"| {file_name} | {s['correctness']:.2f} | {s['readability']:.2f} | {s['maintainability']:.2f} | "
+                f"{s['standards_compliance']:.2f} | {s['performance']:.2f} | {s['security']:.2f} | {s['overall']:.2f} |"
+            )
+
+        avg_scores = self._calculate_average_scores()
+        quality_assessment = self._get_quality_assessment(avg_scores["avg_overall"])
+
+        return self.template.PR_REVIEW_SUMMARY_TABLE.format(
+            file_scores="\n".join(file_score_rows),
+            avg_correctness=avg_scores["avg_correctness"],
+            avg_readability=avg_scores["avg_readability"],
+            avg_maintainability=avg_scores["avg_maintainability"],
+            avg_standards=avg_scores["avg_standards"],
+            avg_performance=avg_scores["avg_performance"],
+            avg_security=avg_scores["avg_security"],
+            avg_overall=avg_scores["avg_overall"],
+            quality_assessment=quality_assessment
+        )
+
     def _generate_report(self):
         code_review_segs = []
+
         for code_review in self._code_reviews:
+            # Extract scores if the review is not empty
+            if hasattr(code_review, 'review') and code_review.review.strip():
+                file_name = code_review.file.full_name if hasattr(code_review, 'file') and hasattr(code_review.file, 'full_name') else "Unknown"
+                score_data = self._extract_scores(code_review.review, file_name)
+                self._scores.append(score_data)
+
+            # Add the review text (without modification)
             code_review_segs.append(
                 self.template.REPORT_CODE_REVIEW_SEGMENT.format(
-                    full_name=code_review.file.full_name,
-                    url=code_review.file.diff_url,
-                    review=code_review.review,
+                    full_name=code_review.file.full_name if hasattr(code_review, 'file') and hasattr(code_review.file, 'full_name') else "Unknown",
+                    url=code_review.file.diff_url if hasattr(code_review, 'file') and hasattr(code_review.file, 'diff_url') else "#",
+                    review=code_review.review if hasattr(code_review, 'review') else "",
                 )
             )

-        return self.template.REPORT_CODE_REVIEW.format(
+        # Generate review content
+        review_content = self.template.REPORT_CODE_REVIEW.format(
             feedback="\n".join(code_review_segs) if code_review_segs else self.template.REPORT_CODE_REVIEW_NO_FEEDBACK,
         )
+
+        # Add summary table at the end if we have scores
+        summary_table = self._generate_summary_table()
+        if summary_table:
+            review_content += "\n\n" + summary_table
+
+        return review_content
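
The score extraction above hinges on two regular expressions: one that isolates the `### SCORES:` block and one that pulls each dimension's number. A small standalone sketch, with an invented review snippet, shows what they match:

```python
# Standalone illustration of the score-extraction regexes used by the reporter.
# The sample review text is invented for demonstration purposes.
import re

sample_review = """### SCORES:
- Correctness: 4.5 /5
- Readability: 3.8/5
"""

section = re.search(r'#{1,3}\s*SCORES:\s*([\s\S]*?)(?=#{1,3}|$)', sample_review)
scores_text = section.group(1)

for dimension in ("Correctness", "Readability"):
    match = re.search(rf'[-\s]*{dimension}:\s*(\d+(?:\.\d+)?)\s*\/?5', scores_text, re.IGNORECASE)
    print(dimension, float(match.group(1)) if match else 0)
# Prints: Correctness 4.5, then Readability 3.8
```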

codedog/templates/grimoire_en.py

+100 -1
@@ -134,7 +134,86 @@
 """

 CODE_SUGGESTION = """Act as a Code Reviewer Assistant. I will give a code diff content.
-And I want you to check whether the code change is correct and give some suggestions to the author.
+And I want you to review the code changes, provide detailed feedback, and score the changes based on language-specific standards and best practices.
+
+## Review Requirements:
+1. Check correctness and logic of the code changes
+2. Evaluate adherence to language-specific coding standards
+3. Identify potential bugs, performance issues, or security vulnerabilities
+4. Provide specific, actionable suggestions for improvement
+5. Score the code in multiple dimensions (see scoring system below)
+
+## Language-Specific Standards:
+{language} code should follow these standards:
+
+### Python:
+- PEP 8 style guide (spacing, naming conventions, line length)
+- Proper docstrings (Google, NumPy, or reST style)
+- Type hints for function parameters and return values
+- Error handling with specific exceptions
+- Avoid circular imports and global variables
+- Follow SOLID principles and avoid anti-patterns
+
+### JavaScript/TypeScript:
+- ESLint/TSLint standards
+- Proper async/await or Promise handling
+- Consistent styling (following project's style guide)
+- Proper error handling
+- Type definitions (for TypeScript)
+- Avoid direct DOM manipulation in frameworks
+
+### Java:
+- Follow Oracle Code Conventions
+- Proper exception handling
+- Appropriate access modifiers
+- Clear Javadoc comments
+- Correct resource management and memory handling
+- Follow SOLID principles
+
+### General (for all languages):
+- DRY (Don't Repeat Yourself) principle
+- Clear naming conventions
+- Appropriate comments for complex logic
+- Proper error handling
+- Security best practices
+
+## Scoring System (1-5 scale, where 5 is excellent):
+- **Correctness** (does the code function as intended?)
+- **Readability** (is the code easy to understand?)
+- **Maintainability** (how easy will this code be to maintain?)
+- **Standards Compliance** (does it follow language/framework conventions?)
+- **Performance** (any obvious performance issues?)
+- **Security** (any security concerns?)
+
+## Overall Score:
+- Calculate a weighted average as follows:
+  - Correctness: 30%
+  - Readability: 20%
+  - Maintainability: 20%
+  - Standards Compliance: 15%
+  - Performance: 10%
+  - Security: 5%
+
+## Format your review as follows:
+1. Brief summary of the changes (1-2 sentences)
+2. Detailed feedback with line references where appropriate
+3. Specific suggestions for improvement
+4. Scoring table with justifications for each dimension
+5. Overall score with brief conclusion
+
+## IMPORTANT: Scores Summary
+At the end of your review, include a clearly formatted score summary section like this:
+
+### SCORES:
+- Correctness: [score] /5
+- Readability: [score] /5
+- Maintainability: [score] /5
+- Standards Compliance: [score] /5
+- Performance: [score] /5
+- Security: [score] /5
+- Overall: [calculated_overall_score] /5
+
+Replace [score] with your actual numeric scores (e.g., 4.5).

 Here's the code diff from file {name}:
 ```{language}
154233
Note that the content might be used in markdown or other formatted text,
155234
so don't change the paragraph layout of the content or add symbols.
156235
Your translation:"""
236+
237+
# Template for the summary score table at the end of PR review
238+
PR_REVIEW_SUMMARY_TABLE = """
239+
## PR Review Summary
240+
241+
| File | Correctness | Readability | Maintainability | Standards | Performance | Security | Overall |
242+
|------|-------------|-------------|----------------|-----------|-------------|----------|---------|
243+
{file_scores}
244+
| **Average** | **{avg_correctness:.2f}** | **{avg_readability:.2f}** | **{avg_maintainability:.2f}** | **{avg_standards:.2f}** | **{avg_performance:.2f}** | **{avg_security:.2f}** | **{avg_overall:.2f}** |
245+
246+
### Score Legend:
247+
- 5.00: Excellent
248+
- 4.00-4.99: Very Good
249+
- 3.00-3.99: Good
250+
- 2.00-2.99: Needs Improvement
251+
- 1.00-1.99: Poor
252+
253+
### PR Quality Assessment:
254+
{quality_assessment}
255+
"""

codedog/templates/template_en.py

+19
@@ -89,6 +89,25 @@

 REPORT_CODE_REVIEW_NO_FEEDBACK = """No suggestions for this PR."""

+# --- Code Review Summary Table -----------------------------------------------
+PR_REVIEW_SUMMARY_TABLE = """
+## PR Review Summary
+
+| File | Correctness | Readability | Maintainability | Standards | Performance | Security | Overall |
+|------|-------------|-------------|-----------------|-----------|-------------|----------|---------|
+{file_scores}
+| **Average** | **{avg_correctness:.2f}** | **{avg_readability:.2f}** | **{avg_maintainability:.2f}** | **{avg_standards:.2f}** | **{avg_performance:.2f}** | **{avg_security:.2f}** | **{avg_overall:.2f}** |
+
+### Score Legend:
+- 5.00: Excellent
+- 4.00-4.99: Very Good
+- 3.00-3.99: Good
+- 2.00-2.99: Needs Improvement
+- 1.00-1.99: Poor
+
+### PR Quality Assessment:
+{quality_assessment}
+"""

 # --- Materials ---------------------------------------------------------------
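
To show what the new summary-table template produces, a small usage sketch follows (made-up scores; it assumes this commit's `codedog.templates.template_en` module is importable):

```python
# Hypothetical rendering of PR_REVIEW_SUMMARY_TABLE with invented numbers.
from codedog.templates import template_en

demo_row = "| demo.py | 4.50 | 4.00 | 3.50 | 4.00 | 3.00 | 5.00 | 4.00 |"
print(template_en.PR_REVIEW_SUMMARY_TABLE.format(
    file_scores=demo_row,
    avg_correctness=4.5,
    avg_readability=4.0,
    avg_maintainability=3.5,
    avg_standards=4.0,
    avg_performance=3.0,
    avg_security=5.0,
    avg_overall=4.0,
    quality_assessment="Very good code quality with only minor improvement opportunities.",
))
```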
