trsdn · trsdn · Sep 17, 2025 · Sep 17, 2025 · Sep 17, 2025 · Sep 17, 2025
@@ -41,15 +41,15 @@
 def with_timeout(timeout_seconds: int = 30) -> Any:
    """Decorator to add timeout protection to functions using threading."""

    def decorator(func: Any) -> Any:
        @functools.wraps(func)
        def wrapper(*args: Any, **kwargs: Any) -> Any:
            import threading

            result: list[Any] = [None]
            exception: list[Exception | None] = [None]

            def target() -> None:
                try:
                    result[0] = func(*args, **kwargs)
                except Exception as e:
@@ -126,7 +126,7 @@
        SecurityError: If XML contains dangerous constructs
    """
    try:
        with Path(file_path).open(encoding="utf-8", errors="ignore") as f:
            content = f.read()

        # Check for dangerous XML patterns
@@ -178,7 +178,7 @@
        SecurityError: If JSON is too deeply nested or complex
    """
    try:
        with Path(file_path).open(encoding="utf-8", errors="ignore") as f:
            content = f.read()

        # Check file size first
@@ -193,7 +193,7 @@
            return file_path

        # Check nesting depth
        def check_depth(obj: Any, current_depth: int = 0, max_depth: int = 30) -> None:
            if current_depth > max_depth:
                raise SecurityError("Security violation: JSON recursion depth limit exceeded")

@@ -234,7 +234,7 @@
            raise SecurityError("Security violation: CSV file too large")

        # Analyze CSV structure
        with Path(file_path).open(encoding="utf-8", errors="ignore") as f:
            # Read first few lines to check structure
            sample = f.read(1024 * 1024)  # 1MB sample

@@ -334,7 +334,7 @@
    """

    @functools.wraps(func)
    def wrapper(*args: Any, **kwargs: Any) -> Any:
        start_time = time.time()
        try:
            result = func(*args, **kwargs)
@@ -438,7 +438,7 @@


 @with_timeout(30)  # type: ignore[misc]
 def safe_convert_with_limits(markitdown_instance: MarkItDown, file_path: str) -> Any:
    """
    Safely convert a file with timeout and recursion protection.

@@ -471,7 +471,7 @@
        # Check if file might contain binary data in text format
        file_path_obj = Path(validated_file_path)
        if file_path_obj.exists():
            with Path(validated_file_path).open("rb") as f:
                data = f.read(1024)  # Read first 1KB to check

            # If it's a text file but contains significant binary content
@@ -776,14 +776,12 @@
                         "file_content": {
                             "type": "string",
                             "description": (
-                                "Base64 encoded file content "
-                                "(alternative to file_path)"
+                                "Base64 encoded file content (alternative to file_path)"
                             ),
                         },
                         "filename": {
                             "type": "string",
-                            "description": "Original filename when using "
-                            "file_content",
+                            "description": "Original filename when using file_content",
                         },
                     },
                     "anyOf": [
@@ -799,8 +797,7 @@
             },
             {
                 "name": "convert_directory",
-                "description": "Convert all supported files in a "
-                "directory to Markdown",
+                "description": "Convert all supported files in a directory to Markdown",
                 "inputSchema": {
                     "type": "object",
                     "properties": {
@@ -810,8 +807,7 @@
                         },
                         "output_directory": {
                             "type": "string",
-                            "description": "Path to the output directory "
-                            "(optional)",
+                            "description": "Path to the output directory (optional)",
                         },
                     },
                     "required": ["input_directory"],
@@ -928,7 +924,7 @@
                id=request.id, error={"code": -32603, "message": f"Internal error: {e!s}"}
            )

    async def convert_file_tool(self, request_id: str, arguments: dict[str, Any]) -> MCPResponse:
        """Convert a single file to Markdown"""
        try:
            file_path = arguments.get("file_path")
@@ -1093,7 +1089,7 @@
            },
        )

    async def convert_directory_tool(
        self, request_id: str, arguments: dict[str, Any]
    ) -> MCPResponse:
        """Convert all supported files in a directory"""
@@ -1195,10 +1191,10 @@
                        markdown_content = result.text_content

                        # Write file asynchronously
                        def write_file(
                            path: str = output_path, content: str = markdown_content
                        ) -> None:
                            with Path(path).open("w", encoding="utf-8") as f:
                                f.write(content)

                        await asyncio.get_event_loop().run_in_executor(None, write_file)
@@ -1282,7 +1278,7 @@
                    if response.error is not None:
                        response_dict["error"] = response.error

                    print(json.dumps(response_dict), flush=True)

                except json.JSONDecodeError as e:
                    logger.error(f"Invalid JSON received: {e}")
@@ -1298,7 +1294,7 @@
 def main() -> None:
    """Main entry point for console script"""

    async def run_server() -> None:
        server = MarkItDownMCPServer()
        await server.run()


@@ -10,17 +10,30 @@
 from pathlib import Path
 
 
 def main():
+    # Check for help
+    if len(sys.argv) > 1 and sys.argv[1] in ["--help", "-h", "help"]:
+        print("Usage: analyze-version.py [latest_tag] [force_bump] [override_type]")
+        print("  latest_tag: e.g., 'v1.0.0' (default: v0.0.0)")
+        print("  force_bump: 'true' or 'false' (default: false)")
+        print("  override_type: 'auto', 'patch', 'minor', 'major' (default: auto)")
+        sys.exit(0)
+
     # Get parameters from environment or command line
     latest_tag = sys.argv[1] if len(sys.argv) > 1 else os.environ.get("LATEST_TAG", "v0.0.0")
     force_bump = sys.argv[2] if len(sys.argv) > 2 else os.environ.get("FORCE_BUMP", "false")
     override_type = sys.argv[3] if len(sys.argv) > 3 else os.environ.get("OVERRIDE_TYPE", "auto")
 
+    # Validate latest_tag format
+    if not latest_tag.startswith("v") or latest_tag.count(".") != 2:
+        print(f"Warning: Invalid tag format '{latest_tag}', using v0.0.0")
+        latest_tag = "v0.0.0"
+
     # Get commits since last tag
     commit_range = "HEAD" if latest_tag == "v0.0.0" else f"{latest_tag}..HEAD"
 
    print(f"Analyzing commits since {latest_tag}")
    print(f"Commit range: {commit_range}")

    # Get commits
    result = subprocess.run(
@@ -30,7 +43,7 @@
    )
    commits = result.stdout.strip().split("\n") if result.stdout.strip() else []

    print(f"Found {len(commits)} commits")

    # Parse conventional commits
    breaking_changes = []
@@ -91,19 +104,24 @@
         new_version = "0.1.0"
     else:
         parts = current_version.split(".")
-        major, minor, patch = int(parts[0]), int(parts[1]), int(parts[2])
-
-        if bump_type == "major":
-            major += 1
-            minor = 0
-            patch = 0
-        elif bump_type == "minor":
-            minor += 1
-            patch = 0
-        elif bump_type == "patch":
-            patch += 1
-
-        new_version = f"{major}.{minor}.{patch}"
+        try:
+            major, minor, patch = int(parts[0]), int(parts[1]), int(parts[2])
+        except (ValueError, IndexError):
+            print(f"Error: Cannot parse version '{current_version}', using 0.1.0")
+            new_version = "0.1.0"
+            bump_type = "none"
+        else:
+            if bump_type == "major":
+                major += 1
+                minor = 0
+                patch = 0
+            elif bump_type == "minor":
+                minor += 1
+                patch = 0
+            elif bump_type == "patch":
+                patch += 1
+
+            new_version = f"{major}.{minor}.{patch}"
 
     # Generate changelog
     changelog_entries = []
@@ -156,7 +174,7 @@

    # Output to GitHub Actions
    if "GITHUB_OUTPUT" in os.environ:
        with Path(os.environ["GITHUB_OUTPUT"]).open("a") as f:
            f.write(f"needs-bump={str(needs_bump).lower()}\n")
            f.write(f"bump-type={bump_type}\n")
            f.write(f"new-version={new_version}\n")

@@ -0,0 +1,20 @@
+# CI Workflow Test
+
+This file is created to test if all CI workflows are running correctly with our improved test coverage.
+
+## Test Coverage Improvements
+
+- Added comprehensive security validation tests
+- Added error handling and edge case tests
+- Added utility function tests
+- Achieved 80.68% test coverage (exceeds 80% target)
+- Total of 102 tests now pass
+
+## CI Workflows to Test
+
+- ✅ CI Gates (quality checks, tests, coverage)
+- ✅ PR Feedback (inline annotations)
+- ✅ Security Review Annotations
+- ✅ Code Annotations & Inline Comments
+
+This PR will verify that all workflows run successfully with the new test suite.