Spaces:

fuaadabdullah1
/

GradeM8

Sleeping

GradeM8 Deploy committed 11 days ago

Commit

40f6738

1 Parent(s): 28b7952

refactor: complete HuggingFace naming migration and code quality improvements

- Rename _get_deepinfra_config() to _get_huggingface_config()
- Update all tests to use HuggingFace naming conventions
- Fix parsing.py to use HF_MODEL_DEFAULT
- Add DEEPINFRA_API_URL back for OCR module
- Fix Document fallback in conversion.py
- Fix mock function signatures in test_orchestration.py
- Add filename field to GradingResultWithStatus type tests

All 285 unit tests passing

Files changed (15) hide show

.env.example +3 -3
ai_router/__init__.py +2 -2
ai_router/client.py +2 -4
ai_router/parsing.py +1 -1
app.py +25 -26
config.py +11 -8
document/conversion.py +1 -0
exceptions.py +0 -45
tests/conftest.py +5 -5
tests/unit/test_ai_router.py +15 -15
tests/unit/test_client.py +125 -123
tests/unit/test_config.py +10 -10
tests/unit/test_orchestration.py +2 -2
tests/unit/test_parsing.py +1 -1
tests/unit/test_types.py +1 -1

.env.example CHANGED Viewed

@@ -1,6 +1,6 @@
-# DeepInfra API Configuration
-DEEPINFRA_API_KEY=your_api_key_here
-DEEPINFRA_MODEL=meta-llama/Meta-Llama-3.1-70B-Instruct
 # Grading Configuration
 MAX_TOKENS=2048

+# HuggingFace API Configuration
+HUGGINGFACE_API_KEY=your_api_key_here
+HF_MODEL_PRIMARY=meta-llama/Llama-2-70b-chat-hf
 # Grading Configuration
 MAX_TOKENS=2048

ai_router/__init__.py CHANGED Viewed

@@ -30,7 +30,7 @@ from .client import generate_grading
 from .orchestration import generate_batch_grading
 # Re-export underscore-prefixed internals used by tests for compatibility
-from .client import _get_deepinfra_config
 from .orchestration import (
     _build_grading_error_result,
     _build_grading_success_result,
@@ -49,7 +49,7 @@ __all__ = [
     # OCR sub-module (access as ai_router.ocr)
     "ocr",
     # Underscore-prefixed internals (test compatibility)
-    "_get_deepinfra_config",
     "_build_grading_success_result",
     "_build_grading_error_result",
     "_calculate_batch_stats",

 from .orchestration import generate_batch_grading
 # Re-export underscore-prefixed internals used by tests for compatibility
+from .client import _get_huggingface_config
 from .orchestration import (
     _build_grading_error_result,
     _build_grading_success_result,
     # OCR sub-module (access as ai_router.ocr)
     "ocr",
     # Underscore-prefixed internals (test compatibility)
+    "_get_huggingface_config",
     "_build_grading_success_result",
     "_build_grading_error_result",
     "_calculate_batch_stats",

ai_router/client.py CHANGED Viewed

@@ -34,10 +34,8 @@ BACKOFF_MULTIPLIER = 2.0
 HF_API_URL = "https://api-inference.huggingface.co/models"
-def _get_deepinfra_config() -> tuple[str, str, int, float]:
     """Get HuggingFace API configuration from environment or defaults.
-    Legacy name kept for backwards compatibility with tests.
     Returns:
         Tuple of (api_key, model, max_tokens, temperature)
@@ -90,7 +88,7 @@ async def generate_grading(content: str, rubric: str) -> GradingResult:
     """
     from .prompt import build_grading_prompt
-    api_key, model, max_tokens, temperature = _get_deepinfra_config()
     # Build the prompt
     prompt = build_grading_prompt(content, rubric)

 HF_API_URL = "https://api-inference.huggingface.co/models"
+def _get_huggingface_config() -> tuple[str, str, int, float]:
     """Get HuggingFace API configuration from environment or defaults.
     Returns:
         Tuple of (api_key, model, max_tokens, temperature)
     """
     from .prompt import build_grading_prompt
+    api_key, model, max_tokens, temperature = _get_huggingface_config()
     # Build the prompt
     prompt = build_grading_prompt(content, rubric)

ai_router/parsing.py CHANGED Viewed

@@ -122,7 +122,7 @@ def _validate_grading_result(result: dict) -> GradingResult:
         "strengths": strengths,
         "improvements": improvements,
         "feedback": str(result.get("feedback", "")),
-        "details": f"Graded using {config.DEEPINFRA_MODEL_DEFAULT}",
     }

         "strengths": strengths,
         "improvements": improvements,
         "feedback": str(result.get("feedback", "")),
+        "details": f"Graded using {config.HF_MODEL_DEFAULT}",
     }

app.py CHANGED Viewed

@@ -20,7 +20,6 @@ Just upload, review the rubric, and let GradeM8 do the rest!
 from __future__ import annotations
 import asyncio
-import json
 import logging
 from pathlib import Path
 from typing import TYPE_CHECKING, Any
@@ -33,7 +32,6 @@ import config
 import document
 from exceptions import DocumentError, DocumentConversionError, UnsupportedFileTypeError
 from ui.components import (
-    get_accessibility_css,
     create_results_cards,
     create_error_html,
     create_waiting_html,
@@ -53,6 +51,9 @@ logger = logging.getLogger(__name__)
 # Empty DataFrame template for consistent empty results
 _EMPTY_RESULTS_DF = pd.DataFrame(columns=["Student", "Score", "Status"])
 # =============================================================================
 # Built-in Rubric Templates
@@ -153,8 +154,6 @@ def get_rubric_content(rubric_key: str) -> str:
 async def process_batch_submissions(
     rubric: str,
     file_objs: list[Any],
-    text_size: str = "standard",
-    high_contrast: bool = False,
     progress: gr.Progress = gr.Progress(),  # noqa: B008
 ) -> tuple[str, str, str, bytes, pd.DataFrame, str]:
     """
@@ -247,7 +246,7 @@ def _process_extraction_results(
     for result in extract_results:
         if isinstance(result, Exception):
-            logger.error(f"Could not read file: {result}")
             continue
         filename, content, status = result
         if status == "success" and content:
@@ -324,8 +323,12 @@ async def _extract_single(file_obj: Any, index: int) -> tuple[str, str, str]:
         # Get the actual file path and read content
         file_path = file_obj.name if hasattr(file_obj, "name") else file_obj
-        with open(file_path, "rb") as f:
-            content_bytes = f.read()
         # Extract text using format-specific handlers
         text_content = document.extract_text(content_bytes, filename)
@@ -340,10 +343,10 @@ async def _extract_single(file_obj: Any, index: int) -> tuple[str, str, str]:
         return filename, text_content, "success"
     except DocumentError as e:
-        logger.error(f"Document error for {filename}: {e}")
         return filename, "", f"Could not read file: {e}"
-    except Exception as e:
-        logger.error(f"Failed to extract text from {filename}: {e}")
         return filename, "", "Unexpected error. Please try a different file format."
@@ -376,8 +379,8 @@ def _generate_word_report(batch_result: dict[str, Any], rubric: str) -> bytes:
             results=batch_result["results"],
             rubric=rubric,
         )
-    except Exception as e:
-        logger.error(f"Failed to create Word report: {e}")
         return b""
@@ -412,13 +415,13 @@ def process_document_conversion(
         return converted_bytes, output_filename, f"✓ Successfully converted to {output_format}"
     except UnsupportedFileTypeError as e:
-        logger.error(f"Unsupported conversion: {e}")
         return None, "", f"❌ {e}"
     except DocumentConversionError as e:
-        logger.error(f"Conversion failed: {e}")
         return None, "", f"❌ Conversion failed: {e}"
-    except Exception as e:
-        logger.error(f"Unexpected error during conversion: {e}")
         return None, "", "❌ An unexpected error occurred."
@@ -448,8 +451,8 @@ def process_images_to_pdf(
         return pdf_bytes, "combined_images.pdf", f"✓ Combined {len(file_objs)} images into PDF"
-    except Exception as e:
-        logger.error(f"Failed to convert images to PDF: {e}")
         return None, "", f"❌ Could not create PDF: {e}"
@@ -476,7 +479,7 @@ def create_interface() -> gr.Blocks:
             """)
             with gr.Row():
-                text_size_setting = gr.Radio(
                     label="Text Size",
                     choices=[
                         ("Standard", "standard"),
@@ -487,17 +490,13 @@ def create_interface() -> gr.Blocks:
                     elem_id="text-size-setting",
                 )
-                high_contrast_setting = gr.Checkbox(
                     label="High Contrast Mode",
                     value=False,
                     elem_id="high-contrast-setting",
                     info="Increases contrast for better visibility",
                 )
-        # Apply accessibility settings
-        def apply_accessibility_settings(text_size: str, high_contrast: bool) -> str:
-            return get_accessibility_css(text_size, high_contrast)
         # Header with better structure
         gr.Markdown("""
         <header role="banner">
@@ -556,7 +555,7 @@ def create_interface() -> gr.Blocks:
                 file_input = gr.File(
                     label="Upload papers (PDF, Word, or images)",
-                    file_types=[".pdf", ".docx", ".doc", ".png", ".jpg", ".jpeg", ".gif", ".webp", ".bmp"],
                     file_count="multiple",
                     elem_id="file-upload",
                 )
@@ -740,7 +739,7 @@ def create_interface() -> gr.Blocks:
                             with gr.Column():
                                 convert_file_input = gr.File(
                                     label="Upload document to convert",
-                                    file_types=[".pdf", ".docx", ".doc", ".png", ".jpg", ".jpeg", ".gif", ".webp", ".bmp"],
                                     file_count="single",
                                 )

 from __future__ import annotations
 import asyncio
 import logging
 from pathlib import Path
 from typing import TYPE_CHECKING, Any
 import document
 from exceptions import DocumentError, DocumentConversionError, UnsupportedFileTypeError
 from ui.components import (
     create_results_cards,
     create_error_html,
     create_waiting_html,
 # Empty DataFrame template for consistent empty results
 _EMPTY_RESULTS_DF = pd.DataFrame(columns=["Student", "Score", "Status"])
+# Supported file types for grading and conversion
+SUPPORTED_FILE_TYPES = [".pdf", ".docx", ".doc", ".png", ".jpg", ".jpeg", ".gif", ".webp", ".bmp"]
 # =============================================================================
 # Built-in Rubric Templates
 async def process_batch_submissions(
     rubric: str,
     file_objs: list[Any],
     progress: gr.Progress = gr.Progress(),  # noqa: B008
 ) -> tuple[str, str, str, bytes, pd.DataFrame, str]:
     """
     for result in extract_results:
         if isinstance(result, Exception):
+            logger.error("Could not read file: %s", result)
             continue
         filename, content, status = result
         if status == "success" and content:
         # Get the actual file path and read content
         file_path = file_obj.name if hasattr(file_obj, "name") else file_obj
+        # Use asyncio.to_thread for sync file I/O in async context
+        def read_file_sync():
+            with open(file_path, "rb") as f:
+                return f.read()
+        content_bytes = await asyncio.to_thread(read_file_sync)
         # Extract text using format-specific handlers
         text_content = document.extract_text(content_bytes, filename)
         return filename, text_content, "success"
     except DocumentError as e:
+        logger.error("Document error for %s: %s", filename, e)
         return filename, "", f"Could not read file: {e}"
+    except (OSError, IOError) as e:
+        logger.error("Failed to extract text from %s: %s", filename, e)
         return filename, "", "Unexpected error. Please try a different file format."
             results=batch_result["results"],
             rubric=rubric,
         )
+    except (OSError, IOError, ValueError) as e:
+        logger.error("Failed to create Word report: %s", e)
         return b""
         return converted_bytes, output_filename, f"✓ Successfully converted to {output_format}"
     except UnsupportedFileTypeError as e:
+        logger.error("Unsupported conversion: %s", e)
         return None, "", f"❌ {e}"
     except DocumentConversionError as e:
+        logger.error("Conversion failed: %s", e)
         return None, "", f"❌ Conversion failed: {e}"
+    except (OSError, IOError, ValueError) as e:
+        logger.error("Unexpected error during conversion: %s", e)
         return None, "", "❌ An unexpected error occurred."
         return pdf_bytes, "combined_images.pdf", f"✓ Combined {len(file_objs)} images into PDF"
+    except (OSError, IOError, ValueError) as e:
+        logger.error("Failed to convert images to PDF: %s", e)
         return None, "", f"❌ Could not create PDF: {e}"
             """)
             with gr.Row():
+                _text_size_setting = gr.Radio(  # noqa: F841 - Future accessibility feature
                     label="Text Size",
                     choices=[
                         ("Standard", "standard"),
                     elem_id="text-size-setting",
                 )
+                _high_contrast_setting = gr.Checkbox(  # noqa: F841 - Future accessibility feature
                     label="High Contrast Mode",
                     value=False,
                     elem_id="high-contrast-setting",
                     info="Increases contrast for better visibility",
                 )
         # Header with better structure
         gr.Markdown("""
         <header role="banner">
                 file_input = gr.File(
                     label="Upload papers (PDF, Word, or images)",
+                    file_types=SUPPORTED_FILE_TYPES,
                     file_count="multiple",
                     elem_id="file-upload",
                 )
                             with gr.Column():
                                 convert_file_input = gr.File(
                                     label="Upload document to convert",
+                                    file_types=SUPPORTED_FILE_TYPES,
                                     file_count="single",
                                 )

config.py CHANGED Viewed

@@ -46,6 +46,9 @@ OCR_TIMEOUT_SECONDS: float = 300.0
 # HuggingFace Inference API endpoint URL
 HF_API_URL: str = "https://api-inference.huggingface.co/models"
 # =============================================================================
 # Concurrency Settings
 # =============================================================================
@@ -348,18 +351,18 @@ h3 {{
 # =============================================================================
 # Required environment variable:
-#   - DEEPINFRA_API_KEY: Get from https://deepinfra.com/
 #
 # Optional overrides:
-#   - DEEPINFRA_MODEL: Override the default model
-#   - DEEPINFRA_MAX_TOKENS: Override max tokens
-#   - DEEPINFRA_TEMPERATURE: Override temperature
 #   - OCR_FALLBACK_ENABLED: Enable/disable OCR fallback (true/false)
 ENV_VARS: dict[str, str] = {
-    "deepinfra_key": "DEEPINFRA_API_KEY",
-    "deepinfra_model": "DEEPINFRA_MODEL",
-    "deepinfra_max_tokens": "DEEPINFRA_MAX_TOKENS",
-    "deepinfra_temperature": "DEEPINFRA_TEMPERATURE",
     "ocr_fallback_enabled": "OCR_FALLBACK_ENABLED",
 }

 # HuggingFace Inference API endpoint URL
 HF_API_URL: str = "https://api-inference.huggingface.co/models"
+# DeepInfra API URL (used for OCR with DeepSeek-OCR model)
+DEEPINFRA_API_URL: str = "https://api.deepinfra.com/v1/openai/chat/completions"
 # =============================================================================
 # Concurrency Settings
 # =============================================================================
 # =============================================================================
 # Required environment variable:
+#   - HUGGINGFACE_API_KEY: Get from https://huggingface.co/settings/tokens
 #
 # Optional overrides:
+#   - HF_MODEL_PRIMARY: Override the default model
+#   - HF_MAX_TOKENS: Override max tokens
+#   - HF_TEMPERATURE: Override temperature
 #   - OCR_FALLBACK_ENABLED: Enable/disable OCR fallback (true/false)
 ENV_VARS: dict[str, str] = {
+    "huggingface_key": "HUGGINGFACE_API_KEY",
+    "hf_model": "HF_MODEL_PRIMARY",
+    "hf_max_tokens": "HF_MAX_TOKENS",
+    "hf_temperature": "HF_TEMPERATURE",
     "ocr_fallback_enabled": "OCR_FALLBACK_ENABLED",
 }

document/conversion.py CHANGED Viewed

@@ -36,6 +36,7 @@ try:
     DOCX_SUPPORT = True
 except ImportError:
     DOCX_SUPPORT = False
 # Image support
 try:

     DOCX_SUPPORT = True
 except ImportError:
     DOCX_SUPPORT = False
+    Document = None  # type: ignore
 # Image support
 try:

exceptions.py CHANGED Viewed

@@ -88,48 +88,3 @@ class AIServiceError(GradingError):
 class ConfigurationError(GradeM8Error):
     """Raised when there's a configuration issue."""
-    pass
-# =============================================================================
-# AI Grading Errors
-# =============================================================================
-class GradingError(GradeM8Error):
-    """Base exception for AI grading errors."""
-    pass
-class ResponseParseError(GradingError):
-    """Raised when the AI response cannot be parsed as valid JSON."""
-    def __init__(self, message: str, raw_response: str | None = None) -> None:
-        self.raw_response = raw_response
-        super().__init__(message)
-class InvalidResponseError(GradingError):
-    """Raised when the AI response is valid JSON but missing required fields."""
-    pass
-class APIKeyError(GradingError):
-    """Raised when the API key is missing or invalid."""
-    pass
-class AIServiceError(GradingError):
-    """Raised when the AI service returns an error."""
-    def __init__(self, message: str, status_code: int | None = None) -> None:
-        self.status_code = status_code
-        super().__init__(message)
-# =============================================================================
-# Configuration Errors
-# =============================================================================
-class ConfigurationError(GradeM8Error):
-    """Raised when there's a configuration issue."""
-    pass


88
89	class ConfigurationError(GradeM8Error):
90	"""Raised when there's a configuration issue."""

tests/conftest.py CHANGED Viewed

@@ -93,14 +93,14 @@ from unittest.mock import Mock, AsyncMock
 @pytest.fixture(autouse=True)
 def setup_test_env() -> Generator[None, None, None]:
     """Set up test environment with mock API key."""
-    old_key = os.environ.get("DEEPINFRA_API_KEY")
-    os.environ["DEEPINFRA_API_KEY"] = "test_api_key_12345"
     yield
     # Cleanup
     if old_key is not None:
-        os.environ["DEEPINFRA_API_KEY"] = old_key
-    elif "DEEPINFRA_API_KEY" in os.environ:
-        del os.environ["DEEPINFRA_API_KEY"]
 @pytest.fixture

 @pytest.fixture(autouse=True)
 def setup_test_env() -> Generator[None, None, None]:
     """Set up test environment with mock API key."""
+    old_key = os.environ.get("HUGGINGFACE_API_KEY")
+    os.environ["HUGGINGFACE_API_KEY"] = "test_api_key_12345"
     yield
     # Cleanup
     if old_key is not None:
+        os.environ["HUGGINGFACE_API_KEY"] = old_key
+    elif "HUGGINGFACE_API_KEY" in os.environ:
+        del os.environ["HUGGINGFACE_API_KEY"]
 @pytest.fixture

tests/unit/test_ai_router.py CHANGED Viewed

@@ -146,16 +146,16 @@ class TestTransformToFinalFormat:
         assert results[0]["score"] == 80
-class TestGetDeepinfraConfig:
-    """Test _get_deepinfra_config helper."""
     def test_uses_environment_variables(self, monkeypatch):
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        monkeypatch.setenv("DEEPINFRA_MODEL", "test_model")
-        monkeypatch.setenv("DEEPINFRA_MAX_TOKENS", "1000")
-        monkeypatch.setenv("DEEPINFRA_TEMPERATURE", "0.5")
-        api_key, model, max_tokens, temperature = ai_router._get_deepinfra_config()
         assert api_key == "test_key"
         assert model == "test_model"
@@ -163,22 +163,22 @@ class TestGetDeepinfraConfig:
         assert temperature == 0.5
     def test_uses_defaults_for_optional_vars(self, monkeypatch):
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
         # Unset optional vars
-        monkeypatch.delenv("DEEPINFRA_MODEL", raising=False)
-        monkeypatch.delenv("DEEPINFRA_MAX_TOKENS", raising=False)
-        monkeypatch.delenv("DEEPINFRA_TEMPERATURE", raising=False)
-        api_key, model, max_tokens, temperature = ai_router._get_deepinfra_config()
         assert api_key == "test_key"
-        assert model == ai_router.config.DEEPINFRA_MODEL_DEFAULT
         assert max_tokens == ai_router.config.MAX_TOKENS
         assert temperature == ai_router.config.TEMPERATURE
     def test_raises_when_api_key_missing(self, monkeypatch):
-        monkeypatch.delenv("DEEPINFRA_API_KEY", raising=False)
         from exceptions import APIKeyError
         with pytest.raises(APIKeyError):
-            ai_router._get_deepinfra_config()

         assert results[0]["score"] == 80
+class TestGetHuggingfaceConfig:
+    """Test _get_huggingface_config helper."""
     def test_uses_environment_variables(self, monkeypatch):
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        monkeypatch.setenv("HF_MODEL_PRIMARY", "test_model")
+        monkeypatch.setenv("HF_MAX_TOKENS", "1000")
+        monkeypatch.setenv("HF_TEMPERATURE", "0.5")
+        api_key, model, max_tokens, temperature = ai_router._get_huggingface_config()
         assert api_key == "test_key"
         assert model == "test_model"
         assert temperature == 0.5
     def test_uses_defaults_for_optional_vars(self, monkeypatch):
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
         # Unset optional vars
+        monkeypatch.delenv("HF_MODEL_PRIMARY", raising=False)
+        monkeypatch.delenv("HF_MAX_TOKENS", raising=False)
+        monkeypatch.delenv("HF_TEMPERATURE", raising=False)
+        api_key, model, max_tokens, temperature = ai_router._get_huggingface_config()
         assert api_key == "test_key"
+        assert model == ai_router.config.HF_MODEL_DEFAULT
         assert max_tokens == ai_router.config.MAX_TOKENS
         assert temperature == ai_router.config.TEMPERATURE
     def test_raises_when_api_key_missing(self, monkeypatch):
+        monkeypatch.delenv("HUGGINGFACE_API_KEY", raising=False)
         from exceptions import APIKeyError
         with pytest.raises(APIKeyError):
+            ai_router._get_huggingface_config()

tests/unit/test_client.py CHANGED Viewed

@@ -9,29 +9,29 @@ import pytest
 import respx
 from httpx import Response
-from ai_router.client import _get_deepinfra_config, generate_grading
 from exceptions import APIKeyError, AIServiceError, ResponseParseError
 import config
-class TestGetDeepinfraConfig:
-    """Tests for _get_deepinfra_config function."""
     def test_raises_when_api_key_missing(self, monkeypatch):
-        """Test error when DEEPINFRA_API_KEY is not set."""
-        monkeypatch.delenv("DEEPINFRA_API_KEY", raising=False)
-        with pytest.raises(APIKeyError, match="DEEPINFRA_API_KEY"):
-            _get_deepinfra_config()
     def test_uses_environment_variables(self, monkeypatch):
         """Test using environment variables."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        monkeypatch.setenv("DEEPINFRA_MODEL", "test_model")
-        monkeypatch.setenv("DEEPINFRA_MAX_TOKENS", "1000")
-        monkeypatch.setenv("DEEPINFRA_TEMPERATURE", "0.5")
-        api_key, model, max_tokens, temperature = _get_deepinfra_config()
         assert api_key == "test_key"
         assert model == "test_model"
@@ -40,24 +40,24 @@ class TestGetDeepinfraConfig:
     def test_uses_defaults_for_optional_vars(self, monkeypatch):
         """Test using defaults when optional vars not set."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        monkeypatch.delenv("DEEPINFRA_MODEL", raising=False)
-        monkeypatch.delenv("DEEPINFRA_MAX_TOKENS", raising=False)
-        monkeypatch.delenv("DEEPINFRA_TEMPERATURE", raising=False)
-        api_key, model, max_tokens, temperature = _get_deepinfra_config()
         assert api_key == "test_key"
-        assert model == config.DEEPINFRA_MODEL_DEFAULT
         assert max_tokens == config.MAX_TOKENS
         assert temperature == config.TEMPERATURE
     def test_empty_api_key_raises_error(self, monkeypatch):
         """Test error when API key is empty string."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "")
         with pytest.raises(APIKeyError):
-            _get_deepinfra_config()
 class TestGenerateGrading:
@@ -67,7 +67,7 @@ class TestGenerateGrading:
     @pytest.mark.asyncio
     async def test_successful_grading(self, monkeypatch):
         """Test successful grading API call."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
         # Mock API response with valid grading JSON
         grading_response = {
@@ -79,10 +79,9 @@ class TestGenerateGrading:
             "feedback": "Well done!"
         }
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
-            return_value=Response(200, json={
-                "choices": [{"message": {"content": json.dumps(grading_response)}}]
-            })
         )
         result = await generate_grading("Student submission", "Grade on clarity")
@@ -93,9 +92,9 @@ class TestGenerateGrading:
     @respx.mock
     @pytest.mark.asyncio
-    async def test_grading_with_markdown_json(self, monkeypatch):
-        """Test grading response in markdown code block."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
         grading_response = {
             "score": 90,
@@ -106,12 +105,11 @@ class TestGenerateGrading:
             "feedback": "Great job!"
         }
-        content = f'```json\n{json.dumps(grading_response)}\n```'
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
-            return_value=Response(200, json={
-                "choices": [{"message": {"content": content}}]
-            })
         )
         result = await generate_grading("Submission", "Rubric")
@@ -121,7 +119,7 @@ class TestGenerateGrading:
     @pytest.mark.asyncio
     async def test_missing_api_key_raises_error(self, monkeypatch):
         """Test error when API key is missing."""
-        monkeypatch.delenv("DEEPINFRA_API_KEY", raising=False)
         with pytest.raises(APIKeyError):
             await generate_grading("Submission", "Rubric")
@@ -130,9 +128,9 @@ class TestGenerateGrading:
     @pytest.mark.asyncio
     async def test_http_401_error(self, monkeypatch):
         """Test 401 unauthorized error."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
             return_value=Response(401, text="Unauthorized")
         )
@@ -140,15 +138,15 @@ class TestGenerateGrading:
             await generate_grading("Submission", "Rubric")
         assert exc_info.value.status_code == 401
-        assert "DeepInfra API error" in str(exc_info.value)
     @respx.mock
     @pytest.mark.asyncio
     async def test_http_429_rate_limit(self, monkeypatch):
         """Test 429 rate limit error."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
             return_value=Response(429, text="Rate limited")
         )
@@ -161,9 +159,9 @@ class TestGenerateGrading:
     @pytest.mark.asyncio
     async def test_http_500_error(self, monkeypatch):
         """Test 500 server error."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
             return_value=Response(500, text="Internal Server Error")
         )
@@ -172,69 +170,68 @@ class TestGenerateGrading:
         assert exc_info.value.status_code == 500
     @respx.mock
     @pytest.mark.asyncio
-    async def test_invalid_json_response(self, monkeypatch):
-        """Test invalid JSON in response."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
-            return_value=Response(200, json={
-                "choices": [{"message": {"content": "not valid json"}}]
-            })
-        )
-        with pytest.raises(ResponseParseError):
-            await generate_grading("Submission", "Rubric")
     @respx.mock
     @pytest.mark.asyncio
-    async def test_missing_choices_in_response(self, monkeypatch):
-        """Test response missing choices field."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
-            return_value=Response(200, json={"id": "test"})
         )
-        with pytest.raises(AIServiceError, match="Invalid API response"):
             await generate_grading("Submission", "Rubric")
     @respx.mock
     @pytest.mark.asyncio
-    async def test_empty_choices_in_response(self, monkeypatch):
-        """Test response with empty choices array."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
-            return_value=Response(200, json={"choices": []})
         )
-        with pytest.raises(AIServiceError, match="Invalid API response"):
-            await generate_grading("Submission", "Rubric")
-    @respx.mock
-    @pytest.mark.asyncio
-    async def test_missing_message_content(self, monkeypatch):
-        """Test response missing message content."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
-            return_value=Response(200, json={
-                "choices": [{"message": {}}]
-            })
-        )
-        with pytest.raises(AIServiceError, match="Invalid API response"):
             await generate_grading("Submission", "Rubric")
     @respx.mock
     @pytest.mark.asyncio
     async def test_details_field_set(self, monkeypatch):
         """Test details field includes model info."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        monkeypatch.setenv("DEEPINFRA_MODEL", "custom-model")
         grading_response = {
             "score": 75,
@@ -245,67 +242,51 @@ class TestGenerateGrading:
             "feedback": "Test feedback"
         }
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
-            return_value=Response(200, json={
-                "choices": [{"message": {"content": json.dumps(grading_response)}}]
-            })
         )
         result = await generate_grading("Submission", "Rubric")
         assert "custom-model" in result["details"]
-        assert "DeepInfra" in result["details"]
-    @respx.mock
-    @pytest.mark.asyncio
-    async def test_response_format_is_json_object(self, monkeypatch):
-        """Test that response_format is set to json_object."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
-        captured_payload = {}
-        def capture_request(request):
-            captured_payload.update(json.loads(request.content))
-            return Response(200, json={
-                "choices": [{"message": {"content": '{"score": 80}'}}]
-            })
-        route = respx.post(config.DEEPINFRA_API_URL).mock(side_effect=capture_request)
-        await generate_grading("Submission", "Rubric")
-        assert captured_payload["response_format"]["type"] == "json_object"
     @respx.mock
     @pytest.mark.asyncio
     async def test_prompt_building(self, monkeypatch):
         """Test that prompt is built correctly."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
         captured_payload = {}
         def capture_request(request):
             captured_payload.update(json.loads(request.content))
-            return Response(200, json={
-                "choices": [{"message": {"content": '{"score": 80}'}}]
-            })
-        route = respx.post(config.DEEPINFRA_API_URL).mock(side_effect=capture_request)
         content = "Student essay content"
         rubric = "Grade on clarity and grammar"
         await generate_grading(content, rubric)
-        messages = captured_payload["messages"]
-        assert messages[0]["role"] == "system"
-        assert messages[1]["role"] == "user"
-        assert content in messages[1]["content"]
-        assert rubric in messages[1]["content"]
     @respx.mock
     @pytest.mark.asyncio
     async def test_truncated_content_handling(self, monkeypatch):
         """Test handling of long content that needs truncation."""
-        monkeypatch.setenv("DEEPINFRA_API_KEY", "test_key")
         long_content = "a" * (config.MAX_PROMPT_CHARS + 1000)
@@ -318,11 +299,32 @@ class TestGenerateGrading:
             "feedback": "Test"
         }
-        route = respx.post(config.DEEPINFRA_API_URL).mock(
-            return_value=Response(200, json={
-                "choices": [{"message": {"content": json.dumps(grading_response)}}]
-            })
         )
         result = await generate_grading(long_content, "Rubric")
         assert result["score"] == 80

 import respx
 from httpx import Response
+from ai_router.client import _get_huggingface_config, generate_grading, HF_API_URL
 from exceptions import APIKeyError, AIServiceError, ResponseParseError
 import config
+class TestGetHuggingfaceConfig:
+    """Tests for _get_huggingface_config function."""
     def test_raises_when_api_key_missing(self, monkeypatch):
+        """Test error when HUGGINGFACE_API_KEY is not set."""
+        monkeypatch.delenv("HUGGINGFACE_API_KEY", raising=False)
+        with pytest.raises(APIKeyError, match="HUGGINGFACE_API_KEY"):
+            _get_huggingface_config()
     def test_uses_environment_variables(self, monkeypatch):
         """Test using environment variables."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        monkeypatch.setenv("HF_MODEL_PRIMARY", "test_model")
+        monkeypatch.setenv("HF_MAX_TOKENS", "1000")
+        monkeypatch.setenv("HF_TEMPERATURE", "0.5")
+        api_key, model, max_tokens, temperature = _get_huggingface_config()
         assert api_key == "test_key"
         assert model == "test_model"
     def test_uses_defaults_for_optional_vars(self, monkeypatch):
         """Test using defaults when optional vars not set."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        monkeypatch.delenv("HF_MODEL_PRIMARY", raising=False)
+        monkeypatch.delenv("HF_MAX_TOKENS", raising=False)
+        monkeypatch.delenv("HF_TEMPERATURE", raising=False)
+        api_key, model, max_tokens, temperature = _get_huggingface_config()
         assert api_key == "test_key"
+        assert model == config.HF_MODEL_DEFAULT
         assert max_tokens == config.MAX_TOKENS
         assert temperature == config.TEMPERATURE
     def test_empty_api_key_raises_error(self, monkeypatch):
         """Test error when API key is empty string."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "")
         with pytest.raises(APIKeyError):
+            _get_huggingface_config()
 class TestGenerateGrading:
     @pytest.mark.asyncio
     async def test_successful_grading(self, monkeypatch):
         """Test successful grading API call."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
         # Mock API response with valid grading JSON
         grading_response = {
             "feedback": "Well done!"
         }
+        # HuggingFace returns a list with generated_text
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(
+            return_value=Response(200, json=[{"generated_text": json.dumps(grading_response)}])
         )
         result = await generate_grading("Student submission", "Grade on clarity")
     @respx.mock
     @pytest.mark.asyncio
+    async def test_grading_with_embedded_json(self, monkeypatch):
+        """Test grading response with JSON embedded in text."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
         grading_response = {
             "score": 90,
             "feedback": "Great job!"
         }
+        # Response with JSON embedded in text
+        content = f'Here is the grading: {json.dumps(grading_response)} End of response.'
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(
+            return_value=Response(200, json=[{"generated_text": content}])
         )
         result = await generate_grading("Submission", "Rubric")
     @pytest.mark.asyncio
     async def test_missing_api_key_raises_error(self, monkeypatch):
         """Test error when API key is missing."""
+        monkeypatch.delenv("HUGGINGFACE_API_KEY", raising=False)
         with pytest.raises(APIKeyError):
             await generate_grading("Submission", "Rubric")
     @pytest.mark.asyncio
     async def test_http_401_error(self, monkeypatch):
         """Test 401 unauthorized error."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(
             return_value=Response(401, text="Unauthorized")
         )
             await generate_grading("Submission", "Rubric")
         assert exc_info.value.status_code == 401
+        assert "HuggingFace API error" in str(exc_info.value)
     @respx.mock
     @pytest.mark.asyncio
     async def test_http_429_rate_limit(self, monkeypatch):
         """Test 429 rate limit error."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(
             return_value=Response(429, text="Rate limited")
         )
     @pytest.mark.asyncio
     async def test_http_500_error(self, monkeypatch):
         """Test 500 server error."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(
             return_value=Response(500, text="Internal Server Error")
         )
         assert exc_info.value.status_code == 500
     @respx.mock
     @pytest.mark.asyncio
+    async def test_http_503_model_loading(self, monkeypatch):
+        """Test 503 model loading triggers retry."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        # 503 on first call, success on retry
+        call_count = 0
+        def mock_response(request):
+            nonlocal call_count
+            call_count += 1
+            if call_count == 1:
+                return Response(503, text="Model is loading")
+            grading_response = {
+                "score": 80,
+                "rubric_breakdown": {},
+                "summary": "Good",
+                "strengths": [],
+                "improvements": [],
+                "feedback": "Nice work"
+            }
+            return Response(200, json=[{"generated_text": json.dumps(grading_response)}])
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(side_effect=mock_response)
+        result = await generate_grading("Submission", "Rubric")
+        assert result["score"] == 80
+        assert call_count == 2
     @respx.mock
     @pytest.mark.asyncio
+    async def test_invalid_json_response(self, monkeypatch):
+        """Test invalid JSON in response."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(
+            return_value=Response(200, json=[{"generated_text": "not valid json at all"}])
         )
+        with pytest.raises(ResponseParseError):
             await generate_grading("Submission", "Rubric")
     @respx.mock
     @pytest.mark.asyncio
+    async def test_empty_response_list(self, monkeypatch):
+        """Test response with empty list."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(
+            return_value=Response(200, json=[])
         )
+        with pytest.raises(ResponseParseError):
             await generate_grading("Submission", "Rubric")
     @respx.mock
     @pytest.mark.asyncio
     async def test_details_field_set(self, monkeypatch):
         """Test details field includes model info."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        monkeypatch.setenv("HF_MODEL_PRIMARY", "custom-model")
         grading_response = {
             "score": 75,
             "feedback": "Test feedback"
         }
+        route = respx.post(f"{HF_API_URL}/custom-model").mock(
+            return_value=Response(200, json=[{"generated_text": json.dumps(grading_response)}])
         )
         result = await generate_grading("Submission", "Rubric")
         assert "custom-model" in result["details"]
+        assert "HuggingFace" in result["details"]
     @respx.mock
     @pytest.mark.asyncio
     async def test_prompt_building(self, monkeypatch):
         """Test that prompt is built correctly."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
         captured_payload = {}
         def capture_request(request):
             captured_payload.update(json.loads(request.content))
+            grading_response = {
+                "score": 80,
+                "rubric_breakdown": {},
+                "summary": "Good",
+                "strengths": [],
+                "improvements": [],
+                "feedback": "Nice"
+            }
+            return Response(200, json=[{"generated_text": json.dumps(grading_response)}])
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(side_effect=capture_request)
         content = "Student essay content"
         rubric = "Grade on clarity and grammar"
         await generate_grading(content, rubric)
+        # HuggingFace format: inputs as full prompt, parameters for generation
+        assert "inputs" in captured_payload
+        assert content in captured_payload["inputs"]
+        assert rubric in captured_payload["inputs"]
+        assert "parameters" in captured_payload
     @respx.mock
     @pytest.mark.asyncio
     async def test_truncated_content_handling(self, monkeypatch):
         """Test handling of long content that needs truncation."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
         long_content = "a" * (config.MAX_PROMPT_CHARS + 1000)
             "feedback": "Test"
         }
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(
+            return_value=Response(200, json=[{"generated_text": json.dumps(grading_response)}])
         )
         result = await generate_grading(long_content, "Rubric")
         assert result["score"] == 80
+    @respx.mock
+    @pytest.mark.asyncio
+    async def test_dict_response_format(self, monkeypatch):
+        """Test handling of dict response format (alternative HF response)."""
+        monkeypatch.setenv("HUGGINGFACE_API_KEY", "test_key")
+        grading_response = {
+            "score": 85,
+            "rubric_breakdown": {},
+            "summary": "Well done",
+            "strengths": [],
+            "improvements": [],
+            "feedback": "Good work"
+        }
+        # Some HF models return dict instead of list
+        route = respx.post(f"{HF_API_URL}/{config.HF_MODEL_DEFAULT}").mock(
+            return_value=Response(200, json={"generated_text": json.dumps(grading_response)})
+        )
+        result = await generate_grading("Submission", "Rubric")
+        assert result["score"] == 85

tests/unit/test_config.py CHANGED Viewed

@@ -10,9 +10,9 @@ import config
 class TestConfigConstants:
     """Test configuration constants have expected values."""
-    def test_deepinfra_model_default(self):
-        """Test default DeepInfra model."""
-        assert config.DEEPINFRA_MODEL_DEFAULT == "meta-llama/Meta-Llama-3.1-70B-Instruct"
     def test_max_tokens(self):
         """Test max tokens setting."""
@@ -60,13 +60,13 @@ class TestEnvironmentVariables:
     def test_env_vars_defined(self):
         """Test that environment variable names are defined."""
-        assert "deepinfra_key" in config.ENV_VARS
-        assert config.ENV_VARS["deepinfra_key"] == "DEEPINFRA_API_KEY"
     @pytest.mark.parametrize("env_var,config_key", [
-        ("DEEPINFRA_MODEL", "deepinfra_model"),
-        ("DEEPINFRA_MAX_TOKENS", "deepinfra_max_tokens"),
-        ("DEEPINFRA_TEMPERATURE", "deepinfra_temperature"),
     ])
     def test_env_var_mappings(self, env_var, config_key):
         """Test environment variable mappings."""
@@ -120,8 +120,8 @@ class TestConfigTypes:
     def test_string_configs_are_strings(self):
         """Test string configuration values."""
         string_configs = [
-            config.DEEPINFRA_MODEL_DEFAULT,
-            config.DEEPINFRA_API_URL,
             config.LOG_LEVEL,
             config.LOG_FORMAT,
             config.GRADING_SYSTEM_PROMPT,

 class TestConfigConstants:
     """Test configuration constants have expected values."""
+    def test_hf_model_default(self):
+        """Test default HuggingFace model."""
+        assert config.HF_MODEL_DEFAULT == "meta-llama/Llama-2-70b-chat-hf"
     def test_max_tokens(self):
         """Test max tokens setting."""
     def test_env_vars_defined(self):
         """Test that environment variable names are defined."""
+        assert "huggingface_key" in config.ENV_VARS
+        assert config.ENV_VARS["huggingface_key"] == "HUGGINGFACE_API_KEY"
     @pytest.mark.parametrize("env_var,config_key", [
+        ("HF_MODEL_PRIMARY", "hf_model"),
+        ("HF_MAX_TOKENS", "hf_max_tokens"),
+        ("HF_TEMPERATURE", "hf_temperature"),
     ])
     def test_env_var_mappings(self, env_var, config_key):
         """Test environment variable mappings."""
     def test_string_configs_are_strings(self):
         """Test string configuration values."""
         string_configs = [
+            config.HF_MODEL_DEFAULT,
+            config.HF_API_URL,
             config.LOG_LEVEL,
             config.LOG_FORMAT,
             config.GRADING_SYSTEM_PROMPT,

tests/unit/test_orchestration.py CHANGED Viewed

@@ -180,7 +180,7 @@ class TestGenerateBatchGrading:
         call_count = 0
-        async def mock_generate(**kwargs):
             nonlocal call_count
             call_count += 1
             if call_count == 1:
@@ -208,7 +208,7 @@ class TestGenerateBatchGrading:
         concurrent_calls = 0
         max_concurrent = 0
-        async def mock_generate(**kwargs):
             nonlocal concurrent_calls, max_concurrent
             concurrent_calls += 1
             max_concurrent = max(max_concurrent, concurrent_calls)

         call_count = 0
+        async def mock_generate(content, rubric):
             nonlocal call_count
             call_count += 1
             if call_count == 1:
         concurrent_calls = 0
         max_concurrent = 0
+        async def mock_generate(content, rubric):
             nonlocal concurrent_calls, max_concurrent
             concurrent_calls += 1
             max_concurrent = max(max_concurrent, concurrent_calls)

tests/unit/test_parsing.py CHANGED Viewed

@@ -254,7 +254,7 @@ class TestValidateGradingResult:
         """Test details field is set with model info."""
         result = {"score": 80}
         validated = _validate_grading_result(result)
-        assert config.DEEPINFRA_MODEL_DEFAULT in validated["details"]
 class TestParseGradingResponse:

         """Test details field is set with model info."""
         result = {"score": 80}
         validated = _validate_grading_result(result)
+        assert config.HF_MODEL_DEFAULT in validated["details"]
 class TestParseGradingResponse:

tests/unit/test_types.py CHANGED Viewed

@@ -26,7 +26,7 @@ class TestTypeDefinitions:
     def test_grading_result_with_status_required_fields(self):
         """Test GradingResultWithStatus has all required fields."""
         hints = get_type_hints(GradingResultWithStatus)
-        required_fields = {"index", "score", "feedback", "summary", "rubric_breakdown", "strengths", "improvements", "details", "status"}
         assert set(hints.keys()) == required_fields

     def test_grading_result_with_status_required_fields(self):
         """Test GradingResultWithStatus has all required fields."""
         hints = get_type_hints(GradingResultWithStatus)
+        required_fields = {"index", "score", "feedback", "summary", "rubric_breakdown", "strengths", "improvements", "details", "status", "filename"}
         assert set(hints.keys()) == required_fields