feat(03-02): create configurable hardware tier definitions
Some checks failed
Discord Webhook / git (push) Has been cancelled

- Added comprehensive tier definitions for low_end, mid_range, high_end
- Configurable thresholds for RAM, CPU cores, GPU requirements
- Model size recommendations per tier (1B-70B parameter range)
- Performance characteristics and scaling thresholds
- Global settings for model selection and scaling behavior
This commit is contained in:
Mai Development
2026-01-27 18:30:42 -05:00
parent 5d93e9715f
commit 0b4c270632

View File

@@ -0,0 +1,120 @@
---
# Hardware Tier Definitions for Mai
# Configurable thresholds for classifying system capabilities
# Edit these values to adjust tier boundaries without code changes
#
# NOTE(review): indentation was lost in transit (all keys were flattened to
# column 0, producing duplicate top-level keys). Nesting below is
# reconstructed from the key groupings; the tier-level `description` values
# are placed at tier scope since every subsection already carries its own
# `description` — confirm against the original commit (0b4c270632).
tiers:
  # Low-end systems: Basic hardware, small models only
  low_end:
    ram_gb:
      min: 2
      max: 4
      description: "Minimal RAM for basic operations"
    cpu_cores:
      min: 2
      max: 4
      description: "Basic processing capability"
    gpu_required: false
    gpu_vram_gb:
      min: 0
      description: "GPU not required for this tier"
    preferred_models: ["small"]
    model_size_range:
      min: "1B"
      max: "3B"
      description: "Small language models only"
    scaling_thresholds:
      memory_percent: 75
      cpu_percent: 80
      description: "Conservative thresholds for stability on limited hardware"
    performance_characteristics:
      max_conversation_length: "short"
      context_compression: "aggressive"
      response_time: "slow"
      parallel_processing: false
    description: "Entry-level systems requiring conservative resource usage"

  # Mid-range systems: Moderate hardware, small to medium models
  mid_range:
    ram_gb:
      min: 4
      max: 8
      description: "Sufficient RAM for medium-sized models"
    cpu_cores:
      min: 4
      max: 8
      description: "Good multi-core performance"
    gpu_required: false
    gpu_vram_gb:
      min: 0
      max: 4
      description: "Integrated or entry-level GPU acceptable"
    preferred_models: ["small", "medium"]
    model_size_range:
      min: "3B"
      max: "7B"
      description: "Small to medium language models"
    scaling_thresholds:
      memory_percent: 80
      cpu_percent: 85
      description: "Moderate thresholds for balanced performance"
    performance_characteristics:
      max_conversation_length: "medium"
      context_compression: "moderate"
      response_time: "moderate"
      parallel_processing: false
    description: "Consumer-grade systems with balanced capabilities"

  # High-end systems: Powerful hardware, medium to large models
  high_end:
    ram_gb:
      min: 8
      max: null  # null = unbounded upper limit
      description: "Substantial RAM for large models and contexts"
    cpu_cores:
      min: 6
      max: null
      description: "High-performance multi-core processing"
    gpu_required: true
    gpu_vram_gb:
      min: 6
      max: null
      description: "Dedicated GPU with substantial VRAM"
    preferred_models: ["medium", "large"]
    model_size_range:
      min: "7B"
      max: "70B"
      description: "Medium to large language models"
    scaling_thresholds:
      memory_percent: 85
      cpu_percent: 90
      description: "Higher thresholds for maximum utilization"
    performance_characteristics:
      max_conversation_length: "long"
      context_compression: "minimal"
      response_time: "fast"
      parallel_processing: true
    description: "High-performance systems for demanding workloads"
# Global settings
# NOTE(review): indentation reconstructed — the scraped source had every key
# at column 0; nesting below follows the key groupings and section comments.
global:
  # Model selection preferences
  model_selection:
    prefer_gpu: true
    fallback_to_cpu: true
    safety_margin_gb: 1.0
    description: "Keep 1GB RAM free for system stability"

  # Scaling behavior
  scaling:
    check_interval_seconds: 30
    sustained_threshold_minutes: 5
    auto_downgrade: true
    auto_upgrade: false
    description: "Downgrade automatically but require user approval for upgrades"

  # Performance tuning
  performance:
    cache_size_mb: 512
    batch_processing: true
    async_operations: true
    description: "Performance optimizations for capable systems"