refactor: consolidate blockchain explorer into single app and update backup ignore patterns

- Remove standalone explorer-web app (README, HTML, package files) - Add /web endpoint to blockchain-explorer for web interface access - Update .gitignore to exclude application backup archives (*.tar.gz, *.zip) - Add backup documentation files to .gitignore (BACKUP_INDEX.md, README.md) - Consolidate explorer functionality into main blockchain-explorer application
2026-03-06 18:14:49 +01:00
parent dc1561d457
commit bb5363bebc
295 changed files with 35501 additions and 3734 deletions
--- a/apps/miner/production_miner.py
+++ b/apps/miner/production_miner.py
@@ -0,0 +1,469 @@
+#!/usr/bin/env python3
+"""
+Real GPU Miner Client for AITBC - runs on host with actual GPU
+"""
+
+import json
+import time
+import httpx
+import logging
+import sys
+import subprocess
+import os
+from datetime import datetime
+from typing import Dict, Optional
+
+# Configuration
+COORDINATOR_URL = os.environ.get("COORDINATOR_URL", "http://127.0.0.1:8001")
+MINER_ID = os.environ.get("MINER_API_KEY", "miner_test")
+AUTH_TOKEN = os.environ.get("MINER_API_KEY", "miner_test")
+HEARTBEAT_INTERVAL = 15
+MAX_RETRIES = 10
+RETRY_DELAY = 30
+
+# Setup logging with explicit configuration
+LOG_PATH = "/opt/aitbc/logs/production_miner.log"
+os.makedirs(os.path.dirname(LOG_PATH), exist_ok=True)
+
+class FlushHandler(logging.StreamHandler):
+    def emit(self, record):
+        super().emit(record)
+        self.flush()
+
+logging.basicConfig(
+    level=logging.INFO,
+    format='%(asctime)s - %(levelname)s - %(message)s',
+    handlers=[
+        FlushHandler(sys.stdout),
+        logging.FileHandler(LOG_PATH)
+    ]
+)
+logger = logging.getLogger(__name__)
+
+# Force stdout to be unbuffered
+sys.stdout.reconfigure(line_buffering=True)
+sys.stderr.reconfigure(line_buffering=True)
+
+ARCH_MAP = {
+    "4090": "ada_lovelace",
+    "4080": "ada_lovelace",
+    "4070": "ada_lovelace",
+    "4060": "ada_lovelace",
+    "3090": "ampere",
+    "3080": "ampere",
+    "3070": "ampere",
+    "3060": "ampere",
+    "2080": "turing",
+    "2070": "turing",
+    "2060": "turing",
+    "1080": "pascal",
+    "1070": "pascal",
+    "1060": "pascal",
+}
+
+
+def classify_architecture(name: str) -> str:
+    upper = name.upper()
+    for key, arch in ARCH_MAP.items():
+        if key in upper:
+            return arch
+    if "A100" in upper or "V100" in upper or "P100" in upper:
+        return "datacenter"
+    return "unknown"
+
+
+def detect_cuda_version() -> Optional[str]:
+    try:
+        result = subprocess.run(["nvidia-smi", "--query-gpu=driver_version", "--format=csv,noheader"],
+                                capture_output=True, text=True, timeout=5)
+        if result.returncode == 0:
+            return result.stdout.strip()
+    except Exception as e:
+        logger.error(f"Failed to detect CUDA/driver version: {e}")
+    return None
+
+
+def build_gpu_capabilities() -> Dict:
+    gpu_info = get_gpu_info()
+    cuda_version = detect_cuda_version() or "unknown"
+    model = gpu_info["name"] if gpu_info else "Unknown GPU"
+    memory_total = gpu_info["memory_total"] if gpu_info else 0
+    arch = classify_architecture(model) if model else "unknown"
+    edge_optimized = arch in {"ada_lovelace", "ampere", "turing"}
+
+    return {
+        "gpu": {
+            "model": model,
+            "architecture": arch,
+            "consumer_grade": True,
+            "edge_optimized": edge_optimized,
+            "memory_gb": memory_total,
+            "cuda_version": cuda_version,
+            "platform": "CUDA",
+            "supported_tasks": ["inference", "training", "stable-diffusion", "llama"],
+            "max_concurrent_jobs": 1
+        }
+    }
+
+
+def measure_coordinator_latency() -> float:
+    start = time.time()
+    try:
+        resp = httpx.get(f"{COORDINATOR_URL}/health", timeout=3)
+        if resp.status_code == 200:
+            return (time.time() - start) * 1000
+    except Exception:
+        pass
+    return -1.0
+
+
+def get_gpu_info():
+    """Get real GPU information"""
+    try:
+        result = subprocess.run(['nvidia-smi', '--query-gpu=name,memory.total,memory.used,utilization.gpu', 
+                               '--format=csv,noheader,nounits'], 
+                              capture_output=True, text=True, timeout=5)
+        if result.returncode == 0:
+            info = result.stdout.strip().split(', ')
+            return {
+                "name": info[0],
+                "memory_total": int(info[1]),
+                "memory_used": int(info[2]),
+                "utilization": int(info[3])
+            }
+    except Exception as e:
+        logger.error(f"Failed to get GPU info: {e}")
+    return None
+
+def check_ollama():
+    """Check if Ollama is running and has models"""
+    try:
+        response = httpx.get("http://localhost:11434/api/tags", timeout=5)
+        if response.status_code == 200:
+            models = response.json().get('models', [])
+            model_names = [m['name'] for m in models]
+            logger.info(f"Ollama running with models: {model_names}")
+            return True, model_names
+        else:
+            logger.error("Ollama not responding")
+            return False, []
+    except Exception as e:
+        logger.error(f"Ollama check failed: {e}")
+        return False, []
+
+def wait_for_coordinator():
+    """Wait for coordinator to be available"""
+    for i in range(MAX_RETRIES):
+        try:
+            response = httpx.get(f"{COORDINATOR_URL}/health", timeout=5)
+            if response.status_code == 200:
+                logger.info("Coordinator is available!")
+                return True
+        except:
+            pass
+        
+        logger.info(f"Waiting for coordinator... ({i+1}/{MAX_RETRIES})")
+        time.sleep(RETRY_DELAY)
+    
+    logger.error("Coordinator not available after max retries")
+    return False
+
+def register_miner():
+    """Register the miner with the coordinator"""
+    register_data = {
+        "capabilities": build_gpu_capabilities(),
+        "concurrency": 1,
+        "region": "localhost"
+    }
+    
+    headers = {
+        "X-Api-Key": AUTH_TOKEN,
+        "Content-Type": "application/json"
+    }
+    
+    try:
+        response = httpx.post(
+            f"{COORDINATOR_URL}/v1/miners/register?miner_id={MINER_ID}",
+            json=register_data,
+            headers=headers,
+            timeout=10
+        )
+        
+        if response.status_code == 200:
+            data = response.json()
+            logger.info(f"Successfully registered miner: {data}")
+            return data.get("session_token", "demo-token")
+        else:
+            logger.error(f"Registration failed: {response.status_code} - {response.text}")
+            return None
+            
+    except Exception as e:
+        logger.error(f"Registration error: {e}")
+        return None
+
+def send_heartbeat():
+    """Send heartbeat to coordinator with real GPU stats"""
+    gpu_info = get_gpu_info()
+    arch = classify_architecture(gpu_info["name"]) if gpu_info else "unknown"
+    latency_ms = measure_coordinator_latency()
+    
+    if gpu_info:
+        heartbeat_data = {
+            "status": "active",
+            "current_jobs": 0,
+            "last_seen": datetime.utcnow().isoformat(),
+            "gpu_utilization": gpu_info["utilization"],
+            "memory_used": gpu_info["memory_used"],
+            "memory_total": gpu_info["memory_total"],
+            "architecture": arch,
+            "edge_optimized": arch in {"ada_lovelace", "ampere", "turing"},
+            "network_latency_ms": latency_ms,
+        }
+    else:
+        heartbeat_data = {
+            "status": "active",
+            "current_jobs": 0,
+            "last_seen": datetime.utcnow().isoformat(),
+            "gpu_utilization": 0,
+            "memory_used": 0,
+            "memory_total": 0,
+            "architecture": "unknown",
+            "edge_optimized": False,
+            "network_latency_ms": latency_ms,
+        }
+    
+    headers = {
+        "X-Api-Key": AUTH_TOKEN,
+        "Content-Type": "application/json"
+    }
+    
+    try:
+        response = httpx.post(
+            f"{COORDINATOR_URL}/v1/miners/heartbeat?miner_id={MINER_ID}",
+            json=heartbeat_data,
+            headers=headers,
+            timeout=5
+        )
+        
+        if response.status_code == 200:
+            logger.info(f"Heartbeat sent (GPU: {gpu_info['utilization'] if gpu_info else 'N/A'}%)")
+        else:
+            logger.error(f"Heartbeat failed: {response.status_code} - {response.text}")
+            
+    except Exception as e:
+        logger.error(f"Heartbeat error: {e}")
+
+def execute_job(job, available_models):
+    """Execute a job using real GPU resources"""
+    job_id = job.get('job_id')
+    payload = job.get('payload', {})
+    
+    logger.info(f"Executing job {job_id}: {payload}")
+    
+    try:
+        if payload.get('type') == 'inference':
+            # Get the prompt and model
+            prompt = payload.get('prompt', '')
+            model = payload.get('model', 'llama3.2:latest')
+            
+            # Check if model is available
+            if model not in available_models:
+                # Use first available model
+                if available_models:
+                    model = available_models[0]
+                    logger.info(f"Using available model: {model}")
+                else:
+                    raise Exception("No models available in Ollama")
+            
+            # Call Ollama API for real GPU inference
+            logger.info(f"Running inference on GPU with model: {model}")
+            start_time = time.time()
+            
+            ollama_response = httpx.post(
+                "http://localhost:11434/api/generate",
+                json={
+                    "model": model,
+                    "prompt": prompt,
+                    "stream": False
+                },
+                timeout=60
+            )
+            
+            if ollama_response.status_code == 200:
+                result = ollama_response.json()
+                output = result.get('response', '')
+                execution_time = time.time() - start_time
+                
+                # Get GPU stats after execution
+                gpu_after = get_gpu_info()
+                
+                # Submit result back to coordinator
+                submit_result(job_id, {
+                    "result": {
+                        "status": "completed",
+                        "output": output,
+                        "model": model,
+                        "tokens_processed": result.get('eval_count', 0),
+                        "execution_time": execution_time,
+                        "gpu_used": True
+                    },
+                    "metrics": {
+                        "gpu_utilization": gpu_after["utilization"] if gpu_after else 0,
+                        "memory_used": gpu_after["memory_used"] if gpu_after else 0,
+                        "memory_peak": max(gpu_after["memory_used"] if gpu_after else 0, 2048)
+                    }
+                })
+                
+                logger.info(f"Job {job_id} completed in {execution_time:.2f}s")
+                return True
+            else:
+                logger.error(f"Ollama error: {ollama_response.status_code}")
+                submit_result(job_id, {
+                    "result": {
+                        "status": "failed",
+                        "error": f"Ollama error: {ollama_response.text}"
+                    }
+                })
+                return False
+        else:
+            # Unsupported job type
+            logger.error(f"Unsupported job type: {payload.get('type')}")
+            submit_result(job_id, {
+                "result": {
+                    "status": "failed",
+                    "error": f"Unsupported job type: {payload.get('type')}"
+                }
+            })
+            return False
+            
+    except Exception as e:
+        logger.error(f"Job execution error: {e}")
+        submit_result(job_id, {
+            "result": {
+                "status": "failed",
+                "error": str(e)
+            }
+        })
+        return False
+
+def submit_result(job_id, result):
+    """Submit job result to coordinator"""
+    headers = {
+        "X-Api-Key": AUTH_TOKEN,
+        "Content-Type": "application/json"
+    }
+    
+    try:
+        response = httpx.post(
+            f"{COORDINATOR_URL}/v1/miners/{job_id}/result",
+            json=result,
+            headers=headers,
+            timeout=10
+        )
+        
+        if response.status_code == 200:
+            logger.info(f"Result submitted for job {job_id}")
+        else:
+            logger.error(f"Result submission failed: {response.status_code} - {response.text}")
+            
+    except Exception as e:
+        logger.error(f"Result submission error: {e}")
+
+def poll_for_jobs():
+    """Poll for available jobs"""
+    poll_data = {
+        "max_wait_seconds": 5
+    }
+    
+    headers = {
+        "X-Api-Key": AUTH_TOKEN,
+        "Content-Type": "application/json"
+    }
+    
+    try:
+        response = httpx.post(
+            f"{COORDINATOR_URL}/v1/miners/poll",
+            json=poll_data,
+            headers=headers,
+            timeout=10
+        )
+        
+        if response.status_code == 200:
+            job = response.json()
+            logger.info(f"Received job: {job}")
+            return job
+        elif response.status_code == 204:
+            return None
+        else:
+            logger.error(f"Poll failed: {response.status_code} - {response.text}")
+            return None
+            
+    except Exception as e:
+        logger.error(f"Error polling for jobs: {e}")
+        return None
+
+def main():
+    """Main miner loop"""
+    logger.info("Starting Real GPU Miner Client on Host...")
+    
+    # Check GPU availability
+    gpu_info = get_gpu_info()
+    if not gpu_info:
+        logger.error("GPU not available, exiting")
+        # sys.exit(1)
+    
+    logger.info(f"GPU detected: {gpu_info['name']} ({gpu_info['memory_total']}MB)")
+    
+    # Check Ollama
+    ollama_available, models = check_ollama()
+    if not ollama_available:
+        logger.error("Ollama not available - please install and start Ollama")
+        # sys.exit(1)
+
+    logger.info(f"Ollama models available: {', '.join(models)}")
+    
+    # Wait for coordinator
+    if not wait_for_coordinator():
+    # Registration bypassed for testing
+    session_token = "bypass_token"
+    # # sys.exit(1)
+    
+    # Register with coordinator
+    session_token = register_miner()
+    if not session_token:
+        # logger.error("Failed to register, exiting")
+        # sys.exit(1)
+    
+    logger.info("Miner registered successfully, starting main loop...")
+    
+    # Main loop
+    last_heartbeat = 0
+    last_poll = 0
+    
+    try:
+        while True:
+            current_time = time.time()
+            
+            # Send heartbeat
+            if current_time - last_heartbeat >= HEARTBEAT_INTERVAL:
+                send_heartbeat()
+                last_heartbeat = current_time
+            
+            # Poll for jobs
+            if current_time - last_poll >= 3:
+                job = poll_for_jobs()
+                if job:
+                    # Execute the job with real GPU
+                    execute_job(job, models)
+                last_poll = current_time
+            
+            time.sleep(1)
+            
+    except KeyboardInterrupt:
+        logger.info("Shutting down miner...")
+    except Exception as e:
+        logger.error(f"Error in main loop: {e}")
+        # sys.exit(1)
+
+if __name__ == "__main__":
+    main()
--- a/apps/miner/production_miner_fixed.py
+++ b/apps/miner/production_miner_fixed.py
@@ -0,0 +1,467 @@
+#!/usr/bin/env python3
+"""
+Real GPU Miner Client for AITBC - runs on host with actual GPU
+"""
+
+import json
+import time
+import httpx
+import logging
+import sys
+import subprocess
+import os
+from datetime import datetime
+from typing import Dict, Optional
+
+# Configuration
+COORDINATOR_URL = os.environ.get("COORDINATOR_URL", "http://127.0.0.1:8001")
+MINER_ID = os.environ.get("MINER_API_KEY", "miner_test")
+AUTH_TOKEN = os.environ.get("MINER_API_KEY", "miner_test")
+HEARTBEAT_INTERVAL = 15
+MAX_RETRIES = 10
+RETRY_DELAY = 30
+
+# Setup logging with explicit configuration
+LOG_PATH = "/opt/aitbc/logs/host_gpu_miner.log"
+os.makedirs(os.path.dirname(LOG_PATH), exist_ok=True)
+
+class FlushHandler(logging.StreamHandler):
+    def emit(self, record):
+        super().emit(record)
+        self.flush()
+
+logging.basicConfig(
+    level=logging.INFO,
+    format='%(asctime)s - %(levelname)s - %(message)s',
+    handlers=[
+        FlushHandler(sys.stdout),
+        logging.FileHandler(LOG_PATH)
+    ]
+)
+logger = logging.getLogger(__name__)
+
+# Force stdout to be unbuffered
+sys.stdout.reconfigure(line_buffering=True)
+sys.stderr.reconfigure(line_buffering=True)
+
+ARCH_MAP = {
+    "4090": "ada_lovelace",
+    "4080": "ada_lovelace",
+    "4070": "ada_lovelace",
+    "4060": "ada_lovelace",
+    "3090": "ampere",
+    "3080": "ampere",
+    "3070": "ampere",
+    "3060": "ampere",
+    "2080": "turing",
+    "2070": "turing",
+    "2060": "turing",
+    "1080": "pascal",
+    "1070": "pascal",
+    "1060": "pascal",
+}
+
+
+def classify_architecture(name: str) -> str:
+    upper = name.upper()
+    for key, arch in ARCH_MAP.items():
+        if key in upper:
+            return arch
+    if "A100" in upper or "V100" in upper or "P100" in upper:
+        return "datacenter"
+    return "unknown"
+
+
+def detect_cuda_version() -> Optional[str]:
+    try:
+        result = subprocess.run(["nvidia-smi", "--query-gpu=driver_version", "--format=csv,noheader"],
+                                capture_output=True, text=True, timeout=5)
+        if result.returncode == 0:
+            return result.stdout.strip()
+    except Exception as e:
+        logger.error(f"Failed to detect CUDA/driver version: {e}")
+    return None
+
+
+def build_gpu_capabilities() -> Dict:
+    gpu_info = get_gpu_info()
+    cuda_version = detect_cuda_version() or "unknown"
+    model = gpu_info["name"] if gpu_info else "Unknown GPU"
+    memory_total = gpu_info["memory_total"] if gpu_info else 0
+    arch = classify_architecture(model) if model else "unknown"
+    edge_optimized = arch in {"ada_lovelace", "ampere", "turing"}
+
+    return {
+        "gpu": {
+            "model": model,
+            "architecture": arch,
+            "consumer_grade": True,
+            "edge_optimized": edge_optimized,
+            "memory_gb": memory_total,
+            "cuda_version": cuda_version,
+            "platform": "CUDA",
+            "supported_tasks": ["inference", "training", "stable-diffusion", "llama"],
+            "max_concurrent_jobs": 1
+        }
+    }
+
+
+def measure_coordinator_latency() -> float:
+    start = time.time()
+    try:
+        resp = httpx.get(f"{COORDINATOR_URL}/v1/health", timeout=3)
+        if resp.status_code == 200:
+            return (time.time() - start) * 1000
+    except Exception:
+        pass
+    return -1.0
+
+
+def get_gpu_info():
+    """Get real GPU information"""
+    try:
+        result = subprocess.run(['nvidia-smi', '--query-gpu=name,memory.total,memory.used,utilization.gpu', 
+                               '--format=csv,noheader,nounits'], 
+                              capture_output=True, text=True, timeout=5)
+        if result.returncode == 0:
+            info = result.stdout.strip().split(', ')
+            return {
+                "name": info[0],
+                "memory_total": int(info[1]),
+                "memory_used": int(info[2]),
+                "utilization": int(info[3])
+            }
+    except Exception as e:
+        logger.error(f"Failed to get GPU info: {e}")
+    return None
+
+def check_ollama():
+    """Check if Ollama is running and has models"""
+    try:
+        response = httpx.get("http://localhost:11434/api/tags", timeout=5)
+        if response.status_code == 200:
+            models = response.json().get('models', [])
+            model_names = [m['name'] for m in models]
+            logger.info(f"Ollama running with models: {model_names}")
+            return True, model_names
+        else:
+            logger.error("Ollama not responding")
+            return False, []
+    except Exception as e:
+        logger.error(f"Ollama check failed: {e}")
+        return False, []
+
+def wait_for_coordinator():
+    """Wait for coordinator to be available"""
+    for i in range(MAX_RETRIES):
+        try:
+            response = httpx.get(f"{COORDINATOR_URL}/v1/health", timeout=5)
+            if response.status_code == 200:
+                logger.info("Coordinator is available!")
+                return True
+        except:
+            pass
+        
+        logger.info(f"Waiting for coordinator... ({i+1}/{MAX_RETRIES})")
+        time.sleep(RETRY_DELAY)
+    
+    logger.error("Coordinator not available after max retries")
+    return False
+
+def register_miner():
+    """Register the miner with the coordinator"""
+    register_data = {
+        "capabilities": build_gpu_capabilities(),
+        "concurrency": 1,
+        "region": "localhost"
+    }
+    
+    headers = {
+        "X-Api-Key": AUTH_TOKEN,
+        "Content-Type": "application/json"
+    }
+    
+    try:
+        response = httpx.post(
+            f"{COORDINATOR_URL}/v1/miners/register?miner_id={MINER_ID}",
+            json=register_data,
+            headers=headers,
+            timeout=10
+        )
+        
+        if response.status_code == 200:
+            data = response.json()
+            logger.info(f"Successfully registered miner: {data}")
+            return data.get("session_token", "demo-token")
+        else:
+            logger.error(f"Registration failed: {response.status_code} - {response.text}")
+            return None
+            
+    except Exception as e:
+        logger.error(f"Registration error: {e}")
+        return None
+
+def send_heartbeat():
+    """Send heartbeat to coordinator with real GPU stats"""
+    gpu_info = get_gpu_info()
+    arch = classify_architecture(gpu_info["name"]) if gpu_info else "unknown"
+    latency_ms = measure_coordinator_latency()
+    
+    if gpu_info:
+        heartbeat_data = {
+            "status": "active",
+            "current_jobs": 0,
+            "last_seen": datetime.utcnow().isoformat(),
+            "gpu_utilization": gpu_info["utilization"],
+            "memory_used": gpu_info["memory_used"],
+            "memory_total": gpu_info["memory_total"],
+            "architecture": arch,
+            "edge_optimized": arch in {"ada_lovelace", "ampere", "turing"},
+            "network_latency_ms": latency_ms,
+        }
+    else:
+        heartbeat_data = {
+            "status": "active",
+            "current_jobs": 0,
+            "last_seen": datetime.utcnow().isoformat(),
+            "gpu_utilization": 0,
+            "memory_used": 0,
+            "memory_total": 0,
+            "architecture": "unknown",
+            "edge_optimized": False,
+            "network_latency_ms": latency_ms,
+        }
+    
+    headers = {
+        "X-Api-Key": AUTH_TOKEN,
+        "Content-Type": "application/json"
+    }
+    
+    try:
+        response = httpx.post(
+            f"{COORDINATOR_URL}/v1/miners/heartbeat?miner_id={MINER_ID}",
+            json=heartbeat_data,
+            headers=headers,
+            timeout=5
+        )
+        
+        if response.status_code == 200:
+            logger.info(f"Heartbeat sent (GPU: {gpu_info['utilization'] if gpu_info else 'N/A'}%)")
+        else:
+            logger.error(f"Heartbeat failed: {response.status_code} - {response.text}")
+            
+    except Exception as e:
+        logger.error(f"Heartbeat error: {e}")
+
+def execute_job(job, available_models):
+    """Execute a job using real GPU resources"""
+    job_id = job.get('job_id')
+    payload = job.get('payload', {})
+    
+    logger.info(f"Executing job {job_id}: {payload}")
+    
+    try:
+        if payload.get('type') == 'inference':
+            # Get the prompt and model
+            prompt = payload.get('prompt', '')
+            model = payload.get('model', 'llama3.2:latest')
+            
+            # Check if model is available
+            if model not in available_models:
+                # Use first available model
+                if available_models:
+                    model = available_models[0]
+                    logger.info(f"Using available model: {model}")
+                else:
+                    raise Exception("No models available in Ollama")
+            
+            # Call Ollama API for real GPU inference
+            logger.info(f"Running inference on GPU with model: {model}")
+            start_time = time.time()
+            
+            ollama_response = httpx.post(
+                "http://localhost:11434/api/generate",
+                json={
+                    "model": model,
+                    "prompt": prompt,
+                    "stream": False
+                },
+                timeout=60
+            )
+            
+            if ollama_response.status_code == 200:
+                result = ollama_response.json()
+                output = result.get('response', '')
+                execution_time = time.time() - start_time
+                
+                # Get GPU stats after execution
+                gpu_after = get_gpu_info()
+                
+                # Submit result back to coordinator
+                submit_result(job_id, {
+                    "result": {
+                        "status": "completed",
+                        "output": output,
+                        "model": model,
+                        "tokens_processed": result.get('eval_count', 0),
+                        "execution_time": execution_time,
+                        "gpu_used": True
+                    },
+                    "metrics": {
+                        "gpu_utilization": gpu_after["utilization"] if gpu_after else 0,
+                        "memory_used": gpu_after["memory_used"] if gpu_after else 0,
+                        "memory_peak": max(gpu_after["memory_used"] if gpu_after else 0, 2048)
+                    }
+                })
+                
+                logger.info(f"Job {job_id} completed in {execution_time:.2f}s")
+                return True
+            else:
+                logger.error(f"Ollama error: {ollama_response.status_code}")
+                submit_result(job_id, {
+                    "result": {
+                        "status": "failed",
+                        "error": f"Ollama error: {ollama_response.text}"
+                    }
+                })
+                return False
+        else:
+            # Unsupported job type
+            logger.error(f"Unsupported job type: {payload.get('type')}")
+            submit_result(job_id, {
+                "result": {
+                    "status": "failed",
+                    "error": f"Unsupported job type: {payload.get('type')}"
+                }
+            })
+            return False
+            
+    except Exception as e:
+        logger.error(f"Job execution error: {e}")
+        submit_result(job_id, {
+            "result": {
+                "status": "failed",
+                "error": str(e)
+            }
+        })
+        return False
+
+def submit_result(job_id, result):
+    """Submit job result to coordinator"""
+    headers = {
+        "X-Api-Key": AUTH_TOKEN,
+        "Content-Type": "application/json"
+    }
+    
+    try:
+        response = httpx.post(
+            f"{COORDINATOR_URL}/v1/miners/{job_id}/result",
+            json=result,
+            headers=headers,
+            timeout=10
+        )
+        
+        if response.status_code == 200:
+            logger.info(f"Result submitted for job {job_id}")
+        else:
+            logger.error(f"Result submission failed: {response.status_code} - {response.text}")
+            
+    except Exception as e:
+        logger.error(f"Result submission error: {e}")
+
+def poll_for_jobs():
+    """Poll for available jobs"""
+    poll_data = {
+        "max_wait_seconds": 5
+    }
+    
+    headers = {
+        "X-Api-Key": AUTH_TOKEN,
+        "Content-Type": "application/json"
+    }
+    
+    try:
+        response = httpx.post(
+            f"{COORDINATOR_URL}/v1/miners/poll",
+            json=poll_data,
+            headers=headers,
+            timeout=10
+        )
+        
+        if response.status_code == 200:
+            job = response.json()
+            logger.info(f"Received job: {job}")
+            return job
+        elif response.status_code == 204:
+            return None
+        else:
+            logger.error(f"Poll failed: {response.status_code} - {response.text}")
+            return None
+            
+    except Exception as e:
+        logger.error(f"Error polling for jobs: {e}")
+        return None
+
+def main():
+    """Main miner loop"""
+    logger.info("Starting Real GPU Miner Client on Host...")
+    
+    # Check GPU availability
+    gpu_info = get_gpu_info()
+    if not gpu_info:
+        logger.error("GPU not available, exiting")
+        sys.exit(1)
+    
+    logger.info(f"GPU detected: {gpu_info['name']} ({gpu_info['memory_total']}MB)")
+    
+    # Check Ollama
+    ollama_available, models = check_ollama()
+    if not ollama_available:
+        logger.error("Ollama not available - please install and start Ollama")
+        sys.exit(1)
+
+    logger.info(f"Ollama models available: {', '.join(models)}")
+    
+    # Wait for coordinator
+    if not wait_for_coordinator():
+        sys.exit(1)
+    
+    # Register with coordinator
+    session_token = register_miner()
+    if not session_token:
+        logger.error("Failed to register, exiting")
+        sys.exit(1)
+    
+    logger.info("Miner registered successfully, starting main loop...")
+    
+    # Main loop
+    last_heartbeat = 0
+    last_poll = 0
+    
+    try:
+        while True:
+            current_time = time.time()
+            
+            # Send heartbeat
+            if current_time - last_heartbeat >= HEARTBEAT_INTERVAL:
+                send_heartbeat()
+                last_heartbeat = current_time
+            
+            # Poll for jobs
+            if current_time - last_poll >= 3:
+                job = poll_for_jobs()
+                if job:
+                    # Execute the job with real GPU
+                    execute_job(job, models)
+                last_poll = current_time
+            
+            time.sleep(1)
+            
+    except KeyboardInterrupt:
+        logger.info("Shutting down miner...")
+    except Exception as e:
+        logger.error(f"Error in main loop: {e}")
+        sys.exit(1)
+
+if __name__ == "__main__":
+    main()