diff --git a/apps/gpu-service/src/gpu_service/data/__init__.py b/apps/gpu-service/src/gpu_service/data/__init__.py
new file mode 100644
index 00000000..60b1dae9
--- /dev/null
+++ b/apps/gpu-service/src/gpu_service/data/__init__.py
@@ -0,0 +1,7 @@
+"""
+GPU Service data files
+"""
+
+from .consumer_gpu_profiles import CONSUMER_GPU_PROFILES
+
+__all__ = ["CONSUMER_GPU_PROFILES"]
diff --git a/apps/gpu-service/src/gpu_service/data/consumer_gpu_profiles.py b/apps/gpu-service/src/gpu_service/data/consumer_gpu_profiles.py
new file mode 100644
index 00000000..9fc980a4
--- /dev/null
+++ b/apps/gpu-service/src/gpu_service/data/consumer_gpu_profiles.py
@@ -0,0 +1,79 @@
+"""Consumer GPU profiles data for edge GPU service"""
+
+CONSUMER_GPU_PROFILES = {
+    "gtx_1660": {
+        "gpu_model": "NVIDIA GTX 1660",
+        "architecture": "TURING",
+        "memory_gb": 6,
+        "cuda_cores": 1408,
+        "memory_bandwidth_gbps": 192.0,
+        "tensor_cores": 0,
+        "base_clock_mhz": 1530,
+        "boost_clock_mhz": 1785,
+        "power_consumption_w": 120,
+        "thermal_design_power_w": 120,
+        "noise_level_db": 35.0,
+        "fp32_tflops": 5.0,
+        "fp16_tflops": 10.0,
+        "int8_tops": 20.0,
+        "low_latency_mode": True,
+        "mobile_optimized": False,
+        "thermal_throttling_resistance": 0.8,
+        "supported_cuda_versions": ["11.0", "11.1", "11.2"],
+        "supported_tensorrt_versions": ["8.0", "8.1"],
+        "supported_ollama_models": ["llama-7b", "mistral-7b"],
+        "market_price_usd": 250.0,
+        "edge_premium_multiplier": 1.2,
+        "availability_score": 0.9,
+    },
+    "rtx_3060": {
+        "gpu_model": "NVIDIA RTX 3060",
+        "architecture": "AMPERE",
+        "memory_gb": 12,
+        "cuda_cores": 3584,
+        "memory_bandwidth_gbps": 360.0,
+        "tensor_cores": 112,
+        "base_clock_mhz": 1320,
+        "boost_clock_mhz": 1777,
+        "power_consumption_w": 170,
+        "thermal_design_power_w": 170,
+        "noise_level_db": 38.0,
+        "fp32_tflops": 13.0,
+        "fp16_tflops": 26.0,
+        "int8_tops": 52.0,
+        "low_latency_mode": True,
+        "mobile_optimized": False,
+        "thermal_throttling_resistance": 0.85,
+        "supported_cuda_versions": ["11.4", "11.5", "11.6"],
+        "supported_tensorrt_versions": ["8.2", "8.3"],
+        "supported_ollama_models": ["llama-7b", "llama-13b", "mistral-7b", "mixtral-8x7b"],
+        "market_price_usd": 350.0,
+        "edge_premium_multiplier": 1.3,
+        "availability_score": 0.85,
+    },
+    "rtx_4090": {
+        "gpu_model": "NVIDIA RTX 4090",
+        "architecture": "ADA_LOVELACE",
+        "memory_gb": 24,
+        "cuda_cores": 16384,
+        "memory_bandwidth_gbps": 1008.0,
+        "tensor_cores": 512,
+        "base_clock_mhz": 2235,
+        "boost_clock_mhz": 2520,
+        "power_consumption_w": 450,
+        "thermal_design_power_w": 450,
+        "noise_level_db": 42.0,
+        "fp32_tflops": 83.0,
+        "fp16_tflops": 166.0,
+        "int8_tops": 332.0,
+        "low_latency_mode": True,
+        "mobile_optimized": False,
+        "thermal_throttling_resistance": 0.9,
+        "supported_cuda_versions": ["11.8", "12.0"],
+        "supported_tensorrt_versions": ["8.5", "8.6"],
+        "supported_ollama_models": ["llama-7b", "llama-13b", "llama-70b", "mixtral-8x7b", "codellama-34b"],
+        "market_price_usd": 1600.0,
+        "edge_premium_multiplier": 1.5,
+        "availability_score": 0.7,
+    },
+}