chansung committed (verified)
Commit 05da800 · 1 Parent(s): 4bf314f

Upload folder using huggingface_hub

Files changed (2)
  1. auto_diffusers.log +907 -0
  2. gradio_app.py +331 -29
auto_diffusers.log CHANGED
@@ -18538,3 +18538,910 @@ IMPORTANT GUIDELINES:
  2025-06-05 01:24:20,475 - simple_memory_calculator - DEBUG - Model memory: 24.0GB, Inference memory: 36.0GB
  2025-06-05 01:24:20,475 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
  2025-06-05 01:24:20,475 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
18541
+ 2025-06-11 10:50:13,595 - __main__ - INFO - Initializing GradioAutodiffusers
18542
+ 2025-06-11 10:50:13,595 - __main__ - DEBUG - API key found, length: 39
18543
+ 2025-06-11 10:50:13,595 - auto_diffusers - INFO - Initializing AutoDiffusersGenerator
18544
+ 2025-06-11 10:50:13,595 - auto_diffusers - DEBUG - API key length: 39
18545
+ 2025-06-11 10:50:13,595 - auto_diffusers - WARNING - Tool calling dependencies not available, running without tools
18546
+ 2025-06-11 10:50:13,596 - hardware_detector - INFO - Initializing HardwareDetector
18547
+ 2025-06-11 10:50:13,596 - hardware_detector - DEBUG - Starting system hardware detection
18548
+ 2025-06-11 10:50:13,596 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
18549
+ 2025-06-11 10:50:13,596 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
18550
+ 2025-06-11 10:50:13,596 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
18551
+ 2025-06-11 10:50:13,599 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
18552
+ 2025-06-11 10:50:13,599 - hardware_detector - DEBUG - Checking PyTorch availability
18553
+ 2025-06-11 10:50:15,597 - hardware_detector - INFO - PyTorch 2.7.0 detected
18554
+ 2025-06-11 10:50:15,597 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
18555
+ 2025-06-11 10:50:15,597 - hardware_detector - INFO - Hardware detection completed successfully
18556
+ 2025-06-11 10:50:15,597 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
18557
+ 2025-06-11 10:50:15,597 - auto_diffusers - INFO - Hardware detector initialized successfully
18558
+ 2025-06-11 10:50:15,597 - __main__ - INFO - AutoDiffusersGenerator initialized successfully
18559
+ 2025-06-11 10:50:15,597 - simple_memory_calculator - INFO - Initializing SimpleMemoryCalculator
18560
+ 2025-06-11 10:50:15,597 - simple_memory_calculator - DEBUG - HuggingFace API initialized
18561
+ 2025-06-11 10:50:15,597 - simple_memory_calculator - DEBUG - Known models in database: 4
18562
+ 2025-06-11 10:50:15,597 - __main__ - INFO - SimpleMemoryCalculator initialized successfully
18563
+ 2025-06-11 10:50:15,597 - __main__ - DEBUG - Default model settings: gemini-2.5-flash-preview-05-20, temp=0.7
18564
+ 2025-06-11 10:50:15,599 - asyncio - DEBUG - Using selector: KqueueSelector
18565
+ 2025-06-11 10:50:15,611 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=3 socket_options=None
18566
+ 2025-06-11 10:50:15,620 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
18567
+ 2025-06-11 10:50:15,847 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x140ba7210>
18568
+ 2025-06-11 10:50:15,847 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x140aa1eb0> server_hostname='api.gradio.app' timeout=3
18569
+ 2025-06-11 10:50:15,853 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/initiated HTTP/1.1" 200 0
18570
+ 2025-06-11 10:50:16,123 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x140d913d0>
18571
+ 2025-06-11 10:50:16,123 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
18572
+ 2025-06-11 10:50:16,124 - httpcore.http11 - DEBUG - send_request_headers.complete
18573
+ 2025-06-11 10:50:16,124 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
18574
+ 2025-06-11 10:50:16,124 - httpcore.http11 - DEBUG - send_request_body.complete
18575
+ 2025-06-11 10:50:16,125 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
18576
+ 2025-06-11 10:50:16,263 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 01:50:16 GMT'), (b'Content-Type', b'application/json'), (b'Content-Length', b'21'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'Access-Control-Allow-Origin', b'*')])
18577
+ 2025-06-11 10:50:16,263 - httpx - INFO - HTTP Request: GET https://api.gradio.app/pkg-version "HTTP/1.1 200 OK"
18578
+ 2025-06-11 10:50:16,264 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
18579
+ 2025-06-11 10:50:16,264 - httpcore.http11 - DEBUG - receive_response_body.complete
18580
+ 2025-06-11 10:50:16,264 - httpcore.http11 - DEBUG - response_closed.started
18581
+ 2025-06-11 10:50:16,264 - httpcore.http11 - DEBUG - response_closed.complete
18582
+ 2025-06-11 10:50:16,264 - httpcore.connection - DEBUG - close.started
18583
+ 2025-06-11 10:50:16,265 - httpcore.connection - DEBUG - close.complete
18584
+ 2025-06-11 10:51:30,295 - __main__ - INFO - Initializing GradioAutodiffusers
18585
+ 2025-06-11 10:51:30,295 - __main__ - DEBUG - API key found, length: 39
18586
+ 2025-06-11 10:51:30,295 - auto_diffusers - INFO - Initializing AutoDiffusersGenerator
18587
+ 2025-06-11 10:51:30,296 - auto_diffusers - DEBUG - API key length: 39
18588
+ 2025-06-11 10:51:30,296 - auto_diffusers - WARNING - Tool calling dependencies not available, running without tools
18589
+ 2025-06-11 10:51:30,296 - hardware_detector - INFO - Initializing HardwareDetector
18590
+ 2025-06-11 10:51:30,296 - hardware_detector - DEBUG - Starting system hardware detection
18591
+ 2025-06-11 10:51:30,296 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
18592
+ 2025-06-11 10:51:30,296 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
18593
+ 2025-06-11 10:51:30,296 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
18594
+ 2025-06-11 10:51:30,299 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
18595
+ 2025-06-11 10:51:30,299 - hardware_detector - DEBUG - Checking PyTorch availability
18596
+ 2025-06-11 10:51:30,748 - hardware_detector - INFO - PyTorch 2.7.0 detected
18597
+ 2025-06-11 10:51:30,748 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
18598
+ 2025-06-11 10:51:30,749 - hardware_detector - INFO - Hardware detection completed successfully
18599
+ 2025-06-11 10:51:30,749 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
18600
+ 2025-06-11 10:51:30,749 - auto_diffusers - INFO - Hardware detector initialized successfully
18601
+ 2025-06-11 10:51:30,749 - __main__ - INFO - AutoDiffusersGenerator initialized successfully
18602
+ 2025-06-11 10:51:30,749 - simple_memory_calculator - INFO - Initializing SimpleMemoryCalculator
18603
+ 2025-06-11 10:51:30,749 - simple_memory_calculator - DEBUG - HuggingFace API initialized
18604
+ 2025-06-11 10:51:30,749 - simple_memory_calculator - DEBUG - Known models in database: 4
18605
+ 2025-06-11 10:51:30,749 - __main__ - INFO - SimpleMemoryCalculator initialized successfully
18606
+ 2025-06-11 10:51:30,749 - __main__ - DEBUG - Default model settings: gemini-2.5-flash-preview-05-20, temp=0.7
18607
+ 2025-06-11 10:51:30,751 - asyncio - DEBUG - Using selector: KqueueSelector
18608
+ 2025-06-11 10:51:30,764 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=3 socket_options=None
18609
+ 2025-06-11 10:51:30,771 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
18610
+ 2025-06-11 10:51:30,850 - asyncio - DEBUG - Using selector: KqueueSelector
18611
+ 2025-06-11 10:51:30,883 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=None socket_options=None
18612
+ 2025-06-11 10:51:30,884 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x119eae950>
18613
+ 2025-06-11 10:51:30,884 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
18614
+ 2025-06-11 10:51:30,884 - httpcore.http11 - DEBUG - send_request_headers.complete
18615
+ 2025-06-11 10:51:30,884 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
18616
+ 2025-06-11 10:51:30,884 - httpcore.http11 - DEBUG - send_request_body.complete
18617
+ 2025-06-11 10:51:30,885 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
18618
+ 2025-06-11 10:51:30,885 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 01:51:30 GMT'), (b'server', b'uvicorn'), (b'content-length', b'4'), (b'content-type', b'application/json')])
18619
+ 2025-06-11 10:51:30,885 - httpx - INFO - HTTP Request: GET http://localhost:7860/gradio_api/startup-events "HTTP/1.1 200 OK"
18620
+ 2025-06-11 10:51:30,885 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
18621
+ 2025-06-11 10:51:30,885 - httpcore.http11 - DEBUG - receive_response_body.complete
18622
+ 2025-06-11 10:51:30,885 - httpcore.http11 - DEBUG - response_closed.started
18623
+ 2025-06-11 10:51:30,885 - httpcore.http11 - DEBUG - response_closed.complete
18624
+ 2025-06-11 10:51:30,885 - httpcore.connection - DEBUG - close.started
18625
+ 2025-06-11 10:51:30,885 - httpcore.connection - DEBUG - close.complete
18626
+ 2025-06-11 10:51:30,886 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=3 socket_options=None
18627
+ 2025-06-11 10:51:30,886 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11fb5e210>
18628
+ 2025-06-11 10:51:30,886 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'HEAD']>
18629
+ 2025-06-11 10:51:30,886 - httpcore.http11 - DEBUG - send_request_headers.complete
18630
+ 2025-06-11 10:51:30,886 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'HEAD']>
18631
+ 2025-06-11 10:51:30,886 - httpcore.http11 - DEBUG - send_request_body.complete
18632
+ 2025-06-11 10:51:30,886 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'HEAD']>
18633
+ 2025-06-11 10:51:30,894 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 01:51:30 GMT'), (b'server', b'uvicorn'), (b'content-length', b'138668'), (b'content-type', b'text/html; charset=utf-8')])
18634
+ 2025-06-11 10:51:30,894 - httpx - INFO - HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
18635
+ 2025-06-11 10:51:30,894 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'HEAD']>
18636
+ 2025-06-11 10:51:30,894 - httpcore.http11 - DEBUG - receive_response_body.complete
18637
+ 2025-06-11 10:51:30,894 - httpcore.http11 - DEBUG - response_closed.started
18638
+ 2025-06-11 10:51:30,894 - httpcore.http11 - DEBUG - response_closed.complete
18639
+ 2025-06-11 10:51:30,894 - httpcore.connection - DEBUG - close.started
18640
+ 2025-06-11 10:51:30,894 - httpcore.connection - DEBUG - close.complete
18641
+ 2025-06-11 10:51:30,906 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=30 socket_options=None
18642
+ 2025-06-11 10:51:30,915 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x119317990>
18643
+ 2025-06-11 10:51:30,915 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x111d311c0> server_hostname='api.gradio.app' timeout=3
18644
+ 2025-06-11 10:51:31,035 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/initiated HTTP/1.1" 200 0
18645
+ 2025-06-11 10:51:31,064 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x119c67f90>
18646
+ 2025-06-11 10:51:31,064 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x11fae7f50> server_hostname='api.gradio.app' timeout=30
18647
+ 2025-06-11 10:51:31,200 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11a1284d0>
18648
+ 2025-06-11 10:51:31,201 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
18649
+ 2025-06-11 10:51:31,201 - httpcore.http11 - DEBUG - send_request_headers.complete
18650
+ 2025-06-11 10:51:31,201 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
18651
+ 2025-06-11 10:51:31,202 - httpcore.http11 - DEBUG - send_request_body.complete
18652
+ 2025-06-11 10:51:31,202 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
18653
+ 2025-06-11 10:51:31,345 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 01:51:31 GMT'), (b'Content-Type', b'application/json'), (b'Content-Length', b'21'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'Access-Control-Allow-Origin', b'*')])
18654
+ 2025-06-11 10:51:31,346 - httpx - INFO - HTTP Request: GET https://api.gradio.app/pkg-version "HTTP/1.1 200 OK"
18655
+ 2025-06-11 10:51:31,346 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
18656
+ 2025-06-11 10:51:31,346 - httpcore.http11 - DEBUG - receive_response_body.complete
18657
+ 2025-06-11 10:51:31,346 - httpcore.http11 - DEBUG - response_closed.started
18658
+ 2025-06-11 10:51:31,346 - httpcore.http11 - DEBUG - response_closed.complete
18659
+ 2025-06-11 10:51:31,347 - httpcore.connection - DEBUG - close.started
18660
+ 2025-06-11 10:51:31,347 - httpcore.connection - DEBUG - close.complete
18661
+ 2025-06-11 10:51:31,382 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x1198c9010>
18662
+ 2025-06-11 10:51:31,382 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
18663
+ 2025-06-11 10:51:31,383 - httpcore.http11 - DEBUG - send_request_headers.complete
18664
+ 2025-06-11 10:51:31,383 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
18665
+ 2025-06-11 10:51:31,383 - httpcore.http11 - DEBUG - send_request_body.complete
18666
+ 2025-06-11 10:51:31,383 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
18667
+ 2025-06-11 10:51:31,544 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 01:51:31 GMT'), (b'Content-Type', b'text/html; charset=utf-8'), (b'Transfer-Encoding', b'chunked'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'ContentType', b'application/json'), (b'Access-Control-Allow-Origin', b'*'), (b'Content-Encoding', b'gzip')])
18668
+ 2025-06-11 10:51:31,544 - httpx - INFO - HTTP Request: GET https://api.gradio.app/v3/tunnel-request "HTTP/1.1 200 OK"
18669
+ 2025-06-11 10:51:31,545 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
18670
+ 2025-06-11 10:51:31,545 - httpcore.http11 - DEBUG - receive_response_body.complete
18671
+ 2025-06-11 10:51:31,545 - httpcore.http11 - DEBUG - response_closed.started
18672
+ 2025-06-11 10:51:31,546 - httpcore.http11 - DEBUG - response_closed.complete
18673
+ 2025-06-11 10:51:31,546 - httpcore.connection - DEBUG - close.started
18674
+ 2025-06-11 10:51:31,546 - httpcore.connection - DEBUG - close.complete
18675
+ 2025-06-11 10:51:32,314 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
18676
+ 2025-06-11 10:51:32,526 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/launched HTTP/1.1" 200 0
18677
+ 2025-06-11 10:51:41,746 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
18678
+ 2025-06-11 10:51:41,746 - hardware_detector - INFO - Initializing HardwareDetector
18679
+ 2025-06-11 10:51:41,746 - simple_memory_calculator - INFO - Using known memory data for black-forest-labs/FLUX.1-schnell
18680
+ 2025-06-11 10:51:41,746 - hardware_detector - DEBUG - Starting system hardware detection
18681
+ 2025-06-11 10:51:41,747 - simple_memory_calculator - DEBUG - Known data: {'params_billions': 12.0, 'fp16_gb': 24.0, 'inference_fp16_gb': 36.0}
18682
+ 2025-06-11 10:51:41,747 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
18683
+ 2025-06-11 10:51:41,747 - simple_memory_calculator - INFO - Generating memory recommendations for black-forest-labs/FLUX.1-schnell with 8.0GB VRAM
18684
+ 2025-06-11 10:51:41,747 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
18685
+ 2025-06-11 10:51:41,747 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
18686
+ 2025-06-11 10:51:41,747 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
18687
+ 2025-06-11 10:51:41,747 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
18688
+ 2025-06-11 10:51:41,747 - simple_memory_calculator - DEBUG - Model memory: 24.0GB, Inference memory: 36.0GB
18689
+ 2025-06-11 10:51:41,748 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
18690
+ 2025-06-11 10:51:41,748 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
18691
+ 2025-06-11 10:51:41,754 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
18692
+ 2025-06-11 10:51:41,755 - hardware_detector - DEBUG - Checking PyTorch availability
18693
+ 2025-06-11 10:51:41,755 - hardware_detector - INFO - PyTorch 2.7.0 detected
18694
+ 2025-06-11 10:51:41,755 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
18695
+ 2025-06-11 10:51:41,755 - hardware_detector - INFO - Hardware detection completed successfully
18696
+ 2025-06-11 10:51:41,755 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
18697
+ 2025-06-11 10:58:51,900 - __main__ - INFO - Initializing GradioAutodiffusers
18698
+ 2025-06-11 10:58:51,900 - __main__ - DEBUG - API key found, length: 39
18699
+ 2025-06-11 10:58:51,900 - auto_diffusers - INFO - Initializing AutoDiffusersGenerator
18700
+ 2025-06-11 10:58:51,900 - auto_diffusers - DEBUG - API key length: 39
18701
+ 2025-06-11 10:58:51,900 - auto_diffusers - WARNING - Tool calling dependencies not available, running without tools
18702
+ 2025-06-11 10:58:51,900 - hardware_detector - INFO - Initializing HardwareDetector
18703
+ 2025-06-11 10:58:51,900 - hardware_detector - DEBUG - Starting system hardware detection
18704
+ 2025-06-11 10:58:51,900 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
18705
+ 2025-06-11 10:58:51,900 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
18706
+ 2025-06-11 10:58:51,900 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
18707
+ 2025-06-11 10:58:51,904 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
18708
+ 2025-06-11 10:58:51,904 - hardware_detector - DEBUG - Checking PyTorch availability
18709
+ 2025-06-11 10:58:52,365 - hardware_detector - INFO - PyTorch 2.7.0 detected
18710
+ 2025-06-11 10:58:52,365 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
18711
+ 2025-06-11 10:58:52,365 - hardware_detector - INFO - Hardware detection completed successfully
18712
+ 2025-06-11 10:58:52,365 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
18713
+ 2025-06-11 10:58:52,365 - auto_diffusers - INFO - Hardware detector initialized successfully
18714
+ 2025-06-11 10:58:52,365 - __main__ - INFO - AutoDiffusersGenerator initialized successfully
18715
+ 2025-06-11 10:58:52,365 - simple_memory_calculator - INFO - Initializing SimpleMemoryCalculator
18716
+ 2025-06-11 10:58:52,365 - simple_memory_calculator - DEBUG - HuggingFace API initialized
18717
+ 2025-06-11 10:58:52,365 - simple_memory_calculator - DEBUG - Known models in database: 4
18718
+ 2025-06-11 10:58:52,365 - __main__ - INFO - SimpleMemoryCalculator initialized successfully
18719
+ 2025-06-11 10:58:52,365 - __main__ - DEBUG - Default model settings: gemini-2.5-flash-preview-05-20, temp=0.7
18720
+ 2025-06-11 10:58:52,368 - asyncio - DEBUG - Using selector: KqueueSelector
18721
+ 2025-06-11 10:58:52,381 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=3 socket_options=None
18722
+ 2025-06-11 10:58:52,388 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
18723
+ 2025-06-11 10:58:52,468 - asyncio - DEBUG - Using selector: KqueueSelector
18724
+ 2025-06-11 10:58:52,500 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=None socket_options=None
18725
+ 2025-06-11 10:58:52,501 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11979ae90>
18726
+ 2025-06-11 10:58:52,501 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
18727
+ 2025-06-11 10:58:52,501 - httpcore.http11 - DEBUG - send_request_headers.complete
18728
+ 2025-06-11 10:58:52,501 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
18729
+ 2025-06-11 10:58:52,502 - httpcore.http11 - DEBUG - send_request_body.complete
18730
+ 2025-06-11 10:58:52,502 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
18731
+ 2025-06-11 10:58:52,502 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 01:58:52 GMT'), (b'server', b'uvicorn'), (b'content-length', b'4'), (b'content-type', b'application/json')])
18732
+ 2025-06-11 10:58:52,502 - httpx - INFO - HTTP Request: GET http://localhost:7860/gradio_api/startup-events "HTTP/1.1 200 OK"
18733
+ 2025-06-11 10:58:52,502 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
18734
+ 2025-06-11 10:58:52,502 - httpcore.http11 - DEBUG - receive_response_body.complete
18735
+ 2025-06-11 10:58:52,502 - httpcore.http11 - DEBUG - response_closed.started
18736
+ 2025-06-11 10:58:52,502 - httpcore.http11 - DEBUG - response_closed.complete
18737
+ 2025-06-11 10:58:52,502 - httpcore.connection - DEBUG - close.started
18738
+ 2025-06-11 10:58:52,502 - httpcore.connection - DEBUG - close.complete
18739
+ 2025-06-11 10:58:52,503 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=3 socket_options=None
18740
+ 2025-06-11 10:58:52,503 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11e0c3990>
18741
+ 2025-06-11 10:58:52,503 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'HEAD']>
18742
+ 2025-06-11 10:58:52,503 - httpcore.http11 - DEBUG - send_request_headers.complete
18743
+ 2025-06-11 10:58:52,503 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'HEAD']>
18744
+ 2025-06-11 10:58:52,503 - httpcore.http11 - DEBUG - send_request_body.complete
18745
+ 2025-06-11 10:58:52,503 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'HEAD']>
18746
+ 2025-06-11 10:58:52,510 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 01:58:52 GMT'), (b'server', b'uvicorn'), (b'content-length', b'145792'), (b'content-type', b'text/html; charset=utf-8')])
18747
+ 2025-06-11 10:58:52,510 - httpx - INFO - HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
18748
+ 2025-06-11 10:58:52,510 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'HEAD']>
18749
+ 2025-06-11 10:58:52,510 - httpcore.http11 - DEBUG - receive_response_body.complete
18750
+ 2025-06-11 10:58:52,510 - httpcore.http11 - DEBUG - response_closed.started
18751
+ 2025-06-11 10:58:52,511 - httpcore.http11 - DEBUG - response_closed.complete
18752
+ 2025-06-11 10:58:52,511 - httpcore.connection - DEBUG - close.started
18753
+ 2025-06-11 10:58:52,511 - httpcore.connection - DEBUG - close.complete
18754
+ 2025-06-11 10:58:52,522 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=30 socket_options=None
18755
+ 2025-06-11 10:58:52,627 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x119093c50>
18756
+ 2025-06-11 10:58:52,627 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x107d31370> server_hostname='api.gradio.app' timeout=3
18757
+ 2025-06-11 10:58:52,662 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11e139450>
18758
+ 2025-06-11 10:58:52,662 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x11e0c8a70> server_hostname='api.gradio.app' timeout=30
18759
+ 2025-06-11 10:58:52,671 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/initiated HTTP/1.1" 200 0
18760
+ 2025-06-11 10:58:52,933 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11956d810>
18761
+ 2025-06-11 10:58:52,933 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
18762
+ 2025-06-11 10:58:52,933 - httpcore.http11 - DEBUG - send_request_headers.complete
18763
+ 2025-06-11 10:58:52,933 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
18764
+ 2025-06-11 10:58:52,933 - httpcore.http11 - DEBUG - send_request_body.complete
18765
+ 2025-06-11 10:58:52,933 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
18766
+ 2025-06-11 10:58:52,944 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x118fc5fd0>
18767
+ 2025-06-11 10:58:52,944 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
18768
+ 2025-06-11 10:58:52,944 - httpcore.http11 - DEBUG - send_request_headers.complete
18769
+ 2025-06-11 10:58:52,944 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
18770
2025-06-11 10:58:52,944 - httpcore.http11 - DEBUG - send_request_body.complete
2025-06-11 10:58:52,945 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
2025-06-11 10:58:53,082 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 01:58:53 GMT'), (b'Content-Type', b'application/json'), (b'Content-Length', b'21'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'Access-Control-Allow-Origin', b'*')])
2025-06-11 10:58:53,082 - httpx - INFO - HTTP Request: GET https://api.gradio.app/pkg-version "HTTP/1.1 200 OK"
2025-06-11 10:58:53,083 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
2025-06-11 10:58:53,083 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 10:58:53,083 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 10:58:53,083 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 10:58:53,083 - httpcore.connection - DEBUG - close.started
2025-06-11 10:58:53,084 - httpcore.connection - DEBUG - close.complete
2025-06-11 10:58:53,087 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 01:58:53 GMT'), (b'Content-Type', b'text/html; charset=utf-8'), (b'Transfer-Encoding', b'chunked'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'ContentType', b'application/json'), (b'Access-Control-Allow-Origin', b'*'), (b'Content-Encoding', b'gzip')])
2025-06-11 10:58:53,087 - httpx - INFO - HTTP Request: GET https://api.gradio.app/v3/tunnel-request "HTTP/1.1 200 OK"
2025-06-11 10:58:53,088 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
2025-06-11 10:58:53,089 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 10:58:53,089 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 10:58:53,089 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 10:58:53,089 - httpcore.connection - DEBUG - close.started
2025-06-11 10:58:53,090 - httpcore.connection - DEBUG - close.complete
2025-06-11 10:58:53,778 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
2025-06-11 10:58:54,003 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/launched HTTP/1.1" 200 0
18790
2025-06-11 10:58:59,726 - hardware_detector - INFO - Initializing HardwareDetector
2025-06-11 10:58:59,726 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
2025-06-11 10:58:59,727 - hardware_detector - DEBUG - Starting system hardware detection
2025-06-11 10:58:59,727 - simple_memory_calculator - INFO - Using known memory data for black-forest-labs/FLUX.1-schnell
2025-06-11 10:58:59,727 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
2025-06-11 10:58:59,727 - simple_memory_calculator - DEBUG - Known data: {'params_billions': 12.0, 'fp16_gb': 24.0, 'inference_fp16_gb': 36.0}
2025-06-11 10:58:59,727 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
2025-06-11 10:58:59,727 - simple_memory_calculator - INFO - Generating memory recommendations for black-forest-labs/FLUX.1-schnell with 8.0GB VRAM
2025-06-11 10:58:59,727 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
2025-06-11 10:58:59,727 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
2025-06-11 10:58:59,727 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
2025-06-11 10:58:59,727 - simple_memory_calculator - DEBUG - Model memory: 24.0GB, Inference memory: 36.0GB
2025-06-11 10:58:59,731 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
2025-06-11 10:58:59,732 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
2025-06-11 10:58:59,734 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
2025-06-11 10:58:59,734 - hardware_detector - DEBUG - Checking PyTorch availability
2025-06-11 10:58:59,734 - hardware_detector - INFO - PyTorch 2.7.0 detected
2025-06-11 10:58:59,734 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
2025-06-11 10:58:59,734 - hardware_detector - INFO - Hardware detection completed successfully
2025-06-11 10:58:59,734 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
2025-06-11 10:59:29,945 - hardware_detector - INFO - Initializing HardwareDetector
2025-06-11 10:59:29,946 - hardware_detector - DEBUG - Starting system hardware detection
2025-06-11 10:59:29,946 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
2025-06-11 10:59:29,946 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
2025-06-11 10:59:29,946 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
2025-06-11 10:59:29,955 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
2025-06-11 10:59:29,956 - hardware_detector - DEBUG - Checking PyTorch availability
2025-06-11 10:59:29,956 - hardware_detector - INFO - PyTorch 2.7.0 detected
2025-06-11 10:59:29,956 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
2025-06-11 10:59:29,956 - hardware_detector - INFO - Hardware detection completed successfully
2025-06-11 10:59:29,956 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
18821
2025-06-11 11:02:06,705 - __main__ - INFO - Initializing GradioAutodiffusers
2025-06-11 11:02:06,705 - __main__ - DEBUG - API key found, length: 39
2025-06-11 11:02:06,705 - auto_diffusers - INFO - Initializing AutoDiffusersGenerator
2025-06-11 11:02:06,705 - auto_diffusers - DEBUG - API key length: 39
2025-06-11 11:02:06,705 - auto_diffusers - WARNING - Tool calling dependencies not available, running without tools
2025-06-11 11:02:06,705 - hardware_detector - INFO - Initializing HardwareDetector
2025-06-11 11:02:06,705 - hardware_detector - DEBUG - Starting system hardware detection
2025-06-11 11:02:06,705 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
2025-06-11 11:02:06,705 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
2025-06-11 11:02:06,705 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
2025-06-11 11:02:06,708 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
2025-06-11 11:02:06,708 - hardware_detector - DEBUG - Checking PyTorch availability
2025-06-11 11:02:07,162 - hardware_detector - INFO - PyTorch 2.7.0 detected
2025-06-11 11:02:07,162 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
2025-06-11 11:02:07,162 - hardware_detector - INFO - Hardware detection completed successfully
2025-06-11 11:02:07,162 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
2025-06-11 11:02:07,162 - auto_diffusers - INFO - Hardware detector initialized successfully
2025-06-11 11:02:07,162 - __main__ - INFO - AutoDiffusersGenerator initialized successfully
2025-06-11 11:02:07,162 - simple_memory_calculator - INFO - Initializing SimpleMemoryCalculator
2025-06-11 11:02:07,162 - simple_memory_calculator - DEBUG - HuggingFace API initialized
2025-06-11 11:02:07,162 - simple_memory_calculator - DEBUG - Known models in database: 4
2025-06-11 11:02:07,162 - __main__ - INFO - SimpleMemoryCalculator initialized successfully
2025-06-11 11:02:07,162 - __main__ - DEBUG - Default model settings: gemini-2.5-flash-preview-05-20, temp=0.7
2025-06-11 11:02:07,164 - asyncio - DEBUG - Using selector: KqueueSelector
2025-06-11 11:02:07,177 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=3 socket_options=None
2025-06-11 11:02:07,184 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
2025-06-11 11:02:07,259 - asyncio - DEBUG - Using selector: KqueueSelector
2025-06-11 11:02:07,291 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=None socket_options=None
2025-06-11 11:02:07,292 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12cca70d0>
2025-06-11 11:02:07,292 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
2025-06-11 11:02:07,292 - httpcore.http11 - DEBUG - send_request_headers.complete
2025-06-11 11:02:07,292 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
2025-06-11 11:02:07,292 - httpcore.http11 - DEBUG - send_request_body.complete
2025-06-11 11:02:07,292 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
2025-06-11 11:02:07,293 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:02:07 GMT'), (b'server', b'uvicorn'), (b'content-length', b'4'), (b'content-type', b'application/json')])
2025-06-11 11:02:07,293 - httpx - INFO - HTTP Request: GET http://localhost:7860/gradio_api/startup-events "HTTP/1.1 200 OK"
2025-06-11 11:02:07,293 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
2025-06-11 11:02:07,293 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 11:02:07,293 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 11:02:07,293 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 11:02:07,293 - httpcore.connection - DEBUG - close.started
2025-06-11 11:02:07,293 - httpcore.connection - DEBUG - close.complete
2025-06-11 11:02:07,293 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=3 socket_options=None
2025-06-11 11:02:07,294 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12f9793d0>
2025-06-11 11:02:07,294 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'HEAD']>
2025-06-11 11:02:07,294 - httpcore.http11 - DEBUG - send_request_headers.complete
2025-06-11 11:02:07,294 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'HEAD']>
2025-06-11 11:02:07,294 - httpcore.http11 - DEBUG - send_request_body.complete
2025-06-11 11:02:07,294 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'HEAD']>
2025-06-11 11:02:07,301 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:02:07 GMT'), (b'server', b'uvicorn'), (b'content-length', b'145791'), (b'content-type', b'text/html; charset=utf-8')])
2025-06-11 11:02:07,301 - httpx - INFO - HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
2025-06-11 11:02:07,302 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'HEAD']>
2025-06-11 11:02:07,302 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 11:02:07,302 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 11:02:07,302 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 11:02:07,302 - httpcore.connection - DEBUG - close.started
2025-06-11 11:02:07,302 - httpcore.connection - DEBUG - close.complete
2025-06-11 11:02:07,313 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=30 socket_options=None
2025-06-11 11:02:07,341 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12d6ce890>
2025-06-11 11:02:07,341 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x12d5aa8d0> server_hostname='api.gradio.app' timeout=3
2025-06-11 11:02:07,459 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/initiated HTTP/1.1" 200 0
2025-06-11 11:02:07,459 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12cf2e010>
2025-06-11 11:02:07,459 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x12f96cb00> server_hostname='api.gradio.app' timeout=30
2025-06-11 11:02:07,614 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12f877590>
2025-06-11 11:02:07,615 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
2025-06-11 11:02:07,615 - httpcore.http11 - DEBUG - send_request_headers.complete
2025-06-11 11:02:07,616 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
2025-06-11 11:02:07,616 - httpcore.http11 - DEBUG - send_request_body.complete
2025-06-11 11:02:07,616 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
2025-06-11 11:02:07,752 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:02:07 GMT'), (b'Content-Type', b'application/json'), (b'Content-Length', b'21'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'Access-Control-Allow-Origin', b'*')])
2025-06-11 11:02:07,753 - httpx - INFO - HTTP Request: GET https://api.gradio.app/pkg-version "HTTP/1.1 200 OK"
2025-06-11 11:02:07,753 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
2025-06-11 11:02:07,753 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 11:02:07,753 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 11:02:07,753 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 11:02:07,753 - httpcore.connection - DEBUG - close.started
2025-06-11 11:02:07,753 - httpcore.connection - DEBUG - close.complete
2025-06-11 11:02:07,761 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11b064750>
2025-06-11 11:02:07,761 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
2025-06-11 11:02:07,761 - httpcore.http11 - DEBUG - send_request_headers.complete
2025-06-11 11:02:07,761 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
2025-06-11 11:02:07,761 - httpcore.http11 - DEBUG - send_request_body.complete
2025-06-11 11:02:07,761 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
2025-06-11 11:02:07,910 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:02:07 GMT'), (b'Content-Type', b'text/html; charset=utf-8'), (b'Transfer-Encoding', b'chunked'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'ContentType', b'application/json'), (b'Access-Control-Allow-Origin', b'*'), (b'Content-Encoding', b'gzip')])
2025-06-11 11:02:07,910 - httpx - INFO - HTTP Request: GET https://api.gradio.app/v3/tunnel-request "HTTP/1.1 200 OK"
2025-06-11 11:02:07,910 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
2025-06-11 11:02:07,910 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 11:02:07,910 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 11:02:07,910 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 11:02:07,910 - httpcore.connection - DEBUG - close.started
2025-06-11 11:02:07,910 - httpcore.connection - DEBUG - close.complete
2025-06-11 11:02:08,533 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
2025-06-11 11:02:08,757 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/launched HTTP/1.1" 200 0
18914
2025-06-11 11:02:13,522 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
2025-06-11 11:02:13,522 - simple_memory_calculator - INFO - Using known memory data for black-forest-labs/FLUX.1-schnell
2025-06-11 11:02:13,522 - hardware_detector - INFO - Initializing HardwareDetector
2025-06-11 11:02:13,522 - simple_memory_calculator - DEBUG - Known data: {'params_billions': 12.0, 'fp16_gb': 24.0, 'inference_fp16_gb': 36.0}
2025-06-11 11:02:13,522 - hardware_detector - DEBUG - Starting system hardware detection
2025-06-11 11:02:13,522 - simple_memory_calculator - INFO - Generating memory recommendations for black-forest-labs/FLUX.1-schnell with 8.0GB VRAM
2025-06-11 11:02:13,522 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
2025-06-11 11:02:13,522 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
2025-06-11 11:02:13,522 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
2025-06-11 11:02:13,522 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
2025-06-11 11:02:13,522 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
2025-06-11 11:02:13,522 - simple_memory_calculator - DEBUG - Model memory: 24.0GB, Inference memory: 36.0GB
2025-06-11 11:02:13,523 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
2025-06-11 11:02:13,523 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
2025-06-11 11:02:13,528 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
2025-06-11 11:02:13,529 - hardware_detector - DEBUG - Checking PyTorch availability
2025-06-11 11:02:13,529 - hardware_detector - INFO - PyTorch 2.7.0 detected
2025-06-11 11:02:13,529 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
2025-06-11 11:02:13,529 - hardware_detector - INFO - Hardware detection completed successfully
2025-06-11 11:02:13,529 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
2025-06-11 11:02:13,529 - __main__ - INFO - 🔍 DEBUG: Full detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
2025-06-11 11:02:13,529 - __main__ - INFO - 🔍 DEBUG: Platform: Darwin
2025-06-11 11:02:13,529 - __main__ - INFO - 🔍 DEBUG: Architecture: arm64
2025-06-11 11:02:13,529 - __main__ - INFO - 🔍 DEBUG: MPS Available: True
2025-06-11 11:02:13,529 - __main__ - INFO - 🔍 DEBUG: Is Apple Silicon: True
2025-06-11 11:02:13,529 - __main__ - INFO - 🔍 DEBUG: GPU Info: None
2025-06-11 11:02:13,529 - __main__ - INFO - 🔍 DEBUG: Detected RAM (GB): 16
2025-06-11 11:02:13,783 - __main__ - INFO - 🔍 DEBUG: PSUtil detected 128GB unified memory
2025-06-11 11:02:13,878 - __main__ - INFO - 🔍 DEBUG: System profiler output: hardware:

hardware overview:

model name: macbook pro
model identifier: mac16,5
model number: z1fs0002mkh/a
chip: apple m4 max
total number of cores: 16 (12 performance and 4 efficiency)
memory: 128 gb
system firmware version: 11881.61.3
os loader version: 11881.61.3
serial number (system): kkvqcmx4dt
hardware uuid: 92bfa67e-d816-5b1d-99bb-f9a2824999ba
provisioning udid: 00006041-001269200280801c
activation lock status: enabled


2025-06-11 11:02:13,878 - __main__ - INFO - 🔍 DEBUG: Detected Apple chip: M4 Max
2025-06-11 11:02:13,878 - __main__ - INFO - 🔍 DEBUG: Final values - Platform: Apple Silicon, GPU Vendor: Apple Silicon, GPU Name: M4 Max, Unified RAM: 128GB
18962
2025-06-11 11:04:13,169 - __main__ - INFO - Initializing GradioAutodiffusers
2025-06-11 11:04:13,169 - __main__ - DEBUG - API key found, length: 39
2025-06-11 11:04:13,169 - auto_diffusers - INFO - Initializing AutoDiffusersGenerator
2025-06-11 11:04:13,169 - auto_diffusers - DEBUG - API key length: 39
2025-06-11 11:04:13,169 - auto_diffusers - WARNING - Tool calling dependencies not available, running without tools
2025-06-11 11:04:13,169 - hardware_detector - INFO - Initializing HardwareDetector
2025-06-11 11:04:13,169 - hardware_detector - DEBUG - Starting system hardware detection
2025-06-11 11:04:13,169 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
2025-06-11 11:04:13,169 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
2025-06-11 11:04:13,169 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
2025-06-11 11:04:13,173 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
2025-06-11 11:04:13,173 - hardware_detector - DEBUG - Checking PyTorch availability
2025-06-11 11:04:13,635 - hardware_detector - INFO - PyTorch 2.7.0 detected
2025-06-11 11:04:13,635 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
2025-06-11 11:04:13,636 - hardware_detector - INFO - Hardware detection completed successfully
2025-06-11 11:04:13,636 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
2025-06-11 11:04:13,636 - auto_diffusers - INFO - Hardware detector initialized successfully
2025-06-11 11:04:13,636 - __main__ - INFO - AutoDiffusersGenerator initialized successfully
2025-06-11 11:04:13,636 - simple_memory_calculator - INFO - Initializing SimpleMemoryCalculator
2025-06-11 11:04:13,636 - simple_memory_calculator - DEBUG - HuggingFace API initialized
2025-06-11 11:04:13,636 - simple_memory_calculator - DEBUG - Known models in database: 4
2025-06-11 11:04:13,636 - __main__ - INFO - SimpleMemoryCalculator initialized successfully
2025-06-11 11:04:13,636 - __main__ - DEBUG - Default model settings: gemini-2.5-flash-preview-05-20, temp=0.7
2025-06-11 11:04:13,638 - asyncio - DEBUG - Using selector: KqueueSelector
2025-06-11 11:04:13,652 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=3 socket_options=None
2025-06-11 11:04:13,657 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
2025-06-11 11:04:13,732 - asyncio - DEBUG - Using selector: KqueueSelector
2025-06-11 11:04:13,765 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=None socket_options=None
2025-06-11 11:04:13,766 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11f95aed0>
2025-06-11 11:04:13,766 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
2025-06-11 11:04:13,766 - httpcore.http11 - DEBUG - send_request_headers.complete
2025-06-11 11:04:13,766 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
2025-06-11 11:04:13,766 - httpcore.http11 - DEBUG - send_request_body.complete
2025-06-11 11:04:13,766 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
2025-06-11 11:04:13,767 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:04:13 GMT'), (b'server', b'uvicorn'), (b'content-length', b'4'), (b'content-type', b'application/json')])
2025-06-11 11:04:13,767 - httpx - INFO - HTTP Request: GET http://localhost:7860/gradio_api/startup-events "HTTP/1.1 200 OK"
2025-06-11 11:04:13,767 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
2025-06-11 11:04:13,767 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 11:04:13,767 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 11:04:13,767 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 11:04:13,767 - httpcore.connection - DEBUG - close.started
2025-06-11 11:04:13,767 - httpcore.connection - DEBUG - close.complete
2025-06-11 11:04:13,767 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=3 socket_options=None
2025-06-11 11:04:13,768 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11f9707d0>
2025-06-11 11:04:13,768 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'HEAD']>
2025-06-11 11:04:13,768 - httpcore.http11 - DEBUG - send_request_headers.complete
2025-06-11 11:04:13,768 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'HEAD']>
2025-06-11 11:04:13,768 - httpcore.http11 - DEBUG - send_request_body.complete
2025-06-11 11:04:13,768 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'HEAD']>
2025-06-11 11:04:13,775 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:04:13 GMT'), (b'server', b'uvicorn'), (b'content-length', b'144016'), (b'content-type', b'text/html; charset=utf-8')])
2025-06-11 11:04:13,775 - httpx - INFO - HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
2025-06-11 11:04:13,775 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'HEAD']>
2025-06-11 11:04:13,775 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 11:04:13,775 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 11:04:13,775 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 11:04:13,775 - httpcore.connection - DEBUG - close.started
2025-06-11 11:04:13,775 - httpcore.connection - DEBUG - close.complete
2025-06-11 11:04:13,787 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=30 socket_options=None
2025-06-11 11:04:13,828 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11cd75e50>
2025-06-11 11:04:13,828 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x109d35370> server_hostname='api.gradio.app' timeout=3
2025-06-11 11:04:13,937 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11f9d0f90>
2025-06-11 11:04:13,937 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x11f960b00> server_hostname='api.gradio.app' timeout=30
2025-06-11 11:04:13,939 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/initiated HTTP/1.1" 200 0
2025-06-11 11:04:14,124 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11b820d10>
2025-06-11 11:04:14,124 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
2025-06-11 11:04:14,125 - httpcore.http11 - DEBUG - send_request_headers.complete
2025-06-11 11:04:14,125 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
2025-06-11 11:04:14,125 - httpcore.http11 - DEBUG - send_request_body.complete
2025-06-11 11:04:14,126 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
2025-06-11 11:04:14,240 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x119caf6d0>
2025-06-11 11:04:14,241 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
2025-06-11 11:04:14,241 - httpcore.http11 - DEBUG - send_request_headers.complete
2025-06-11 11:04:14,241 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
2025-06-11 11:04:14,241 - httpcore.http11 - DEBUG - send_request_body.complete
2025-06-11 11:04:14,241 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
2025-06-11 11:04:14,272 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:04:14 GMT'), (b'Content-Type', b'application/json'), (b'Content-Length', b'21'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'Access-Control-Allow-Origin', b'*')])
2025-06-11 11:04:14,274 - httpx - INFO - HTTP Request: GET https://api.gradio.app/pkg-version "HTTP/1.1 200 OK"
2025-06-11 11:04:14,275 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
2025-06-11 11:04:14,275 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 11:04:14,275 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 11:04:14,275 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 11:04:14,275 - httpcore.connection - DEBUG - close.started
2025-06-11 11:04:14,276 - httpcore.connection - DEBUG - close.complete
2025-06-11 11:04:14,391 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:04:14 GMT'), (b'Content-Type', b'text/html; charset=utf-8'), (b'Transfer-Encoding', b'chunked'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'ContentType', b'application/json'), (b'Access-Control-Allow-Origin', b'*'), (b'Content-Encoding', b'gzip')])
2025-06-11 11:04:14,391 - httpx - INFO - HTTP Request: GET https://api.gradio.app/v3/tunnel-request "HTTP/1.1 200 OK"
2025-06-11 11:04:14,392 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
2025-06-11 11:04:14,392 - httpcore.http11 - DEBUG - receive_response_body.complete
2025-06-11 11:04:14,392 - httpcore.http11 - DEBUG - response_closed.started
2025-06-11 11:04:14,392 - httpcore.http11 - DEBUG - response_closed.complete
2025-06-11 11:04:14,392 - httpcore.connection - DEBUG - close.started
2025-06-11 11:04:14,392 - httpcore.connection - DEBUG - close.complete
2025-06-11 11:04:14,994 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
2025-06-11 11:04:15,564 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/launched HTTP/1.1" 200 0
19055
2025-06-11 11:05:42,002 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
2025-06-11 11:05:42,003 - simple_memory_calculator - INFO - Using known memory data for black-forest-labs/FLUX.1-schnell
2025-06-11 11:05:42,003 - simple_memory_calculator - DEBUG - Known data: {'params_billions': 12.0, 'fp16_gb': 24.0, 'inference_fp16_gb': 36.0}
2025-06-11 11:05:42,003 - simple_memory_calculator - INFO - Generating memory recommendations for black-forest-labs/FLUX.1-schnell with 8.0GB VRAM
2025-06-11 11:05:42,003 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
2025-06-11 11:05:42,003 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
2025-06-11 11:05:42,003 - simple_memory_calculator - DEBUG - Model memory: 24.0GB, Inference memory: 36.0GB
2025-06-11 11:05:42,003 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
2025-06-11 11:05:42,004 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
2025-06-11 11:07:51,377 - __main__ - INFO - Initializing GradioAutodiffusers
2025-06-11 11:07:51,377 - __main__ - DEBUG - API key found, length: 39
2025-06-11 11:07:51,377 - auto_diffusers - INFO - Initializing AutoDiffusersGenerator
2025-06-11 11:07:51,377 - auto_diffusers - DEBUG - API key length: 39
2025-06-11 11:07:51,377 - auto_diffusers - WARNING - Tool calling dependencies not available, running without tools
2025-06-11 11:07:51,377 - hardware_detector - INFO - Initializing HardwareDetector
2025-06-11 11:07:51,377 - hardware_detector - DEBUG - Starting system hardware detection
2025-06-11 11:07:51,377 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
2025-06-11 11:07:51,377 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
2025-06-11 11:07:51,377 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
2025-06-11 11:07:51,380 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
2025-06-11 11:07:51,381 - hardware_detector - DEBUG - Checking PyTorch availability
2025-06-11 11:07:51,843 - hardware_detector - INFO - PyTorch 2.7.0 detected
2025-06-11 11:07:51,843 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
2025-06-11 11:07:51,843 - hardware_detector - INFO - Hardware detection completed successfully
2025-06-11 11:07:51,843 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
2025-06-11 11:07:51,843 - auto_diffusers - INFO - Hardware detector initialized successfully
2025-06-11 11:07:51,843 - __main__ - INFO - AutoDiffusersGenerator initialized successfully
2025-06-11 11:07:51,843 - simple_memory_calculator - INFO - Initializing SimpleMemoryCalculator
2025-06-11 11:07:51,843 - simple_memory_calculator - DEBUG - HuggingFace API initialized
19084
+ 2025-06-11 11:07:51,843 - simple_memory_calculator - DEBUG - Known models in database: 4
19085
+ 2025-06-11 11:07:51,843 - __main__ - INFO - SimpleMemoryCalculator initialized successfully
19086
+ 2025-06-11 11:07:51,843 - __main__ - DEBUG - Default model settings: gemini-2.5-flash-preview-05-20, temp=0.7
19087
+ 2025-06-11 11:07:51,845 - asyncio - DEBUG - Using selector: KqueueSelector
19088
+ 2025-06-11 11:07:51,859 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=3 socket_options=None
19089
+ 2025-06-11 11:07:51,859 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
19090
+ 2025-06-11 11:07:51,938 - asyncio - DEBUG - Using selector: KqueueSelector
19091
+ 2025-06-11 11:07:51,968 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=None socket_options=None
19092
+ 2025-06-11 11:07:51,969 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x1266d1610>
19093
+ 2025-06-11 11:07:51,969 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
19094
+ 2025-06-11 11:07:51,969 - httpcore.http11 - DEBUG - send_request_headers.complete
19095
+ 2025-06-11 11:07:51,969 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
19096
+ 2025-06-11 11:07:51,969 - httpcore.http11 - DEBUG - send_request_body.complete
19097
+ 2025-06-11 11:07:51,969 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
19098
+ 2025-06-11 11:07:51,970 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:07:51 GMT'), (b'server', b'uvicorn'), (b'content-length', b'4'), (b'content-type', b'application/json')])
19099
+ 2025-06-11 11:07:51,970 - httpx - INFO - HTTP Request: GET http://localhost:7860/gradio_api/startup-events "HTTP/1.1 200 OK"
19100
+ 2025-06-11 11:07:51,970 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
19101
+ 2025-06-11 11:07:51,970 - httpcore.http11 - DEBUG - receive_response_body.complete
19102
+ 2025-06-11 11:07:51,970 - httpcore.http11 - DEBUG - response_closed.started
19103
+ 2025-06-11 11:07:51,970 - httpcore.http11 - DEBUG - response_closed.complete
19104
+ 2025-06-11 11:07:51,970 - httpcore.connection - DEBUG - close.started
19105
+ 2025-06-11 11:07:51,970 - httpcore.connection - DEBUG - close.complete
19106
+ 2025-06-11 11:07:51,971 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=3 socket_options=None
19107
+ 2025-06-11 11:07:51,971 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x127b5b750>
19108
+ 2025-06-11 11:07:51,971 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'HEAD']>
19109
+ 2025-06-11 11:07:51,971 - httpcore.http11 - DEBUG - send_request_headers.complete
19110
+ 2025-06-11 11:07:51,971 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'HEAD']>
19111
+ 2025-06-11 11:07:51,971 - httpcore.http11 - DEBUG - send_request_body.complete
19112
+ 2025-06-11 11:07:51,971 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'HEAD']>
19113
+ 2025-06-11 11:07:51,978 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:07:51 GMT'), (b'server', b'uvicorn'), (b'content-length', b'140375'), (b'content-type', b'text/html; charset=utf-8')])
19114
+ 2025-06-11 11:07:51,978 - httpx - INFO - HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
19115
+ 2025-06-11 11:07:51,978 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'HEAD']>
19116
+ 2025-06-11 11:07:51,978 - httpcore.http11 - DEBUG - receive_response_body.complete
19117
+ 2025-06-11 11:07:51,978 - httpcore.http11 - DEBUG - response_closed.started
19118
+ 2025-06-11 11:07:51,978 - httpcore.http11 - DEBUG - response_closed.complete
19119
+ 2025-06-11 11:07:51,978 - httpcore.connection - DEBUG - close.started
19120
+ 2025-06-11 11:07:51,978 - httpcore.connection - DEBUG - close.complete
19121
+ 2025-06-11 11:07:51,990 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=30 socket_options=None
19122
+ 2025-06-11 11:07:52,029 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x1264bdd50>
19123
+ 2025-06-11 11:07:52,029 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x1263aa840> server_hostname='api.gradio.app' timeout=3
19124
+ 2025-06-11 11:07:52,122 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x127bd9110>
19125
+ 2025-06-11 11:07:52,122 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x127b64b00> server_hostname='api.gradio.app' timeout=30
19126
+ 2025-06-11 11:07:52,188 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/initiated HTTP/1.1" 200 0
19127
+ 2025-06-11 11:07:52,325 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x125acf010>
19128
+ 2025-06-11 11:07:52,325 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
19129
+ 2025-06-11 11:07:52,325 - httpcore.http11 - DEBUG - send_request_headers.complete
19130
+ 2025-06-11 11:07:52,326 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
19131
+ 2025-06-11 11:07:52,326 - httpcore.http11 - DEBUG - send_request_body.complete
19132
+ 2025-06-11 11:07:52,326 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
19133
+ 2025-06-11 11:07:52,388 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x125dc7210>
19134
+ 2025-06-11 11:07:52,388 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
19135
+ 2025-06-11 11:07:52,389 - httpcore.http11 - DEBUG - send_request_headers.complete
19136
+ 2025-06-11 11:07:52,389 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
19137
+ 2025-06-11 11:07:52,389 - httpcore.http11 - DEBUG - send_request_body.complete
19138
+ 2025-06-11 11:07:52,389 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
19139
+ 2025-06-11 11:07:52,474 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:07:52 GMT'), (b'Content-Type', b'application/json'), (b'Content-Length', b'21'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'Access-Control-Allow-Origin', b'*')])
19140
+ 2025-06-11 11:07:52,475 - httpx - INFO - HTTP Request: GET https://api.gradio.app/pkg-version "HTTP/1.1 200 OK"
19141
+ 2025-06-11 11:07:52,475 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
19142
+ 2025-06-11 11:07:52,475 - httpcore.http11 - DEBUG - receive_response_body.complete
19143
+ 2025-06-11 11:07:52,475 - httpcore.http11 - DEBUG - response_closed.started
19144
+ 2025-06-11 11:07:52,475 - httpcore.http11 - DEBUG - response_closed.complete
19145
+ 2025-06-11 11:07:52,475 - httpcore.connection - DEBUG - close.started
19146
+ 2025-06-11 11:07:52,476 - httpcore.connection - DEBUG - close.complete
19147
+ 2025-06-11 11:07:52,524 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:07:52 GMT'), (b'Content-Type', b'text/html; charset=utf-8'), (b'Transfer-Encoding', b'chunked'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'ContentType', b'application/json'), (b'Access-Control-Allow-Origin', b'*'), (b'Content-Encoding', b'gzip')])
19148
+ 2025-06-11 11:07:52,524 - httpx - INFO - HTTP Request: GET https://api.gradio.app/v3/tunnel-request "HTTP/1.1 200 OK"
19149
+ 2025-06-11 11:07:52,524 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
19150
+ 2025-06-11 11:07:52,525 - httpcore.http11 - DEBUG - receive_response_body.complete
19151
+ 2025-06-11 11:07:52,525 - httpcore.http11 - DEBUG - response_closed.started
19152
+ 2025-06-11 11:07:52,525 - httpcore.http11 - DEBUG - response_closed.complete
19153
+ 2025-06-11 11:07:52,526 - httpcore.connection - DEBUG - close.started
19154
+ 2025-06-11 11:07:52,526 - httpcore.connection - DEBUG - close.complete
19155
+ 2025-06-11 11:07:53,161 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
19156
+ 2025-06-11 11:07:53,383 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/launched HTTP/1.1" 200 0
19157
+ 2025-06-11 11:07:56,235 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
19158
+ 2025-06-11 11:07:56,235 - simple_memory_calculator - INFO - Using known memory data for black-forest-labs/FLUX.1-schnell
19159
+ 2025-06-11 11:07:56,235 - simple_memory_calculator - DEBUG - Known data: {'params_billions': 12.0, 'fp16_gb': 24.0, 'inference_fp16_gb': 36.0}
19160
+ 2025-06-11 11:07:56,235 - simple_memory_calculator - INFO - Generating memory recommendations for black-forest-labs/FLUX.1-schnell with 8.0GB VRAM
19161
+ 2025-06-11 11:07:56,235 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
19162
+ 2025-06-11 11:07:56,235 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
19163
+ 2025-06-11 11:07:56,236 - simple_memory_calculator - DEBUG - Model memory: 24.0GB, Inference memory: 36.0GB
19164
+ 2025-06-11 11:07:56,236 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
19165
+ 2025-06-11 11:07:56,236 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
+ 2025-06-11 11:08:06,275 - __main__ - INFO - Initializing GradioAutodiffusers
+ 2025-06-11 11:08:06,275 - __main__ - DEBUG - API key found, length: 39
+ 2025-06-11 11:08:06,275 - auto_diffusers - INFO - Initializing AutoDiffusersGenerator
+ 2025-06-11 11:08:06,275 - auto_diffusers - DEBUG - API key length: 39
+ 2025-06-11 11:08:06,275 - auto_diffusers - WARNING - Tool calling dependencies not available, running without tools
+ 2025-06-11 11:08:06,275 - hardware_detector - INFO - Initializing HardwareDetector
+ 2025-06-11 11:08:06,275 - hardware_detector - DEBUG - Starting system hardware detection
+ 2025-06-11 11:08:06,275 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
+ 2025-06-11 11:08:06,275 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
+ 2025-06-11 11:08:06,275 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
+ 2025-06-11 11:08:06,278 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
+ 2025-06-11 11:08:06,278 - hardware_detector - DEBUG - Checking PyTorch availability
+ 2025-06-11 11:08:06,730 - hardware_detector - INFO - PyTorch 2.7.0 detected
+ 2025-06-11 11:08:06,730 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
+ 2025-06-11 11:08:06,730 - hardware_detector - INFO - Hardware detection completed successfully
+ 2025-06-11 11:08:06,730 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
+ 2025-06-11 11:08:06,730 - auto_diffusers - INFO - Hardware detector initialized successfully
+ 2025-06-11 11:08:06,730 - __main__ - INFO - AutoDiffusersGenerator initialized successfully
+ 2025-06-11 11:08:06,730 - simple_memory_calculator - INFO - Initializing SimpleMemoryCalculator
+ 2025-06-11 11:08:06,730 - simple_memory_calculator - DEBUG - HuggingFace API initialized
+ 2025-06-11 11:08:06,730 - simple_memory_calculator - DEBUG - Known models in database: 4
+ 2025-06-11 11:08:06,730 - __main__ - INFO - SimpleMemoryCalculator initialized successfully
+ 2025-06-11 11:08:06,730 - __main__ - DEBUG - Default model settings: gemini-2.5-flash-preview-05-20, temp=0.7
+ 2025-06-11 11:08:06,732 - asyncio - DEBUG - Using selector: KqueueSelector
+ 2025-06-11 11:08:06,745 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=3 socket_options=None
+ 2025-06-11 11:08:06,753 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
+ 2025-06-11 11:08:06,825 - asyncio - DEBUG - Using selector: KqueueSelector
+ 2025-06-11 11:08:06,858 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=None socket_options=None
+ 2025-06-11 11:08:06,858 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11a17f410>
+ 2025-06-11 11:08:06,858 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
+ 2025-06-11 11:08:06,859 - httpcore.http11 - DEBUG - send_request_headers.complete
+ 2025-06-11 11:08:06,859 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
+ 2025-06-11 11:08:06,859 - httpcore.http11 - DEBUG - send_request_body.complete
+ 2025-06-11 11:08:06,859 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
+ 2025-06-11 11:08:06,859 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:08:06 GMT'), (b'server', b'uvicorn'), (b'content-length', b'4'), (b'content-type', b'application/json')])
+ 2025-06-11 11:08:06,859 - httpx - INFO - HTTP Request: GET http://localhost:7860/gradio_api/startup-events "HTTP/1.1 200 OK"
+ 2025-06-11 11:08:06,859 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
+ 2025-06-11 11:08:06,860 - httpcore.http11 - DEBUG - receive_response_body.complete
+ 2025-06-11 11:08:06,860 - httpcore.http11 - DEBUG - response_closed.started
+ 2025-06-11 11:08:06,860 - httpcore.http11 - DEBUG - response_closed.complete
+ 2025-06-11 11:08:06,860 - httpcore.connection - DEBUG - close.started
+ 2025-06-11 11:08:06,860 - httpcore.connection - DEBUG - close.complete
+ 2025-06-11 11:08:06,860 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=3 socket_options=None
+ 2025-06-11 11:08:06,860 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11fb5f990>
+ 2025-06-11 11:08:06,860 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'HEAD']>
+ 2025-06-11 11:08:06,861 - httpcore.http11 - DEBUG - send_request_headers.complete
+ 2025-06-11 11:08:06,861 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'HEAD']>
+ 2025-06-11 11:08:06,861 - httpcore.http11 - DEBUG - send_request_body.complete
+ 2025-06-11 11:08:06,861 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'HEAD']>
+ 2025-06-11 11:08:06,867 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:08:06 GMT'), (b'server', b'uvicorn'), (b'content-length', b'142574'), (b'content-type', b'text/html; charset=utf-8')])
+ 2025-06-11 11:08:06,868 - httpx - INFO - HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
+ 2025-06-11 11:08:06,868 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'HEAD']>
+ 2025-06-11 11:08:06,868 - httpcore.http11 - DEBUG - receive_response_body.complete
+ 2025-06-11 11:08:06,868 - httpcore.http11 - DEBUG - response_closed.started
+ 2025-06-11 11:08:06,868 - httpcore.http11 - DEBUG - response_closed.complete
+ 2025-06-11 11:08:06,868 - httpcore.connection - DEBUG - close.started
+ 2025-06-11 11:08:06,868 - httpcore.connection - DEBUG - close.complete
+ 2025-06-11 11:08:06,879 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=30 socket_options=None
+ 2025-06-11 11:08:06,892 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11a1c8390>
+ 2025-06-11 11:08:06,892 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x107835370> server_hostname='api.gradio.app' timeout=3
+ 2025-06-11 11:08:07,028 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11fbd9090>
+ 2025-06-11 11:08:07,028 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x11fb68a70> server_hostname='api.gradio.app' timeout=30
+ 2025-06-11 11:08:07,032 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/initiated HTTP/1.1" 200 0
+ 2025-06-11 11:08:07,169 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x118e975d0>
+ 2025-06-11 11:08:07,170 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
+ 2025-06-11 11:08:07,170 - httpcore.http11 - DEBUG - send_request_headers.complete
+ 2025-06-11 11:08:07,170 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
+ 2025-06-11 11:08:07,171 - httpcore.http11 - DEBUG - send_request_body.complete
+ 2025-06-11 11:08:07,171 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
+ 2025-06-11 11:08:07,310 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:08:07 GMT'), (b'Content-Type', b'application/json'), (b'Content-Length', b'21'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'Access-Control-Allow-Origin', b'*')])
+ 2025-06-11 11:08:07,311 - httpx - INFO - HTTP Request: GET https://api.gradio.app/pkg-version "HTTP/1.1 200 OK"
+ 2025-06-11 11:08:07,311 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
+ 2025-06-11 11:08:07,312 - httpcore.http11 - DEBUG - receive_response_body.complete
+ 2025-06-11 11:08:07,312 - httpcore.http11 - DEBUG - response_closed.started
+ 2025-06-11 11:08:07,312 - httpcore.http11 - DEBUG - response_closed.complete
+ 2025-06-11 11:08:07,312 - httpcore.connection - DEBUG - close.started
+ 2025-06-11 11:08:07,312 - httpcore.connection - DEBUG - close.complete
+ 2025-06-11 11:08:07,326 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x119af4110>
+ 2025-06-11 11:08:07,326 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
+ 2025-06-11 11:08:07,326 - httpcore.http11 - DEBUG - send_request_headers.complete
+ 2025-06-11 11:08:07,326 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
+ 2025-06-11 11:08:07,326 - httpcore.http11 - DEBUG - send_request_body.complete
+ 2025-06-11 11:08:07,326 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
+ 2025-06-11 11:08:07,477 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:08:07 GMT'), (b'Content-Type', b'text/html; charset=utf-8'), (b'Transfer-Encoding', b'chunked'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'ContentType', b'application/json'), (b'Access-Control-Allow-Origin', b'*'), (b'Content-Encoding', b'gzip')])
+ 2025-06-11 11:08:07,478 - httpx - INFO - HTTP Request: GET https://api.gradio.app/v3/tunnel-request "HTTP/1.1 200 OK"
+ 2025-06-11 11:08:07,478 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
+ 2025-06-11 11:08:07,478 - httpcore.http11 - DEBUG - receive_response_body.complete
+ 2025-06-11 11:08:07,479 - httpcore.http11 - DEBUG - response_closed.started
+ 2025-06-11 11:08:07,479 - httpcore.http11 - DEBUG - response_closed.complete
+ 2025-06-11 11:08:07,479 - httpcore.connection - DEBUG - close.started
+ 2025-06-11 11:08:07,479 - httpcore.connection - DEBUG - close.complete
+ 2025-06-11 11:08:08,331 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
+ 2025-06-11 11:08:08,553 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/launched HTTP/1.1" 200 0
+ 2025-06-11 11:08:11,643 - hardware_detector - INFO - Initializing HardwareDetector
+ 2025-06-11 11:08:11,643 - hardware_detector - DEBUG - Starting system hardware detection
+ 2025-06-11 11:08:11,643 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
+ 2025-06-11 11:08:11,643 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
+ 2025-06-11 11:08:11,643 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
+ 2025-06-11 11:08:11,650 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
+ 2025-06-11 11:08:11,650 - hardware_detector - DEBUG - Checking PyTorch availability
+ 2025-06-11 11:08:11,650 - hardware_detector - INFO - PyTorch 2.7.0 detected
+ 2025-06-11 11:08:11,651 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
+ 2025-06-11 11:08:11,651 - hardware_detector - INFO - Hardware detection completed successfully
+ 2025-06-11 11:08:11,651 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
+ 2025-06-11 11:08:11,651 - __main__ - INFO - 🔍 DEBUG: Full detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
+ 2025-06-11 11:08:11,651 - __main__ - INFO - 🔍 DEBUG: Platform: Darwin
+ 2025-06-11 11:08:11,651 - __main__ - INFO - 🔍 DEBUG: Architecture: arm64
+ 2025-06-11 11:08:11,651 - __main__ - INFO - 🔍 DEBUG: MPS Available: True
+ 2025-06-11 11:08:11,651 - __main__ - INFO - 🔍 DEBUG: Is Apple Silicon: True
+ 2025-06-11 11:08:11,651 - __main__ - INFO - 🔍 DEBUG: GPU Info: None
+ 2025-06-11 11:08:11,651 - __main__ - INFO - 🔍 DEBUG: Detected RAM (GB): 16
+ 2025-06-11 11:08:11,658 - __main__ - INFO - 🔍 DEBUG: PSUtil detected 128GB unified memory
+ 2025-06-11 11:08:11,694 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
+ 2025-06-11 11:08:11,694 - simple_memory_calculator - INFO - Using known memory data for black-forest-labs/FLUX.1-schnell
+ 2025-06-11 11:08:11,694 - simple_memory_calculator - DEBUG - Known data: {'params_billions': 12.0, 'fp16_gb': 24.0, 'inference_fp16_gb': 36.0}
+ 2025-06-11 11:08:11,694 - simple_memory_calculator - INFO - Generating memory recommendations for black-forest-labs/FLUX.1-schnell with 8.0GB VRAM
+ 2025-06-11 11:08:11,694 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
+ 2025-06-11 11:08:11,695 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
+ 2025-06-11 11:08:11,695 - simple_memory_calculator - DEBUG - Model memory: 24.0GB, Inference memory: 36.0GB
+ 2025-06-11 11:08:11,695 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
+ 2025-06-11 11:08:11,695 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
+ 2025-06-11 11:08:11,809 - __main__ - INFO - 🔍 DEBUG: System profiler output: hardware:
+
+ hardware overview:
+
+ model name: macbook pro
+ model identifier: mac16,5
+ model number: z1fs0002mkh/a
+ chip: apple m4 max
+ total number of cores: 16 (12 performance and 4 efficiency)
+ memory: 128 gb
+ system firmware version: 11881.61.3
+ os loader version: 11881.61.3
+ serial number (system): kkvqcmx4dt
+ hardware uuid: 92bfa67e-d816-5b1d-99bb-f9a2824999ba
+ provisioning udid: 00006041-001269200280801c
+ activation lock status: enabled
+
+
+ 2025-06-11 11:08:11,809 - __main__ - INFO - 🔍 DEBUG: Detected Apple chip: M4 Max
+ 2025-06-11 11:08:11,809 - __main__ - INFO - 🔍 DEBUG: Final values - Platform: Apple Silicon, GPU Vendor: Apple Silicon, GPU Name: M4 Max, Unified RAM: 128GB
+ 2025-06-11 11:09:25,254 - __main__ - INFO - Initializing GradioAutodiffusers
+ 2025-06-11 11:09:25,254 - __main__ - DEBUG - API key found, length: 39
+ 2025-06-11 11:09:25,254 - auto_diffusers - INFO - Initializing AutoDiffusersGenerator
+ 2025-06-11 11:09:25,254 - auto_diffusers - DEBUG - API key length: 39
+ 2025-06-11 11:09:25,254 - auto_diffusers - WARNING - Tool calling dependencies not available, running without tools
+ 2025-06-11 11:09:25,254 - hardware_detector - INFO - Initializing HardwareDetector
+ 2025-06-11 11:09:25,254 - hardware_detector - DEBUG - Starting system hardware detection
+ 2025-06-11 11:09:25,254 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
+ 2025-06-11 11:09:25,254 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
+ 2025-06-11 11:09:25,254 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
+ 2025-06-11 11:09:25,258 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
+ 2025-06-11 11:09:25,258 - hardware_detector - DEBUG - Checking PyTorch availability
+ 2025-06-11 11:09:25,724 - hardware_detector - INFO - PyTorch 2.7.0 detected
+ 2025-06-11 11:09:25,724 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
+ 2025-06-11 11:09:25,724 - hardware_detector - INFO - Hardware detection completed successfully
+ 2025-06-11 11:09:25,724 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
+ 2025-06-11 11:09:25,724 - auto_diffusers - INFO - Hardware detector initialized successfully
+ 2025-06-11 11:09:25,724 - __main__ - INFO - AutoDiffusersGenerator initialized successfully
+ 2025-06-11 11:09:25,724 - simple_memory_calculator - INFO - Initializing SimpleMemoryCalculator
+ 2025-06-11 11:09:25,724 - simple_memory_calculator - DEBUG - HuggingFace API initialized
+ 2025-06-11 11:09:25,724 - simple_memory_calculator - DEBUG - Known models in database: 4
+ 2025-06-11 11:09:25,724 - __main__ - INFO - SimpleMemoryCalculator initialized successfully
+ 2025-06-11 11:09:25,724 - __main__ - DEBUG - Default model settings: gemini-2.5-flash-preview-05-20, temp=0.7
+ 2025-06-11 11:09:25,726 - asyncio - DEBUG - Using selector: KqueueSelector
+ 2025-06-11 11:09:25,738 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=3 socket_options=None
+ 2025-06-11 11:09:25,747 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
+ 2025-06-11 11:09:25,821 - asyncio - DEBUG - Using selector: KqueueSelector
+ 2025-06-11 11:09:25,852 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=None socket_options=None
+ 2025-06-11 11:09:25,853 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12867ed90>
+ 2025-06-11 11:09:25,853 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
+ 2025-06-11 11:09:25,853 - httpcore.http11 - DEBUG - send_request_headers.complete
+ 2025-06-11 11:09:25,853 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
+ 2025-06-11 11:09:25,853 - httpcore.http11 - DEBUG - send_request_body.complete
+ 2025-06-11 11:09:25,854 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
+ 2025-06-11 11:09:25,854 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:09:25 GMT'), (b'server', b'uvicorn'), (b'content-length', b'4'), (b'content-type', b'application/json')])
+ 2025-06-11 11:09:25,854 - httpx - INFO - HTTP Request: GET http://localhost:7860/gradio_api/startup-events "HTTP/1.1 200 OK"
+ 2025-06-11 11:09:25,854 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
+ 2025-06-11 11:09:25,854 - httpcore.http11 - DEBUG - receive_response_body.complete
+ 2025-06-11 11:09:25,854 - httpcore.http11 - DEBUG - response_closed.started
+ 2025-06-11 11:09:25,854 - httpcore.http11 - DEBUG - response_closed.complete
+ 2025-06-11 11:09:25,854 - httpcore.connection - DEBUG - close.started
+ 2025-06-11 11:09:25,854 - httpcore.connection - DEBUG - close.complete
+ 2025-06-11 11:09:25,855 - httpcore.connection - DEBUG - connect_tcp.started host='localhost' port=7860 local_address=None timeout=3 socket_options=None
+ 2025-06-11 11:09:25,855 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12c65f3d0>
+ 2025-06-11 11:09:25,855 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'HEAD']>
+ 2025-06-11 11:09:25,855 - httpcore.http11 - DEBUG - send_request_headers.complete
+ 2025-06-11 11:09:25,855 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'HEAD']>
+ 2025-06-11 11:09:25,855 - httpcore.http11 - DEBUG - send_request_body.complete
+ 2025-06-11 11:09:25,855 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'HEAD']>
+ 2025-06-11 11:09:25,862 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'date', b'Wed, 11 Jun 2025 02:09:25 GMT'), (b'server', b'uvicorn'), (b'content-length', b'142574'), (b'content-type', b'text/html; charset=utf-8')])
+ 2025-06-11 11:09:25,862 - httpx - INFO - HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
+ 2025-06-11 11:09:25,862 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'HEAD']>
+ 2025-06-11 11:09:25,862 - httpcore.http11 - DEBUG - receive_response_body.complete
+ 2025-06-11 11:09:25,862 - httpcore.http11 - DEBUG - response_closed.started
+ 2025-06-11 11:09:25,862 - httpcore.http11 - DEBUG - response_closed.complete
+ 2025-06-11 11:09:25,862 - httpcore.connection - DEBUG - close.started
+ 2025-06-11 11:09:25,862 - httpcore.connection - DEBUG - close.complete
19364
+ 2025-06-11 11:09:25,874 - httpcore.connection - DEBUG - connect_tcp.started host='api.gradio.app' port=443 local_address=None timeout=30 socket_options=None
19365
+ 2025-06-11 11:09:25,904 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12868d1d0>
19366
+ 2025-06-11 11:09:25,904 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x10cd35370> server_hostname='api.gradio.app' timeout=3
19367
+ 2025-06-11 11:09:26,016 - httpcore.connection - DEBUG - connect_tcp.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12c6d3790>
19368
+ 2025-06-11 11:09:26,016 - httpcore.connection - DEBUG - start_tls.started ssl_context=<ssl.SSLContext object at 0x12c668a70> server_hostname='api.gradio.app' timeout=30
19369
+ 2025-06-11 11:09:26,028 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/initiated HTTP/1.1" 200 0
19370
+ 2025-06-11 11:09:26,177 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x12c3e0950>
19371
+ 2025-06-11 11:09:26,177 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
19372
+ 2025-06-11 11:09:26,177 - httpcore.http11 - DEBUG - send_request_headers.complete
19373
+ 2025-06-11 11:09:26,177 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
19374
+ 2025-06-11 11:09:26,177 - httpcore.http11 - DEBUG - send_request_body.complete
19375
+ 2025-06-11 11:09:26,177 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
19376
+ 2025-06-11 11:09:26,306 - httpcore.connection - DEBUG - start_tls.complete return_value=<httpcore._backends.sync.SyncStream object at 0x11c64e6d0>
19377
+ 2025-06-11 11:09:26,307 - httpcore.http11 - DEBUG - send_request_headers.started request=<Request [b'GET']>
19378
+ 2025-06-11 11:09:26,307 - httpcore.http11 - DEBUG - send_request_headers.complete
19379
+ 2025-06-11 11:09:26,308 - httpcore.http11 - DEBUG - send_request_body.started request=<Request [b'GET']>
19380
+ 2025-06-11 11:09:26,308 - httpcore.http11 - DEBUG - send_request_body.complete
19381
+ 2025-06-11 11:09:26,308 - httpcore.http11 - DEBUG - receive_response_headers.started request=<Request [b'GET']>
19382
+ 2025-06-11 11:09:26,315 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:09:26 GMT'), (b'Content-Type', b'application/json'), (b'Content-Length', b'21'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'Access-Control-Allow-Origin', b'*')])
19383
+ 2025-06-11 11:09:26,315 - httpx - INFO - HTTP Request: GET https://api.gradio.app/pkg-version "HTTP/1.1 200 OK"
19384
+ 2025-06-11 11:09:26,315 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
19385
+ 2025-06-11 11:09:26,316 - httpcore.http11 - DEBUG - receive_response_body.complete
19386
+ 2025-06-11 11:09:26,316 - httpcore.http11 - DEBUG - response_closed.started
19387
+ 2025-06-11 11:09:26,316 - httpcore.http11 - DEBUG - response_closed.complete
19388
+ 2025-06-11 11:09:26,316 - httpcore.connection - DEBUG - close.started
19389
+ 2025-06-11 11:09:26,316 - httpcore.connection - DEBUG - close.complete
19390
+ 2025-06-11 11:09:26,454 - httpcore.http11 - DEBUG - receive_response_headers.complete return_value=(b'HTTP/1.1', 200, b'OK', [(b'Date', b'Wed, 11 Jun 2025 02:09:26 GMT'), (b'Content-Type', b'text/html; charset=utf-8'), (b'Transfer-Encoding', b'chunked'), (b'Connection', b'keep-alive'), (b'Server', b'nginx/1.18.0'), (b'ContentType', b'application/json'), (b'Access-Control-Allow-Origin', b'*'), (b'Content-Encoding', b'gzip')])
19391
+ 2025-06-11 11:09:26,455 - httpx - INFO - HTTP Request: GET https://api.gradio.app/v3/tunnel-request "HTTP/1.1 200 OK"
19392
+ 2025-06-11 11:09:26,455 - httpcore.http11 - DEBUG - receive_response_body.started request=<Request [b'GET']>
19393
+ 2025-06-11 11:09:26,455 - httpcore.http11 - DEBUG - receive_response_body.complete
19394
+ 2025-06-11 11:09:26,456 - httpcore.http11 - DEBUG - response_closed.started
19395
+ 2025-06-11 11:09:26,456 - httpcore.http11 - DEBUG - response_closed.complete
19396
+ 2025-06-11 11:09:26,456 - httpcore.connection - DEBUG - close.started
19397
+ 2025-06-11 11:09:26,457 - httpcore.connection - DEBUG - close.complete
19398
+ 2025-06-11 11:09:27,037 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): huggingface.co:443
19399
+ 2025-06-11 11:09:27,127 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
19400
+ 2025-06-11 11:09:27,127 - hardware_detector - INFO - Initializing HardwareDetector
19401
+ 2025-06-11 11:09:27,127 - simple_memory_calculator - INFO - Using known memory data for black-forest-labs/FLUX.1-schnell
19402
+ 2025-06-11 11:09:27,127 - hardware_detector - DEBUG - Starting system hardware detection
19403
+ 2025-06-11 11:09:27,127 - simple_memory_calculator - DEBUG - Known data: {'params_billions': 12.0, 'fp16_gb': 24.0, 'inference_fp16_gb': 36.0}
19404
+ 2025-06-11 11:09:27,127 - hardware_detector - DEBUG - Platform: Darwin, Architecture: arm64
19405
+ 2025-06-11 11:09:27,127 - simple_memory_calculator - INFO - Generating memory recommendations for black-forest-labs/FLUX.1-schnell with 8.0GB VRAM
19406
+ 2025-06-11 11:09:27,127 - hardware_detector - DEBUG - CPU cores: 16, Python: 3.11.11
19407
+ 2025-06-11 11:09:27,127 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
19408
+ 2025-06-11 11:09:27,127 - hardware_detector - DEBUG - Attempting GPU detection via nvidia-smi
19409
+ 2025-06-11 11:09:27,128 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
19410
+ 2025-06-11 11:09:27,128 - simple_memory_calculator - DEBUG - Model memory: 24.0GB, Inference memory: 36.0GB
19411
+ 2025-06-11 11:09:27,132 - simple_memory_calculator - INFO - Getting memory requirements for model: black-forest-labs/FLUX.1-schnell
19412
+ 2025-06-11 11:09:27,133 - simple_memory_calculator - DEBUG - Using cached memory data for black-forest-labs/FLUX.1-schnell
19413
+ 2025-06-11 11:09:27,134 - hardware_detector - DEBUG - nvidia-smi not found, no NVIDIA GPU detected
19414
+ 2025-06-11 11:09:27,135 - hardware_detector - DEBUG - Checking PyTorch availability
19415
+ 2025-06-11 11:09:27,135 - hardware_detector - INFO - PyTorch 2.7.0 detected
19416
+ 2025-06-11 11:09:27,135 - hardware_detector - DEBUG - CUDA available: False, MPS available: True
19417
+ 2025-06-11 11:09:27,135 - hardware_detector - INFO - Hardware detection completed successfully
19418
+ 2025-06-11 11:09:27,135 - hardware_detector - DEBUG - Detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
19419
+ 2025-06-11 11:09:27,135 - __main__ - INFO - 🔍 DEBUG: Full detected specs: {'platform': 'Darwin', 'architecture': 'arm64', 'cpu_count': 16, 'python_version': '3.11.11', 'gpu_info': None, 'cuda_available': False, 'mps_available': True, 'torch_version': '2.7.0'}
19420
+ 2025-06-11 11:09:27,135 - __main__ - INFO - 🔍 DEBUG: Platform: Darwin
19421
+ 2025-06-11 11:09:27,135 - __main__ - INFO - 🔍 DEBUG: Architecture: arm64
19422
+ 2025-06-11 11:09:27,135 - __main__ - INFO - 🔍 DEBUG: MPS Available: True
19423
+ 2025-06-11 11:09:27,135 - __main__ - INFO - 🔍 DEBUG: Is Apple Silicon: True
19424
+ 2025-06-11 11:09:27,135 - __main__ - INFO - 🔍 DEBUG: GPU Info: None
19425
+ 2025-06-11 11:09:27,135 - __main__ - INFO - 🔍 DEBUG: Detected RAM (GB): 16
19426
+ 2025-06-11 11:09:27,140 - __main__ - INFO - 🔍 DEBUG: PSUtil detected 128GB unified memory
19427
+ 2025-06-11 11:09:27,218 - __main__ - INFO - 🔍 DEBUG: System profiler output: hardware:
19428
+
19429
+ hardware overview:
19430
+
19431
+ model name: macbook pro
19432
+ model identifier: mac16,5
19433
+ model number: z1fs0002mkh/a
19434
+ chip: apple m4 max
19435
+ total number of cores: 16 (12 performance and 4 efficiency)
19436
+ memory: 128 gb
19437
+ system firmware version: 11881.61.3
19438
+ os loader version: 11881.61.3
19439
+ serial number (system): kkvqcmx4dt
19440
+ hardware uuid: 92bfa67e-d816-5b1d-99bb-f9a2824999ba
19441
+ provisioning udid: 00006041-001269200280801c
19442
+ activation lock status: enabled
19443
+
19444
+
19445
+ 2025-06-11 11:09:27,218 - __main__ - INFO - 🔍 DEBUG: Detected Apple chip: M4 Max
19446
+ 2025-06-11 11:09:27,218 - __main__ - INFO - 🔍 DEBUG: Final values - Platform: Apple Silicon, GPU Vendor: Apple Silicon, GPU Name: M4 Max, Unified RAM: 128GB
19447
+ 2025-06-11 11:09:27,258 - urllib3.connectionpool - DEBUG - https://huggingface.co:443 "HEAD /api/telemetry/gradio/launched HTTP/1.1" 200 0
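The startup log above traces the Apple Silicon path: the detector reports `Darwin`/`arm64` with MPS available, `psutil` supplies the 128 GB unified-memory figure, and a `system_profiler SPHardwareDataType` call yields the `M4 Max` chip name. A minimal sketch of that detection flow — the function name `detect_apple_silicon` and the regex are illustrative, not taken from this repository:

```python
import platform
import re
import subprocess

def detect_apple_silicon():
    """Return (is_apple_silicon, chip_name) using the same signals as the log.

    Illustrative sketch: checks OS/architecture first, then asks
    `system_profiler` for the chip line (e.g. "chip: apple m4 max").
    """
    if platform.system() != "Darwin" or platform.machine() != "arm64":
        return False, None
    chip = "Apple Silicon GPU"  # fallback if system_profiler yields nothing
    try:
        out = subprocess.run(
            ["system_profiler", "SPHardwareDataType"],
            capture_output=True, text=True, timeout=5,
        ).stdout.lower()
        m = re.search(r"chip:\s*apple\s+(m\d+)(?:\s+(pro|max|ultra))?", out)
        if m:
            suffix = f" {m.group(2).title()}" if m.group(2) else ""
            chip = m.group(1).upper() + suffix
    except (OSError, subprocess.SubprocessError):
        pass  # keep the generic fallback name
    return True, chip
```

On the machine that produced this log, such a check would return `(True, "M4 Max")`; on Linux or Windows it short-circuits to `(False, None)`.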
gradio_app.py CHANGED
@@ -1,10 +1,12 @@
1
  import os
2
  import logging
 
3
  import gradio as gr
4
  from dotenv import load_dotenv
5
  import google.generativeai as genai
6
  from auto_diffusers import AutoDiffusersGenerator
7
  from simple_memory_calculator import SimpleMemoryCalculator
 
8
 
9
  load_dotenv()
10
 
@@ -170,8 +172,12 @@ class GradioAutodiffusers:
170
  return f"Error generating code: {str(e)}"
171
 
172
 
173
- def create_gradio_interface():
174
- """Create and configure the Gradio interface."""
175
 
176
  app = GradioAutodiffusers()
177
 
@@ -1641,7 +1647,7 @@ def create_gradio_interface():
1641
 
1642
  # Hardware Selection Section
1643
  with gr.Group(elem_classes="glass-card"):
1644
- with gr.Accordion("⚙️ Hardware Specifications", open=False) as hardware_accordion:
1645
  gr.HTML("""
1646
  <div class="section-header" style="text-align: center;">
1647
  <p style="margin: 0; color: #6a443a; font-size: 1.1rem; font-weight: 600; font-family: 'Georgia', serif;">
@@ -1653,7 +1659,7 @@ def create_gradio_interface():
1653
  # Platform, VRAM, and RAM in a single row
1654
  with gr.Row():
1655
  platform = gr.Dropdown(
1656
- choices=["Linux", "Darwin", "Windows"],
1657
  label="🖥️ Platform",
1658
  value="Linux",
1659
  info="Your operating system"
@@ -1672,6 +1678,14 @@ def create_gradio_interface():
1672
  maximum=256,
1673
  info="Total system memory"
1674
  )
 
 
1675
 
1676
  # GPU configuration on separate lines
1677
  gpu_vendor = gr.Dropdown(
@@ -1711,6 +1725,7 @@ def create_gradio_interface():
1711
  visible=False
1712
  )
1713
 
 
1714
  # Model Configuration Section
1715
  with gr.Group(elem_classes="glass-card"):
1716
  with gr.Accordion("🤖 Model Configuration", open=True) as model_accordion:
@@ -1819,6 +1834,25 @@ def create_gradio_interface():
1819
  value=""
1820
  )
1821
 
 
 
1822
  def on_gpu_vendor_change(vendor):
1823
  """Handle GPU vendor selection and update series dropdown."""
1824
  if vendor == "Custom (Manual Input)":
@@ -1944,12 +1978,16 @@ def create_gradio_interface():
1944
  else:
1945
  return vendor if vendor != "Custom (Manual Input)" else "Custom GPU"
1946
 
1947
- def update_hardware_accordion_title(platform, gpu_vendor, gpu_model, vram_gb, ram_gb):
1948
  """Update hardware accordion title with current configuration."""
1949
  final_gpu = get_final_gpu_name(gpu_vendor, "", gpu_model)
1950
  if not final_gpu:
1951
  final_gpu = gpu_vendor if gpu_vendor != "Custom (Manual Input)" else "Custom GPU"
1952
 
1953
  # Extract GPU name and VRAM for cleaner display
1954
  gpu_display = final_gpu
1955
  if gpu_model and "(" in gpu_model and "GB" in gpu_model:
@@ -2014,6 +2052,13 @@ def create_gradio_interface():
2014
  error_msg = str(e)
2015
  return f"**Note:** {error_msg} (API error)", model_name
2016
 
 
 
2017
  # Connect GPU dropdown change handlers with memory analysis updates
2018
  gpu_vendor.change(
2019
  on_gpu_vendor_change,
@@ -2069,18 +2114,195 @@ def create_gradio_interface():
2069
  )
2070
 
2071
  # Create wrapper functions that return gr.update for accordion labels
2072
- def update_hardware_accordion(platform, gpu_vendor, gpu_model, vram_gb, ram_gb):
2073
- title = update_hardware_accordion_title(platform, gpu_vendor, gpu_model, vram_gb, ram_gb)
2074
  return gr.update(label=title)
2075
 
2076
  def update_model_accordion(model_name, dtype_selection, width, height, inference_steps, memory_analysis_text=""):
2077
  title = update_model_accordion_title(model_name, dtype_selection, width, height, inference_steps, memory_analysis_text)
2078
  return gr.update(label=title)
2079
 
 
2080
  # Load initial accordion titles on startup
2081
  interface.load(
2082
  update_hardware_accordion,
2083
- inputs=[platform, gpu_vendor, gpu_model, vram_gb, ram_gb],
2084
  outputs=hardware_accordion
2085
  )
2086
 
@@ -2093,10 +2315,10 @@ def create_gradio_interface():
2093
  # Accordion title update event handlers
2094
 
2095
  # Hardware accordion title updates
2096
- for component in [platform, gpu_vendor, gpu_model, vram_gb, ram_gb]:
2097
  component.change(
2098
  update_hardware_accordion,
2099
- inputs=[platform, gpu_vendor, gpu_model, vram_gb, ram_gb],
2100
  outputs=hardware_accordion
2101
  )
2102
 
@@ -2191,20 +2413,28 @@ def create_gradio_interface():
2191
 
2192
  return '\n'.join(filtered_lines)
2193
 
2194
- def generate_with_combined_gpu_name(gpu_vendor, gpu_series, gpu_model, vram_gb, ram_gb, platform, model_name, dtype_selection, width, height, inference_steps):
2195
  """Generate code with the correct GPU name from multi-level selection, including memory analysis."""
2196
  final_gpu_name = get_final_gpu_name(gpu_vendor, gpu_series, gpu_model)
2197
 
2198
  # Constant prompt text
2199
  prompt_text = "A cat holding a sign that says hello world"
2200
 
 
 
2201
  # STEP 1: Perform memory analysis BEFORE code generation
2202
  memory_analysis_data = None
2203
  memory_header = ""
2204
 
2205
  try:
2206
- if model_name and vram_gb and vram_gb > 0:
2207
- memory_info, recommendations, _ = app.analyze_model_memory(model_name, vram_gb)
2208
 
2209
  # Package memory analysis for Gemini API
2210
  memory_analysis_data = {
@@ -2241,8 +2471,17 @@ def create_gradio_interface():
2241
 
2242
  optimization_strategy = get_optimization_strategy(recommendations)
2243
 
2244
- memory_header = f"""# Memory Analysis for {model_name}:
2245
- # GPU: {final_gpu_name if final_gpu_name else 'Not specified'} ({vram_gb}GB VRAM)
 
 
2246
  # Model Memory Requirements: {memory_info.get('estimated_inference_memory_fp16_gb', 'Unknown')} GB
2247
  # Recommendation: {', '.join(recommendations.get('recommendations', ['N/A']))}
2248
  # Optimization Strategy: {optimization_strategy}
@@ -2256,9 +2495,25 @@ def create_gradio_interface():
2256
  """
2257
 
2258
  # STEP 2: Get the actual prompt that will be sent to Gemini
2259
- actual_prompt = app.get_generation_prompt(
2260
- model_name, prompt_text, (int(height), int(width)), int(inference_steps),
2261
- {
 
 
2262
  'platform': platform,
2263
  'architecture': 'manual_input',
2264
  'cpu_count': 8,
@@ -2267,16 +2522,20 @@ def create_gradio_interface():
2267
  'mps_available': platform == 'Darwin' and 'apple' in final_gpu_name.lower() if final_gpu_name else False,
2268
  'torch_version': '2.0+',
2269
  'manual_input': True,
2270
- 'ram_gb': int(ram_gb) if ram_gb else 16,
2271
  'user_dtype': f"torch.{dtype_selection}" if dtype_selection != "Auto" else None,
2272
- 'gpu_info': [{'name': final_gpu_name, 'memory_mb': int(vram_gb) * 1024}] if final_gpu_name and vram_gb else None
2273
- },
 
 
 
 
2274
  optimization_profile="balanced"
2275
  )
2276
 
2277
  # STEP 3: Generate the optimized code WITH memory analysis information
2278
  generated_code = app.generate_code_with_manual_specs(
2279
- final_gpu_name, vram_gb, ram_gb, platform,
2280
  model_name, prompt_text, dtype_selection, width, height, inference_steps,
2281
  memory_analysis_data
2282
  )
@@ -2294,11 +2553,11 @@ def create_gradio_interface():
2294
  full_code_storage = gr.State(value="")
2295
  prompt_storage = gr.State(value="")
2296
 
2297
- def generate_and_store_code(gpu_vendor, gpu_series, gpu_model, vram_gb, ram_gb, platform, model_name, dtype_selection, width, height, inference_steps):
2298
  """Generate code and return code for display and full code for storage."""
2299
  summary, full_code, actual_prompt = generate_with_combined_gpu_name(
2300
  gpu_vendor, gpu_series, gpu_model, vram_gb, ram_gb, platform,
2301
- model_name, dtype_selection, width, height, inference_steps
2302
  )
2303
  # Show the view prompt button after generation and close accordions
2304
  return (full_code, full_code, False, gr.update(visible=True), actual_prompt,
@@ -2317,7 +2576,7 @@ def create_gradio_interface():
2317
  generate_and_store_code,
2318
  inputs=[
2319
  gpu_vendor, gpu_series, gpu_model, vram_gb, ram_gb, platform,
2320
- model_name, dtype_selection, width, height, inference_steps
2321
  ],
2322
  outputs=[code_output, full_code_storage, code_collapsed, view_prompt_btn, prompt_storage, hardware_accordion, model_accordion]
2323
  )
@@ -2334,6 +2593,7 @@ def create_gradio_interface():
2334
  hide_modal,
2335
  outputs=[prompt_modal, prompt_display]
2336
  )
 
2337
 
2338
 
2339
 
@@ -2342,12 +2602,54 @@ def create_gradio_interface():
2342
 
2343
  def main():
2344
  """Launch the Gradio application."""
 
 
 
2345
  try:
2346
- interface = create_gradio_interface()
2347
  interface.launch(
2348
- server_name="0.0.0.0",
2349
- server_port=7860,
2350
- share=True,
2351
  show_error=True
2352
  )
2353
  except Exception as e:
 
1
  import os
2
  import logging
3
+ import argparse
4
  import gradio as gr
5
  from dotenv import load_dotenv
6
  import google.generativeai as genai
7
  from auto_diffusers import AutoDiffusersGenerator
8
  from simple_memory_calculator import SimpleMemoryCalculator
9
+ from hardware_detector import HardwareDetector
10
 
11
  load_dotenv()
12
 
 
172
  return f"Error generating code: {str(e)}"
173
 
174
 
175
+ def create_gradio_interface(auto_hardware_detection=False):
176
+ """Create and configure the Gradio interface.
177
+
178
+ Args:
179
+ auto_hardware_detection (bool): Whether to enable automatic hardware detection on startup
180
+ """
181
 
182
  app = GradioAutodiffusers()
183
 
 
1647
 
1648
  # Hardware Selection Section
1649
  with gr.Group(elem_classes="glass-card"):
1650
+ with gr.Accordion("⚙️ Hardware Specifications", open=True) as hardware_accordion:
1651
  gr.HTML("""
1652
  <div class="section-header" style="text-align: center;">
1653
  <p style="margin: 0; color: #6a443a; font-size: 1.1rem; font-weight: 600; font-family: 'Georgia', serif;">
 
1659
  # Platform, VRAM, and RAM in a single row
1660
  with gr.Row():
1661
  platform = gr.Dropdown(
1662
+ choices=["Linux", "Darwin", "Windows", "Apple Silicon"],
1663
  label="🖥️ Platform",
1664
  value="Linux",
1665
  info="Your operating system"
 
1678
  maximum=256,
1679
  info="Total system memory"
1680
  )
1681
+ unified_ram_gb = gr.Number(
1682
+ label="🔗 Unified RAM (GB)",
1683
+ value=16,
1684
+ minimum=8,
1685
+ maximum=256,
1686
+ visible=False,
1687
+ info="Total unified memory (shared by CPU and GPU)"
1688
+ )
1689
 
1690
  # GPU configuration on separate lines
1691
  gpu_vendor = gr.Dropdown(
 
1725
  visible=False
1726
  )
1727
 
1728
+
1729
  # Model Configuration Section
1730
  with gr.Group(elem_classes="glass-card"):
1731
  with gr.Accordion("🤖 Model Configuration", open=True) as model_accordion:
 
1834
  value=""
1835
  )
1836
 
1837
+ def on_platform_change(platform_value):
1838
+ """Handle platform selection and update field visibility."""
1839
+ if platform_value == "Apple Silicon":
1840
+ # Hide VRAM, System RAM, and GPU Series; show Unified RAM
1841
+ return (
1842
+ gr.update(visible=False), # vram_gb
1843
+ gr.update(visible=False), # ram_gb
1844
+ gr.update(visible=True), # unified_ram_gb
1845
+ gr.update(visible=False) # gpu_series
1846
+ )
1847
+ else:
1848
+ # Show VRAM and System RAM, hide Unified RAM, show GPU Series
1849
+ return (
1850
+ gr.update(visible=True), # vram_gb
1851
+ gr.update(visible=True), # ram_gb
1852
+ gr.update(visible=False), # unified_ram_gb
1853
+ gr.update(visible=True) # gpu_series
1854
+ )
1855
+
1856
  def on_gpu_vendor_change(vendor):
1857
  """Handle GPU vendor selection and update series dropdown."""
1858
  if vendor == "Custom (Manual Input)":
 
1978
  else:
1979
  return vendor if vendor != "Custom (Manual Input)" else "Custom GPU"
1980
 
1981
+ def update_hardware_accordion_title(platform, gpu_vendor, gpu_model, vram_gb, ram_gb, unified_ram_gb=None):
1982
  """Update hardware accordion title with current configuration."""
1983
  final_gpu = get_final_gpu_name(gpu_vendor, "", gpu_model)
1984
  if not final_gpu:
1985
  final_gpu = gpu_vendor if gpu_vendor != "Custom (Manual Input)" else "Custom GPU"
1986
 
1987
+ # Handle Apple Silicon unified memory display
1988
+ if platform == "Apple Silicon":
1989
+ return f"⚙️ Hardware: Apple Silicon | {unified_ram_gb}GB Unified Memory"
1990
+
1991
  # Extract GPU name and VRAM for cleaner display
1992
  gpu_display = final_gpu
1993
  if gpu_model and "(" in gpu_model and "GB" in gpu_model:
 
2052
  error_msg = str(e)
2053
  return f"**Note:** {error_msg} (API error)", model_name
2054
 
2055
+ # Connect platform change handler
2056
+ platform.change(
2057
+ on_platform_change,
2058
+ inputs=[platform],
2059
+ outputs=[vram_gb, ram_gb, unified_ram_gb, gpu_series]
2060
+ )
2061
+
2062
  # Connect GPU dropdown change handlers with memory analysis updates
2063
  gpu_vendor.change(
2064
  on_gpu_vendor_change,
 
2114
  )
2115
 
2116
  # Create wrapper functions that return gr.update for accordion labels
2117
+ def update_hardware_accordion(platform, gpu_vendor, gpu_model, vram_gb, ram_gb, unified_ram_gb):
2118
+ title = update_hardware_accordion_title(platform, gpu_vendor, gpu_model, vram_gb, ram_gb, unified_ram_gb)
2119
  return gr.update(label=title)
2120
 
2121
  def update_model_accordion(model_name, dtype_selection, width, height, inference_steps, memory_analysis_text=""):
2122
  title = update_model_accordion_title(model_name, dtype_selection, width, height, inference_steps, memory_analysis_text)
2123
  return gr.update(label=title)
2124
 
2125
+ def auto_detect_hardware():
2126
+ """Auto-detect hardware specifications and return values for form fields."""
2127
+ try:
2128
+ detector = HardwareDetector()
2129
+ specs = detector.specs
2130
+
2131
+ # DEBUG: Log all detected specs
2132
+ logger.info(f"🔍 DEBUG: Full detected specs: {specs}")
2133
+
2134
+ # Extract platform
2135
+ detected_platform = specs.get('platform', 'Linux')
2136
+ logger.info(f"🔍 DEBUG: Platform: {detected_platform}")
2137
+ logger.info(f"🔍 DEBUG: Architecture: {specs.get('architecture')}")
2138
+ logger.info(f"🔍 DEBUG: MPS Available: {specs.get('mps_available')}")
2139
+
2140
+ # Check for Apple Silicon specifically
2141
+ is_apple_silicon = (
2142
+ detected_platform == 'Darwin' and
2143
+ specs.get('architecture') == 'arm64' and
2144
+ specs.get('mps_available', False)
2145
+ )
2146
+
2147
+ logger.info(f"🔍 DEBUG: Is Apple Silicon: {is_apple_silicon}")
2148
+
2149
+ if is_apple_silicon:
2150
+ detected_platform = "Apple Silicon"
2151
+
2152
+ # Extract GPU info
2153
+ gpu_info = specs.get('gpu_info', [])
2154
+ logger.info(f"🔍 DEBUG: GPU Info: {gpu_info}")
2155
+
2156
+ detected_gpu_name = ""
2157
+ detected_vram = 8 # default
2158
+ detected_unified_ram = 16 # default for Apple Silicon
2159
+
2160
+ if gpu_info and len(gpu_info) > 0:
2161
+ gpu = gpu_info[0] # Take first GPU
2162
+ detected_gpu_name = gpu.get('name', '')
2163
+ detected_vram = gpu.get('memory_mb', 8192) // 1024 # Convert MB to GB
2164
+ logger.info(f"🔍 DEBUG: GPU Name: {detected_gpu_name}")
2165
+ logger.info(f"🔍 DEBUG: GPU Memory MB: {gpu.get('memory_mb')}")
2166
+
2167
+ # Extract RAM - try multiple methods for Apple Silicon
2168
+ detected_ram = specs.get('ram_gb', 16)
2169
+ logger.info(f"🔍 DEBUG: Detected RAM (GB): {detected_ram}")
2170
+
2171
+ # For Apple Silicon, try to get more accurate memory info
2172
+ if is_apple_silicon:
2173
+ # Try to get system memory in different ways
2174
+ try:
2175
+ import psutil
2176
+ total_memory_bytes = psutil.virtual_memory().total
2177
+ total_memory_gb = total_memory_bytes / (1024**3)
2178
+ detected_unified_ram = round(total_memory_gb)
2179
+ logger.info(f"🔍 DEBUG: PSUtil detected {detected_unified_ram}GB unified memory")
2180
+ except:
2181
+ # Fallback to specs value
2182
+ detected_unified_ram = detected_ram
2183
+ logger.info(f"🔍 DEBUG: Using specs RAM value: {detected_unified_ram}GB")
2184
+
2185
+ # Map detected GPU to vendor categories
2186
+ gpu_vendor = "Custom (Manual Input)"
2187
+
2188
+ # For Apple Silicon, try to detect the chip series
2189
+ if is_apple_silicon:
2190
+ # Try to detect Apple Silicon chip from system info
2191
+ try:
2192
+ import subprocess
2193
+ # Get chip info from system profiler
2194
+ result = subprocess.run(['system_profiler', 'SPHardwareDataType'],
2195
+ capture_output=True, text=True, timeout=5)
2196
+ chip_info = result.stdout.lower()
2197
+ logger.info(f"🔍 DEBUG: System profiler output: {chip_info}")
2198
+
2199
+ if 'm1' in chip_info:
2200
+ if 'ultra' in chip_info:
2201
+ detected_gpu_name = "M1 Ultra"
2202
+ elif 'max' in chip_info:
2203
+ detected_gpu_name = "M1 Max"
2204
+ elif 'pro' in chip_info:
2205
+ detected_gpu_name = "M1 Pro"
2206
+ else:
2207
+ detected_gpu_name = "M1"
2208
+ elif 'm2' in chip_info:
2209
+ if 'ultra' in chip_info:
2210
+ detected_gpu_name = "M2 Ultra"
2211
+ elif 'max' in chip_info:
2212
+ detected_gpu_name = "M2 Max"
2213
+ elif 'pro' in chip_info:
2214
+ detected_gpu_name = "M2 Pro"
2215
+ else:
2216
+ detected_gpu_name = "M2"
2217
+ elif 'm3' in chip_info:
2218
+ if 'ultra' in chip_info:
2219
+ detected_gpu_name = "M3 Ultra"
2220
+ elif 'max' in chip_info:
2221
+ detected_gpu_name = "M3 Max"
2222
+ elif 'pro' in chip_info:
2223
+ detected_gpu_name = "M3 Pro"
2224
+ else:
2225
+ detected_gpu_name = "M3"
2226
+ elif 'm4' in chip_info:
2227
+ if 'ultra' in chip_info:
2228
+ detected_gpu_name = "M4 Ultra"
2229
+ elif 'max' in chip_info:
2230
+ detected_gpu_name = "M4 Max"
2231
+ elif 'pro' in chip_info:
2232
+ detected_gpu_name = "M4 Pro"
2233
+ else:
2234
+ detected_gpu_name = "M4"
2235
+
2236
+ logger.info(f"🔍 DEBUG: Detected Apple chip: {detected_gpu_name}")
2237
+ except Exception as e:
2238
+ logger.warning(f"🔍 DEBUG: Could not detect Apple chip: {e}")
2239
+ detected_gpu_name = "Apple Silicon GPU"
2240
+
2241
+ gpu_vendor = "Apple Silicon"
2242
+ elif detected_gpu_name:
2243
+ gpu_lower = detected_gpu_name.lower()
2244
+ if 'rtx' in gpu_lower and ('geforce' in gpu_lower or '30' in gpu_lower or '40' in gpu_lower or '50' in gpu_lower):
2245
+ gpu_vendor = "NVIDIA Consumer (GeForce RTX)"
2246
+ elif 'rtx' in gpu_lower and ('a' in gpu_lower or 'quadro' in gpu_lower):
2247
+ gpu_vendor = "NVIDIA Professional (RTX A-Series)"
2248
+ elif any(x in gpu_lower for x in ['h100', 'a100', 'v100', 'l40', 'l4']):
2249
+ gpu_vendor = "NVIDIA Data Center"
2250
+ elif 'm1' in gpu_lower or 'm2' in gpu_lower or 'm3' in gpu_lower or 'm4' in gpu_lower or 'apple' in gpu_lower:
2251
+ gpu_vendor = "Apple Silicon"
2252
+ elif 'radeon' in gpu_lower or 'rx ' in gpu_lower or 'instinct' in gpu_lower:
2253
+ gpu_vendor = "AMD"
2254
+ elif 'arc' in gpu_lower:
2255
+ gpu_vendor = "Intel"
2256
+
2257
+ logger.info(f"🔍 DEBUG: Final values - Platform: {detected_platform}, GPU Vendor: {gpu_vendor}, GPU Name: {detected_gpu_name}, Unified RAM: {detected_unified_ram}GB")
2258
+
2259
+ return detected_platform, gpu_vendor, detected_gpu_name, detected_vram, detected_ram, detected_unified_ram
2260
+
2261
+ except Exception as e:
2262
+ logger.warning(f"Auto hardware detection failed: {e}")
2263
+ # Return defaults if detection fails
2264
+ return "Linux", "Custom (Manual Input)", "", 8, 16, 16
2265
+
2266
+ # Auto hardware detection on startup (if enabled)
2267
+ if auto_hardware_detection:
2268
+ def populate_hardware_on_load():
2269
+ """Populate hardware fields with auto-detected values on load."""
2270
+ detected_platform, detected_gpu_vendor, detected_gpu_name, detected_vram, detected_ram, detected_unified_ram = auto_detect_hardware()
2271
+
2272
+ # Handle Apple Silicon field visibility
2273
+ if detected_platform == "Apple Silicon":
2274
+ vram_visible = False
2275
+ ram_visible = False
2276
+ unified_visible = True
2277
+ gpu_series_visible = False
2278
+ else:
2279
+ vram_visible = True
2280
+ ram_visible = True
2281
+ unified_visible = False
2282
+ gpu_series_visible = True
2283
+
2284
+ # Update all hardware fields
2285
+ updates = [
2286
+ gr.update(value=detected_platform), # platform
2287
+ gr.update(value=detected_gpu_vendor), # gpu_vendor
2288
+ gr.update(value=detected_gpu_name), # gpu_name
2289
+ gr.update(value=detected_vram, visible=vram_visible), # vram_gb
2290
+ gr.update(value=detected_ram, visible=ram_visible), # ram_gb
2291
+ gr.update(value=detected_unified_ram, visible=unified_visible), # unified_ram_gb
2292
+ gr.update(visible=gpu_series_visible), # gpu_series
2293
+ ]
2294
+
2295
+ return updates
2296
+
2297
+ interface.load(
2298
+ populate_hardware_on_load,
2299
+ outputs=[platform, gpu_vendor, gpu_name, vram_gb, ram_gb, unified_ram_gb, gpu_series]
2300
+ )
2301
+
  # Load initial accordion titles on startup
  interface.load(
  update_hardware_accordion,
+ inputs=[platform, gpu_vendor, gpu_model, vram_gb, ram_gb, unified_ram_gb],
  outputs=hardware_accordion
  )

  # Accordion title update event handlers

  # Hardware accordion title updates
+ for component in [platform, gpu_vendor, gpu_model, vram_gb, ram_gb, unified_ram_gb]:
  component.change(
  update_hardware_accordion,
+ inputs=[platform, gpu_vendor, gpu_model, vram_gb, ram_gb, unified_ram_gb],
  outputs=hardware_accordion
  )
 

  return '\n'.join(filtered_lines)

+ def generate_with_combined_gpu_name(gpu_vendor, gpu_series, gpu_model, vram_gb, ram_gb, platform, model_name, dtype_selection, width, height, inference_steps, unified_ram_gb=None):
  """Generate code with the correct GPU name from multi-level selection, including memory analysis."""
  final_gpu_name = get_final_gpu_name(gpu_vendor, gpu_series, gpu_model)

  # Constant prompt text
  prompt_text = "A cat holding a sign that says hello world"

+ # Handle Apple Silicon unified memory
+ effective_vram = vram_gb
+ effective_ram = ram_gb
+ if platform == "Apple Silicon" and unified_ram_gb:
+ # For Apple Silicon, unified memory serves as both VRAM and RAM
+ effective_vram = unified_ram_gb
+ effective_ram = unified_ram_gb
+
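The unified-memory handling just added can be sketched as a standalone function (illustrative name, not the app's API): on Apple Silicon the single unified pool is reported as both the effective VRAM and the effective RAM, while other platforms pass their discrete values through.

```python
def effective_memory(platform, vram_gb, ram_gb, unified_ram_gb=None):
    """Return (effective_vram, effective_ram) in GB.

    On Apple Silicon the unified memory pool serves as both VRAM and
    RAM; on other platforms the discrete values are used unchanged.
    """
    if platform == "Apple Silicon" and unified_ram_gb:
        return unified_ram_gb, unified_ram_gb
    return vram_gb, ram_gb

print(effective_memory("Apple Silicon", 0, 0, unified_ram_gb=32))
print(effective_memory("Linux", 24, 64))
```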
  # STEP 1: Perform memory analysis BEFORE code generation
  memory_analysis_data = None
  memory_header = ""

  try:
+ if model_name and effective_vram and effective_vram > 0:
+ memory_info, recommendations, _ = app.analyze_model_memory(model_name, effective_vram)

  # Package memory analysis for Gemini API
  memory_analysis_data = {
 

  optimization_strategy = get_optimization_strategy(recommendations)

+ if platform == "Apple Silicon":
+ memory_header = f"""# Memory Analysis for {model_name}:
+ # Platform: Apple Silicon with {unified_ram_gb}GB Unified Memory (shared CPU/GPU)
+ # Model Memory Requirements: {memory_info.get('estimated_inference_memory_fp16_gb', 'Unknown')} GB
+ # Recommendation: {', '.join(recommendations.get('recommendations', ['N/A']))}
+ # Optimization Strategy: {optimization_strategy}
+
+ """
+ else:
+ memory_header = f"""# Memory Analysis for {model_name}:
+ # GPU: {final_gpu_name if final_gpu_name else 'Not specified'} ({effective_vram}GB VRAM)
  # Model Memory Requirements: {memory_info.get('estimated_inference_memory_fp16_gb', 'Unknown')} GB
  # Recommendation: {', '.join(recommendations.get('recommendations', ['N/A']))}
  # Optimization Strategy: {optimization_strategy}
 
  """

  # STEP 2: Get the actual prompt that will be sent to Gemini
+ # Create hardware specs based on platform
+ if platform == "Apple Silicon":
+ hardware_specs = {
+ 'platform': 'Darwin', # Use Darwin for backend compatibility
+ 'architecture': 'arm64',
+ 'cpu_count': 8,
+ 'python_version': '3.11',
+ 'cuda_available': False,
+ 'mps_available': True, # Apple Silicon supports MPS
+ 'torch_version': '2.0+',
+ 'manual_input': True,
+ 'ram_gb': int(effective_ram) if effective_ram else 16,
+ 'unified_memory': True, # Special flag for Apple Silicon
+ 'unified_memory_gb': int(unified_ram_gb) if unified_ram_gb else 16,
+ 'user_dtype': f"torch.{dtype_selection}" if dtype_selection != "Auto" else None,
+ 'gpu_info': None # Apple Silicon doesn't report discrete GPU info
+ }
+ else:
+ hardware_specs = {
  'platform': platform,
  'architecture': 'manual_input',
  'cpu_count': 8,
 
  'mps_available': platform == 'Darwin' and 'apple' in final_gpu_name.lower() if final_gpu_name else False,
  'torch_version': '2.0+',
  'manual_input': True,
+ 'ram_gb': int(effective_ram) if effective_ram else 16,
  'user_dtype': f"torch.{dtype_selection}" if dtype_selection != "Auto" else None,
+ 'gpu_info': [{'name': final_gpu_name, 'memory_mb': int(effective_vram) * 1024}] if final_gpu_name and effective_vram else None
+ }
+
+ actual_prompt = app.get_generation_prompt(
+ model_name, prompt_text, (int(height), int(width)), int(inference_steps),
+ hardware_specs,
  optimization_profile="balanced"
  )

  # STEP 3: Generate the optimized code WITH memory analysis information
  generated_code = app.generate_code_with_manual_specs(
+ final_gpu_name, effective_vram, effective_ram, platform,
  model_name, prompt_text, dtype_selection, width, height, inference_steps,
  memory_analysis_data
  )
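The `gpu_info` entry built above converts the UI's GB figure into the MB the backend expects (`int(effective_vram) * 1024`). A small sketch of that conversion, with a hypothetical helper name and GPU string of my own:

```python
def gpu_info_entry(gpu_name, vram_gb):
    """Build the gpu_info list for hardware_specs.

    The UI collects VRAM in GB, but the spec dict carries 'memory_mb',
    hence the * 1024 conversion; None signals 'no discrete GPU'.
    """
    if gpu_name and vram_gb:
        return [{"name": gpu_name, "memory_mb": int(vram_gb) * 1024}]
    return None

print(gpu_info_entry("NVIDIA RTX 4090", 24))
print(gpu_info_entry("", 24))
```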
 
  full_code_storage = gr.State(value="")
  prompt_storage = gr.State(value="")

+ def generate_and_store_code(gpu_vendor, gpu_series, gpu_model, vram_gb, ram_gb, platform, model_name, dtype_selection, width, height, inference_steps, unified_ram_gb):
  """Generate code and return code for display and full code for storage."""
  summary, full_code, actual_prompt = generate_with_combined_gpu_name(
  gpu_vendor, gpu_series, gpu_model, vram_gb, ram_gb, platform,
+ model_name, dtype_selection, width, height, inference_steps, unified_ram_gb
  )
  # Show the view prompt button after generation and close accordions
  return (full_code, full_code, False, gr.update(visible=True), actual_prompt,
 
  generate_and_store_code,
  inputs=[
  gpu_vendor, gpu_series, gpu_model, vram_gb, ram_gb, platform,
+ model_name, dtype_selection, width, height, inference_steps, unified_ram_gb
  ],
  outputs=[code_output, full_code_storage, code_collapsed, view_prompt_btn, prompt_storage, hardware_accordion, model_accordion]
  )
 
  hide_modal,
  outputs=[prompt_modal, prompt_display]
  )
+

 

  def main():
  """Launch the Gradio application."""
+ parser = argparse.ArgumentParser(description="Auto-Diffusers Code Generator")
+ parser.add_argument(
+ "--auto-hardware-detection",
+ action="store_true",
+ default=False,
+ help="Enable automatic hardware detection on startup (default: disabled)"
+ )
+ parser.add_argument(
+ "--no-auto-hardware-detection",
+ action="store_true",
+ help="Force-disable automatic hardware detection, overriding --auto-hardware-detection"
+ )
+ parser.add_argument(
+ "--port",
+ type=int,
+ default=7860,
+ help="Port to run the server on (default: 7860)"
+ )
+ parser.add_argument(
+ "--host",
+ type=str,
+ default="0.0.0.0",
+ help="Host to run the server on (default: 0.0.0.0)"
+ )
+ parser.add_argument(
+ "--no-share",
+ action="store_true",
+ help="Disable public sharing of the interface"
+ )
+
+ args = parser.parse_args()
+
+ # Handle auto hardware detection flag: enabled only when requested and not overridden
+ auto_hardware_detection = args.auto_hardware_detection and not args.no_auto_hardware_detection
+
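The flag pair above means detection runs only when `--auto-hardware-detection` is passed and `--no-auto-hardware-detection` is not. A minimal standalone reproduction of that interaction (stdlib `argparse` only; the `detection_enabled` wrapper is mine, added so the logic can be exercised with explicit argv lists):

```python
import argparse

# argparse turns dashes into underscores, so the two flags become
# args.auto_hardware_detection and args.no_auto_hardware_detection.
parser = argparse.ArgumentParser()
parser.add_argument("--auto-hardware-detection", action="store_true", default=False)
parser.add_argument("--no-auto-hardware-detection", action="store_true")

def detection_enabled(argv):
    args = parser.parse_args(argv)
    return args.auto_hardware_detection and not args.no_auto_hardware_detection

print(detection_enabled([]))                              # False: off by default
print(detection_enabled(["--auto-hardware-detection"]))   # True
print(detection_enabled(["--auto-hardware-detection",
                         "--no-auto-hardware-detection"]))  # False: override wins
```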
+ # Log startup configuration
+ print("🚀 Starting Auto-Diffusers Code Generator...")
+ print(f" Host: {args.host}")
+ print(f" Port: {args.port}")
+ print(f" Share: {not args.no_share}")
+ print(f" Auto Hardware Detection: {'Enabled' if auto_hardware_detection else 'Disabled'}")
+
  try:
+ interface = create_gradio_interface(auto_hardware_detection=auto_hardware_detection)
  interface.launch(
+ server_name=args.host,
+ server_port=args.port,
+ share=not args.no_share,
  show_error=True
  )
  except Exception as e: