Spaces:

cong182
/

firstAI

Sleeping

firstAI / test_fix.py

ndc8

Refactor model loading to utilize accelerate for device management; add test script to verify loading fix and prevent device conflicts

8a3c5dd 6 days ago

1.24 kB

	#!/usr/bin/env python3
	"""
	Quick test to verify the model loading fix works
	"""

	def test_model_loading_fix():
	"""Test that the accelerate conflict is resolved"""
	print("🔍 Model Loading Fix Verification")
	print("=" * 40)

	# Show the specific error that was fixed
	print("❌ Previous Error:")
	print(" 'The model has been loaded with `accelerate` and therefore")
	print(" cannot be moved to a specific device. Please discard the")
	print(" `device` argument when creating your pipeline object.'")

	print("\n🔧 Fix Applied:")
	print(" OLD: device_map='cpu', device=-1")
	print(" NEW: device_map='auto', no device specified")

	print("\n✅ Expected Result:")
	print(" • Model loads successfully with accelerate")
	print(" • No device conflicts")
	print(" • Auto-optimization for available hardware")
	print(" • Exit from demo mode")

	print("\n📋 Next Steps:")
	print(" 1. Deploy to HF Spaces")
	print(" 2. Check logs for successful model loading")
	print(" 3. Test /health endpoint (should show 'healthy')")
	print(" 4. Test /v1/chat/completions endpoint")

	if __name__ == "__main__":
	test_model_loading_fix()