Instructions to use kunaliitkgp09/improved-unified-multi-model-pt with libraries, inference providers, notebooks, and local apps. Follow these links to get started.

Libraries

How to use kunaliitkgp09/improved-unified-multi-model-pt with Transformers:

# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("text-generation", model="kunaliitkgp09/improved-unified-multi-model-pt")

# Load model directly
from transformers import AutoModel
model = AutoModel.from_pretrained("kunaliitkgp09/improved-unified-multi-model-pt", dtype="auto")

Notebooks
Google Colab
Kaggle
Local Apps

vLLM

How to use kunaliitkgp09/improved-unified-multi-model-pt with vLLM:

Install from pip and serve model

# Install vLLM from pip:
pip install vllm
# Start the vLLM server:
vllm serve "kunaliitkgp09/improved-unified-multi-model-pt"
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:8000/v1/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "kunaliitkgp09/improved-unified-multi-model-pt",
		"prompt": "Once upon a time,",
		"max_tokens": 512,
		"temperature": 0.5
	}'

Use Docker

docker model run hf.co/kunaliitkgp09/improved-unified-multi-model-pt

SGLang

How to use kunaliitkgp09/improved-unified-multi-model-pt with SGLang:

Install from pip and serve model

# Install SGLang from pip:
pip install sglang
# Start the SGLang server:
python3 -m sglang.launch_server \
    --model-path "kunaliitkgp09/improved-unified-multi-model-pt" \
    --host 0.0.0.0 \
    --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "kunaliitkgp09/improved-unified-multi-model-pt",
		"prompt": "Once upon a time,",
		"max_tokens": 512,
		"temperature": 0.5
	}'

Use Docker images

docker run --gpus all \
    --shm-size 32g \
    -p 30000:30000 \
    -v ~/.cache/huggingface:/root/.cache/huggingface \
    --env "HF_TOKEN=<secret>" \
    --ipc=host \
    lmsysorg/sglang:latest \
    python3 -m sglang.launch_server \
        --model-path "kunaliitkgp09/improved-unified-multi-model-pt" \
        --host 0.0.0.0 \
        --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "kunaliitkgp09/improved-unified-multi-model-pt",
		"prompt": "Once upon a time,",
		"max_tokens": 512,
		"temperature": 0.5
	}'

Docker Model Runner
How to use kunaliitkgp09/improved-unified-multi-model-pt with Docker Model Runner:
```
docker model run hf.co/kunaliitkgp09/improved-unified-multi-model-pt
```

improved-unified-multi-model-pt / test_improved_model.py

kunaliitkgp09

Upload test_improved_model.py with huggingface_hub

fd15b76 verified 10 months ago

raw

history blame contribute delete

10.2 kB

	#!/usr/bin/env python3
	"""
	Test the Improved Unified Multi-Model with Prompt Templates
	"""

	import asyncio
	import time
	import sys
	from pathlib import Path

	# Add current directory to path
	sys.path.append(str(Path(__file__).parent))

	from improved_unified_model_pt import ImprovedUnifiedMultiModelPT, ImprovedUnifiedModelConfig
	from prompt_template import PromptTemplates, TaskType, TestPrompt
	from test_suite import OrchestratorTester, TestResult

	class ImprovedModelWrapper:
	    """Adapter that exposes the improved model through an async ``process_request`` call."""

	    def __init__(self, model):
	        # Only ``model.process(prompt)`` is ever invoked on the wrapped object.
	        self.model = model

	    async def process_request(self, prompt):
	        """Run ``prompt`` through the wrapped model and package the outcome.

	        Returns an object carrying ``task_type`` (itself exposing ``.value``),
	        ``confidence``, ``success``, ``output`` and ``error_message``.
	        Any exception raised while processing is captured and reported via a
	        failed result (``success=False``) instead of propagating.
	        """
	        try:
	            raw = self.model.process(prompt)

	            # Success-shaped result built from the dict returned by the model.
	            class TaskResult:
	                def __init__(self, payload):
	                    read = payload.get
	                    # Lightweight stand-in object that only exposes ``.value``.
	                    holder_cls = type('TaskType', (), {'value': read('task_type', 'TEXT')})
	                    self.task_type = holder_cls()
	                    self.confidence = read('confidence', 0.5)
	                    self.success = True
	                    self.output = read('output', '')
	                    self.error_message = None

	            packaged = TaskResult(raw)
	            return packaged

	        except Exception as e:
	            # Failure-shaped result: same attribute set, flagged as unsuccessful.
	            class ErrorResult:
	                def __init__(self, failure):
	                    holder_cls = type('TaskType', (), {'value': 'ERROR'})
	                    self.task_type = holder_cls()
	                    self.confidence = 0.0
	                    self.success = False
	                    self.output = ''
	                    self.error_message = str(failure)

	            failed = ErrorResult(e)
	            return failed

	async def test_improved_model_with_prompts():
	    """Exercise the improved model against a sample of the prompt templates.

	    For each configured category a limited number of prompts is sent through
	    an ``ImprovedModelWrapper``; per-prompt details and aggregate statistics
	    are printed to stdout.

	    Returns:
	        A ``(results, model)`` tuple: the list of ``TestResult`` records that
	        were collected and the model instance that was created here.
	    """
	    print("🧪 Testing Improved Unified Model with Prompt Templates")
	    print("=" * 70)

	    # Build the model under test and the adapter used to call it.
	    print("📦 Creating and loading improved model...")
	    model = ImprovedUnifiedMultiModelPT(ImprovedUnifiedModelConfig())
	    adapter = ImprovedModelWrapper(model)

	    # (label, task type, how many prompts to sample) for each category.
	    plan = [
	        ("Text Processing", TaskType.TEXT, 3),
	        ("Image Captioning", TaskType.CAPTION, 3),
	        ("Text-to-Image", TaskType.TEXT2IMG, 3),
	        ("Reasoning", TaskType.REASONING, 3),
	        ("Multimodal", TaskType.MULTIMODAL, 2)
	    ]

	    results = []

	    for label, kind, limit in plan:
	        print(f"\n📝 Testing {label} ({limit} prompts):")
	        print("-" * 60)

	        selected = PromptTemplates.get_prompts_by_task_type(kind)[:limit]

	        for index, case in enumerate(selected, 1):
	            print(f"\n{index}. Testing: {case.prompt[:60]}...")

	            # Wall-clock timing around the single request.
	            began = time.time()
	            outcome = await adapter.process_request(case.prompt)
	            elapsed = time.time() - began

	            # Routing check: compare the expected and reported task values.
	            wanted = case.expected_task.value
	            got = outcome.task_type.value
	            routed_ok = wanted == got

	            if outcome.success:
	                status = "✅"
	            else:
	                status = "❌"
	            if routed_ok:
	                task_status = "✅"
	            else:
	                task_status = "❌"

	            print(f" {status} Success: {outcome.success}")
	            print(f" {task_status} Task: {got} (expected: {wanted})")
	            print(f" 📊 Confidence: {outcome.confidence:.2f}")
	            print(f" ⏱️ Time: {elapsed:.2f}s")

	            if outcome.output:
	                print(f" 📄 Output: {outcome.output[:100]}...")

	            if outcome.error_message:
	                print(f" ❌ Error: {outcome.error_message}")

	            # Keep a record for the aggregate statistics below.
	            results.append(
	                TestResult(
	                    prompt=case.prompt,
	                    expected_task=case.expected_task,
	                    actual_task=got,
	                    confidence=outcome.confidence,
	                    processing_time=elapsed,
	                    success=outcome.success,
	                    error_message=outcome.error_message,
	                    output=outcome.output
	                )
	            )

	    # Aggregate statistics; every ratio falls back to 0 when nothing ran.
	    total_tests = len(results)
	    successful_tests = sum(1 for rec in results if rec.success)
	    # NOTE(review): relies on TestResult exposing ``task_correct`` — confirm in test_suite.
	    correct_tasks = sum(1 for rec in results if rec.task_correct)

	    if total_tests > 0:
	        accuracy = correct_tasks / total_tests
	        success_rate = successful_tests / total_tests
	        avg_confidence = sum(rec.confidence for rec in results) / total_tests
	        avg_time = sum(rec.processing_time for rec in results) / total_tests
	    else:
	        accuracy = 0
	        success_rate = 0
	        avg_confidence = 0
	        avg_time = 0

	    print("\n📊 Overall Test Results:")
	    print("=" * 50)
	    print(f" Total Tests: {total_tests}")
	    print(f" Successful: {successful_tests}")
	    print(f" Task Accuracy: {accuracy:.1%}")
	    print(f" Success Rate: {success_rate:.1%}")
	    print(f" Avg Confidence: {avg_confidence:.2f}")
	    print(f" Avg Processing Time: {avg_time:.2f}s")

	    # Per-task breakdown, skipping task types that had no recorded results.
	    print("\n🎯 Task-Specific Results:")
	    print("-" * 40)
	    for kind in TaskType:
	        bucket = [rec for rec in results if rec.expected_task == kind]
	        if not bucket:
	            continue
	        hits = sum(1 for rec in bucket if rec.task_correct)
	        ratio = hits / len(bucket)
	        print(f" {kind.value}: {ratio:.1%} ({hits}/{len(bucket)})")

	    return results, model

	async def run_comprehensive_test(model):
	    """Run the test suite's basic tests against ``model`` and print a summary.

	    The model is wrapped in ``ImprovedModelWrapper`` and handed to
	    ``OrchestratorTester``; the object returned by ``run_basic_tests()`` is
	    printed field by field and then returned unchanged.
	    """
	    print("\n🧪 Running Comprehensive Test Suite")
	    print("=" * 60)

	    suite = OrchestratorTester(ImprovedModelWrapper(model))

	    # Only the basic functionality tests are executed here.
	    print("Running basic functionality tests...")
	    summary = await suite.run_basic_tests()

	    print("\n📊 Basic Test Results:")
	    print(f" Total Tests: {summary.total_tests}")
	    print(f" Passed: {summary.passed_tests}")
	    print(f" Failed: {summary.failed_tests}")
	    print(f" Accuracy: {summary.accuracy:.1%}")
	    print(f" Avg Confidence: {summary.average_confidence:.2f}")
	    print(f" Avg Processing Time: {summary.average_processing_time:.2f}s")

	    return summary

	async def interactive_test(model):
	    """Read prompts from stdin in a loop and print the model's response to each.

	    The loop ends when the user types ``quit``, ``exit`` or ``q``, presses
	    Ctrl-C, or when stdin reaches end-of-file. Blank input is ignored. Any
	    other exception raised while handling a prompt is printed and the loop
	    continues with the next prompt.

	    Args:
	        model: Object passed to ``ImprovedModelWrapper``; each prompt is sent
	            through the wrapper's ``process_request``.
	    """
	    print("\n🎮 Interactive Testing Mode")
	    print("=" * 50)
	    print("Enter your prompts (type 'quit' to exit):")
	    print("Example prompts:")
	    print(" - What is machine learning?")
	    print(" - Generate an image of a peaceful forest")
	    print(" - Describe this image of a sunset")
	    print(" - Explain step by step how neural networks work")
	    print()

	    wrapper = ImprovedModelWrapper(model)

	    while True:
	        try:
	            user_input = input("Enter prompt: ").strip()

	            if user_input.lower() in ('quit', 'exit', 'q'):
	                break

	            if not user_input:
	                continue

	            print(f"\n⏳ Processing: {user_input}")
	            start_time = time.time()

	            result = await wrapper.process_request(user_input)
	            processing_time = time.time() - start_time

	            print(f"✅ Task Type: {result.task_type.value}")
	            print(f"📊 Confidence: {result.confidence:.2f}")
	            print(f"⏱️ Processing Time: {processing_time:.2f}s")

	            if result.output:
	                print(f"📄 Output: {result.output}")

	            if result.error_message:
	                print(f"❌ Error: {result.error_message}")

	            print()

	        except (KeyboardInterrupt, EOFError):
	            # EOFError means stdin is closed or exhausted: input() would raise
	            # it again on every retry, so the generic handler below would loop
	            # forever. Leave the loop the same way Ctrl-C does.
	            print("\nExiting interactive mode...")
	            break
	        except Exception as e:
	            # Best-effort session: report the problem and keep prompting.
	            print(f"Error: {e}")

	def compare_with_original():
	    """Print routing results of a freshly built improved model for fixed prompts.

	    Each prompt is paired with the task-type string it is expected to be
	    routed to; the reported ``task_type`` and ``confidence`` are printed with
	    a pass/fail marker. Only the improved model is instantiated and exercised
	    here.
	    """
	    print("\n🔄 Comparing Improved vs Original Model")
	    print("=" * 50)

	    # (prompt text, expected task-type string)
	    cases = (
	        ("What is machine learning?", "TEXT"),
	        ("Generate an image of a peaceful forest", "TEXT2IMG"),
	        ("Describe this image of a sunset", "CAPTION"),
	        ("Explain step by step how neural networks work", "REASONING"),
	    )

	    print("Testing improved model routing...")
	    improved_model = ImprovedUnifiedMultiModelPT(ImprovedUnifiedModelConfig())

	    for text, wanted in cases:
	        print(f"\n🔍 Testing: {text}")
	        outcome = improved_model.process(text)
	        got = outcome['task_type']
	        if got == wanted:
	            mark = "✅"
	        else:
	            mark = "❌"
	        print(f" {mark} Expected: {wanted}, Actual: {got}, Confidence: {outcome['confidence']:.2f}")

	async def main():
	    """Run every test stage in order, then optionally start interactive mode.

	    Stages: prompt-template tests, the basic test suite, the routing
	    comparison, and finally a yes/no prompt for interactive testing. When
	    stdin is unavailable (end-of-file at the prompt) the interactive stage is
	    skipped instead of aborting the run.
	    """
	    print("🚀 Improved Unified Multi-Model Testing")
	    print("=" * 70)

	    # Test with prompt templates; only the model is reused by later stages.
	    _, model = await test_improved_model_with_prompts()

	    # Run comprehensive test (it prints its own summary).
	    await run_comprehensive_test(model)

	    # Compare with original
	    compare_with_original()

	    # Interactive testing option
	    print("\n" + "="*70)
	    print("🎮 Interactive Testing")
	    print("="*70)

	    try:
	        try_interactive = input("\nWould you like to try interactive testing? (y/n): ").strip().lower()
	    except EOFError:
	        # Non-interactive run (closed or piped stdin): treat it as "no" so the
	        # already-completed test stages are not followed by a traceback.
	        try_interactive = 'n'

	    if try_interactive in ('y', 'yes'):
	        await interactive_test(model)

	    print("\n🎉 Testing completed!")
	    print("📊 The improved model shows enhanced routing capabilities.")

	if __name__ == "__main__":
	    # Script entry point: drive the async ``main`` coroutine to completion.
	    asyncio.run(main())