{
"success": true,
"data": {
"id": "tmpl_abc123",
"name": "pytorch-distributed-training",
"description": "PyTorch distributed training environment with NCCL support",
"category": "ml",
"framework": "pytorch",
"version": "2.1.0",
"docker_image": "pytorch/pytorch:2.2-cuda12.1-devel",
"gpu_compatible": true,
"official": false,
"default_configuration": {
"gpu_type": "A100",
"gpu_count": 4,
"cpu_cores": 32,
"memory_gb": 256,
"storage_gb": 1000,
"estimated_hourly_cost": 10.00
},
"environment_variables": {
"NCCL_DEBUG": "INFO",
"CUDA_VISIBLE_DEVICES": "0,1,2,3",
"MASTER_ADDR": "localhost",
"MASTER_PORT": "12355",
"WORLD_SIZE": "4"
},
"startup_script": "#!/bin/bash\necho \"Starting distributed training environment\"\nnvidia-smi\npython -c \"import torch; print(f\\\"PyTorch version: {torch.__version__}\\\")\"",
"port_mappings": [
{
"internal_port": 6006,
"protocol": "tcp",
"description": "TensorBoard",
"required": false
},
{
"internal_port": 8888,
"protocol": "tcp",
"description": "Jupyter Lab",
"required": true
}
],
"required_packages": [
"tensorboard",
"wandb",
"transformers",
"datasets"
],
"software_versions": {
"python": "3.9",
"pytorch": "2.2.0",
"cuda": "12.1",
"cudnn": "8.8"
},
"resource_limits": {
"min_resources": {
"gpu_count": 1,
"cpu_cores": 8,
"memory_gb": 32,
"storage_gb": 100
},
"max_resources": {
"gpu_count": 8,
"cpu_cores": 128,
"memory_gb": 1024,
"storage_gb": 10000
}
},
"compatibility": {
"gpu_types": ["A100", "H100", "RTX4090", "V100"],
"regions": ["us-east-1", "us-west-2", "eu-west-1"],
"min_driver_version": "520.61.05"
},
"usage_statistics": {
"total_deployments": 1247,
"active_clusters": 34,
"average_rating": 4.7,
"success_rate": 98.3
},
"tags": ["pytorch", "distributed", "training", "gpu"],
"created_by": {
"user_id": "user_456",
"username": "ml_engineer",
"organization": "TensorOne"
},
"created_at": "2024-01-10T09:00:00Z",
"updated_at": "2024-01-14T15:30:00Z",
"is_public": false,
"is_deprecated": false
}
}