- Updated python_coding_microproject.csv to use NVIDIA NIM Kimi K2 - Updated kali_linux_shell_simulator.csv to use NVIDIA NIM Kimi K2 - Made more general-purpose (flexible targets, expanded tools) - Added nemotron-mini-agent.csv for fast local inference via Ollama - Added nemotron-agent.csv for advanced reasoning via Ollama - Added wiki page: Projects for NVIDIA NIMs and Nemotron
36 lines
1.4 KiB
SQL
36 lines
1.4 KiB
SQL
-- Migration: 027_assign_nvidia_models_to_tenants.sql
-- Description: Ensure NVIDIA models are assigned to all tenants (fix for partial 021 migration)
-- Date: 2025-12-08
-- Issue: Deploy.sh updates add models but don't assign them to existing tenants
|
|
|
|
-- Backfill tenant_model_configs: pair every tenant with every active model
-- whose provider is 'nvidia', enabled, at priority 5, using the rate-limit
-- payload below (1000 requests per minute).
--
-- Re-runnable: any (tenant_id, model_config_id) pair that already exists is
-- skipped by ON CONFLICT DO NOTHING, so pre-existing rows are left untouched
-- (their rate_limits / is_enabled values are NOT overwritten).
--
-- NOTE(review): the payload sets both "max_requests_per_hour": 1000 and
-- "requests_per_minute": 1000 (and both "concurrent_requests": 5 and
-- "max_concurrent": 10). Which keys the limiter actually reads is not visible
-- from this file -- confirm the effective limit is the intended one.
INSERT INTO tenant_model_configs (
    tenant_id,
    model_config_id,
    model_id,
    is_enabled,
    priority,
    rate_limits,
    created_at,
    updated_at
)
SELECT
    tn.id        AS tenant_id,
    mc.id        AS model_config_id,  -- model_configs primary key (UUID foreign key)
    mc.model_id  AS model_id,         -- string identifier, kept for easier queries
    TRUE         AS is_enabled,
    5            AS priority,
    CAST('{"max_requests_per_hour": 1000, "max_tokens_per_request": 4000, "concurrent_requests": 5, "max_cost_per_hour": 10.0, "requests_per_minute": 1000, "tokens_per_minute": 100000, "max_concurrent": 10}' AS json) AS rate_limits,
    CURRENT_TIMESTAMP AS created_at,
    CURRENT_TIMESTAMP AS updated_at
FROM model_configs AS mc
CROSS JOIN tenants AS tn
-- The WHERE clause is kept directly before ON CONFLICT so the trailing ON can
-- never be read as a join qualifier.
WHERE mc.provider = 'nvidia'
  AND mc.is_active
ON CONFLICT (tenant_id, model_config_id) DO NOTHING;
|
|
|
|
-- Emit a NOTICE recording that migration 027 ran.
-- The reported figure is the number of tenant_model_configs rows whose model
-- has provider 'nvidia'. There is no is_active filter here, so it counts every
-- such assignment currently in the table, not only rows inserted by this run.
DO $$
DECLARE
    nvidia_assignment_total INTEGER;
BEGIN
    nvidia_assignment_total := (
        SELECT COUNT(*)
        FROM model_configs AS mc
        INNER JOIN tenant_model_configs AS tmc
            ON tmc.model_config_id = mc.id
        WHERE mc.provider = 'nvidia'
    );

    RAISE NOTICE 'Migration 027: Ensured NVIDIA models are assigned to all tenants (% total assignments)', nvidia_assignment_total;
END $$;
|