mirror of
https://github.com/simstudioai/sim.git
synced 2026-04-06 03:00:16 -04:00
* feat(timeouts): execution timeout limits * fix type issues * add to docs * update stale exec cleanup route * update more callsites * update tests * address bugbot comments * remove import expression * support streaming and async paths' * fix streaming path * add hitl and workflow handler * make sync path match * consolidate * timeout errors * validation errors typed * import order * Merge staging into feat/timeout-lims Resolved conflicts: - stt/route.ts: Keep both execution timeout and security imports - textract/parse/route.ts: Keep both execution timeout and validation imports - use-workflow-execution.ts: Keep cancellation console entry from feature branch - input-validation.ts: Remove server functions (moved to .server.ts in staging) - tools/index.ts: Keep execution timeout, use .server import for security * make run from block consistent * revert console update change * fix subflow errors * clean up base 64 cache correctly * update docs * consolidate workflow execution and run from block hook code * remove unused constant * fix cleanup base64 sse * fix run from block tracespan
145 lines
4.2 KiB
TypeScript
145 lines
4.2 KiB
TypeScript
import { createLogger } from '@sim/logger'
|
|
import type { NextRequest } from 'next/server'
|
|
import { NextResponse } from 'next/server'
|
|
import { checkInternalAuth } from '@/lib/auth/hybrid'
|
|
import { DEFAULT_EXECUTION_TIMEOUT_MS } from '@/lib/core/execution-limits'
|
|
import { validateAlphanumericId } from '@/lib/core/security/input-validation'
|
|
import { getBaseUrl } from '@/lib/core/utils/urls'
|
|
import { StorageService } from '@/lib/uploads'
|
|
|
|
const logger = createLogger('ProxyTTSAPI')
|
|
|
|
export async function POST(request: NextRequest) {
|
|
try {
|
|
const authResult = await checkInternalAuth(request, { requireWorkflowId: false })
|
|
if (!authResult.success) {
|
|
logger.error('Authentication failed for TTS proxy:', authResult.error)
|
|
return NextResponse.json({ error: 'Unauthorized' }, { status: 401 })
|
|
}
|
|
|
|
const body = await request.json()
|
|
const {
|
|
text,
|
|
voiceId,
|
|
apiKey,
|
|
modelId = 'eleven_monolingual_v1',
|
|
workspaceId,
|
|
workflowId,
|
|
executionId,
|
|
} = body
|
|
|
|
if (!text || !voiceId || !apiKey) {
|
|
return NextResponse.json({ error: 'Missing required parameters' }, { status: 400 })
|
|
}
|
|
|
|
const voiceIdValidation = validateAlphanumericId(voiceId, 'voiceId', 255)
|
|
if (!voiceIdValidation.isValid) {
|
|
logger.error(`Invalid voice ID: ${voiceIdValidation.error}`)
|
|
return NextResponse.json({ error: voiceIdValidation.error }, { status: 400 })
|
|
}
|
|
|
|
// Check if this is an execution context (from workflow tool execution)
|
|
const hasExecutionContext = workspaceId && workflowId && executionId
|
|
logger.info('Proxying TTS request for voice:', {
|
|
voiceId,
|
|
hasExecutionContext,
|
|
workspaceId,
|
|
workflowId,
|
|
executionId,
|
|
})
|
|
|
|
const endpoint = `https://api.elevenlabs.io/v1/text-to-speech/${voiceId}`
|
|
|
|
const response = await fetch(endpoint, {
|
|
method: 'POST',
|
|
headers: {
|
|
Accept: 'audio/mpeg',
|
|
'Content-Type': 'application/json',
|
|
'xi-api-key': apiKey,
|
|
},
|
|
body: JSON.stringify({
|
|
text,
|
|
model_id: modelId,
|
|
}),
|
|
signal: AbortSignal.timeout(DEFAULT_EXECUTION_TIMEOUT_MS),
|
|
})
|
|
|
|
if (!response.ok) {
|
|
logger.error(`Failed to generate TTS: ${response.status} ${response.statusText}`)
|
|
return NextResponse.json(
|
|
{ error: `Failed to generate TTS: ${response.status} ${response.statusText}` },
|
|
{ status: response.status }
|
|
)
|
|
}
|
|
|
|
const audioBlob = await response.blob()
|
|
|
|
if (audioBlob.size === 0) {
|
|
logger.error('Empty audio received from ElevenLabs')
|
|
return NextResponse.json({ error: 'Empty audio received' }, { status: 422 })
|
|
}
|
|
|
|
const audioBuffer = Buffer.from(await audioBlob.arrayBuffer())
|
|
const timestamp = Date.now()
|
|
|
|
// Use execution storage for workflow tool calls, copilot for chat UI
|
|
if (hasExecutionContext) {
|
|
const { uploadExecutionFile } = await import('@/lib/uploads/contexts/execution')
|
|
const fileName = `tts-${timestamp}.mp3`
|
|
|
|
const userFile = await uploadExecutionFile(
|
|
{
|
|
workspaceId,
|
|
workflowId,
|
|
executionId,
|
|
},
|
|
audioBuffer,
|
|
fileName,
|
|
'audio/mpeg',
|
|
authResult.userId
|
|
)
|
|
|
|
logger.info('TTS audio stored in execution context:', {
|
|
executionId,
|
|
fileName,
|
|
size: userFile.size,
|
|
})
|
|
|
|
return NextResponse.json({
|
|
audioFile: userFile,
|
|
audioUrl: userFile.url,
|
|
})
|
|
}
|
|
|
|
// Chat UI usage - no execution context, use copilot context
|
|
const fileName = `tts-${timestamp}.mp3`
|
|
const fileInfo = await StorageService.uploadFile({
|
|
file: audioBuffer,
|
|
fileName,
|
|
contentType: 'audio/mpeg',
|
|
context: 'copilot',
|
|
})
|
|
|
|
const audioUrl = `${getBaseUrl()}${fileInfo.path}`
|
|
|
|
logger.info('TTS audio stored in copilot context (chat UI):', {
|
|
fileName,
|
|
size: fileInfo.size,
|
|
})
|
|
|
|
return NextResponse.json({
|
|
audioUrl,
|
|
size: fileInfo.size,
|
|
})
|
|
} catch (error) {
|
|
logger.error('Error proxying TTS:', error)
|
|
|
|
return NextResponse.json(
|
|
{
|
|
error: `Internal Server Error: ${error instanceof Error ? error.message : 'Unknown error'}`,
|
|
},
|
|
{ status: 500 }
|
|
)
|
|
}
|
|
}
|