Files
sim/apps/sim/app/api/tools/tts/route.ts
Vikhyath Mondreti a627faabe7 feat(timeouts): execution timeout limits (#3120)
* feat(timeouts): execution timeout limits

* fix type issues

* add to docs

* update stale exec cleanup route

* update more callsites

* update tests

* address bugbot comments

* remove import expression

* support streaming and async paths'

* fix streaming path

* add hitl and workflow handler

* make sync path match

* consolidate

* timeout errors

* validation errors typed

* import order

* Merge staging into feat/timeout-lims

Resolved conflicts:
- stt/route.ts: Keep both execution timeout and security imports
- textract/parse/route.ts: Keep both execution timeout and validation imports
- use-workflow-execution.ts: Keep cancellation console entry from feature branch
- input-validation.ts: Remove server functions (moved to .server.ts in staging)
- tools/index.ts: Keep execution timeout, use .server import for security

* make run from block consistent

* revert console update change

* fix subflow errors

* clean up base 64 cache correctly

* update docs

* consolidate workflow execution and run from block hook code

* remove unused constant

* fix cleanup base64 sse

* fix run from block tracespan
2026-02-04 10:26:36 -08:00

145 lines
4.2 KiB
TypeScript

import { createLogger } from '@sim/logger'
import type { NextRequest } from 'next/server'
import { NextResponse } from 'next/server'
import { checkInternalAuth } from '@/lib/auth/hybrid'
import { DEFAULT_EXECUTION_TIMEOUT_MS } from '@/lib/core/execution-limits'
import { validateAlphanumericId } from '@/lib/core/security/input-validation'
import { getBaseUrl } from '@/lib/core/utils/urls'
import { StorageService } from '@/lib/uploads'
const logger = createLogger('ProxyTTSAPI')
export async function POST(request: NextRequest) {
try {
const authResult = await checkInternalAuth(request, { requireWorkflowId: false })
if (!authResult.success) {
logger.error('Authentication failed for TTS proxy:', authResult.error)
return NextResponse.json({ error: 'Unauthorized' }, { status: 401 })
}
const body = await request.json()
const {
text,
voiceId,
apiKey,
modelId = 'eleven_monolingual_v1',
workspaceId,
workflowId,
executionId,
} = body
if (!text || !voiceId || !apiKey) {
return NextResponse.json({ error: 'Missing required parameters' }, { status: 400 })
}
const voiceIdValidation = validateAlphanumericId(voiceId, 'voiceId', 255)
if (!voiceIdValidation.isValid) {
logger.error(`Invalid voice ID: ${voiceIdValidation.error}`)
return NextResponse.json({ error: voiceIdValidation.error }, { status: 400 })
}
// Check if this is an execution context (from workflow tool execution)
const hasExecutionContext = workspaceId && workflowId && executionId
logger.info('Proxying TTS request for voice:', {
voiceId,
hasExecutionContext,
workspaceId,
workflowId,
executionId,
})
const endpoint = `https://api.elevenlabs.io/v1/text-to-speech/${voiceId}`
const response = await fetch(endpoint, {
method: 'POST',
headers: {
Accept: 'audio/mpeg',
'Content-Type': 'application/json',
'xi-api-key': apiKey,
},
body: JSON.stringify({
text,
model_id: modelId,
}),
signal: AbortSignal.timeout(DEFAULT_EXECUTION_TIMEOUT_MS),
})
if (!response.ok) {
logger.error(`Failed to generate TTS: ${response.status} ${response.statusText}`)
return NextResponse.json(
{ error: `Failed to generate TTS: ${response.status} ${response.statusText}` },
{ status: response.status }
)
}
const audioBlob = await response.blob()
if (audioBlob.size === 0) {
logger.error('Empty audio received from ElevenLabs')
return NextResponse.json({ error: 'Empty audio received' }, { status: 422 })
}
const audioBuffer = Buffer.from(await audioBlob.arrayBuffer())
const timestamp = Date.now()
// Use execution storage for workflow tool calls, copilot for chat UI
if (hasExecutionContext) {
const { uploadExecutionFile } = await import('@/lib/uploads/contexts/execution')
const fileName = `tts-${timestamp}.mp3`
const userFile = await uploadExecutionFile(
{
workspaceId,
workflowId,
executionId,
},
audioBuffer,
fileName,
'audio/mpeg',
authResult.userId
)
logger.info('TTS audio stored in execution context:', {
executionId,
fileName,
size: userFile.size,
})
return NextResponse.json({
audioFile: userFile,
audioUrl: userFile.url,
})
}
// Chat UI usage - no execution context, use copilot context
const fileName = `tts-${timestamp}.mp3`
const fileInfo = await StorageService.uploadFile({
file: audioBuffer,
fileName,
contentType: 'audio/mpeg',
context: 'copilot',
})
const audioUrl = `${getBaseUrl()}${fileInfo.path}`
logger.info('TTS audio stored in copilot context (chat UI):', {
fileName,
size: fileInfo.size,
})
return NextResponse.json({
audioUrl,
size: fileInfo.size,
})
} catch (error) {
logger.error('Error proxying TTS:', error)
return NextResponse.json(
{
error: `Internal Server Error: ${error instanceof Error ? error.message : 'Unknown error'}`,
},
{ status: 500 }
)
}
}