'use strict'; const TOOLS_WRAPPER_PATTERN = /]*>([\s\S]*?)<\/tool_calls>/gi; const TOOL_CALL_MARKUP_BLOCK_PATTERN = /<(?:[a-z0-9_:-]+:)?invoke\b([^>]*)>([\s\S]*?)<\/(?:[a-z0-9_:-]+:)?invoke>/gi; const PARAMETER_BLOCK_PATTERN = /<(?:[a-z0-9_:-]+:)?parameter\b([^>]*)>([\s\S]*?)<\/(?:[a-z0-9_:-]+:)?parameter>/gi; const TOOL_CALL_MARKUP_KV_PATTERN = /<(?:[a-z0-9_:-]+:)?([a-z0-9_.-]+)\b[^>]*>([\s\S]*?)<\/(?:[a-z0-9_:-]+:)?\1>/gi; const CDATA_PATTERN = /^$/i; const XML_ATTR_PATTERN = /\b([a-z0-9_:-]+)\s*=\s*("([^"]*)"|'([^']*)')/gi; const { toStringSafe, } = require('./state'); function stripFencedCodeBlocks(text) { const t = typeof text === 'string' ? text : ''; if (!t) { return ''; } return t.replace(/```[\s\S]*?```/g, ' '); } function parseMarkupToolCalls(text) { const raw = toStringSafe(text).trim(); if (!raw) { return []; } const out = []; for (const wrapper of raw.matchAll(TOOLS_WRAPPER_PATTERN)) { const body = toStringSafe(wrapper[1]); for (const block of body.matchAll(TOOL_CALL_MARKUP_BLOCK_PATTERN)) { const parsed = parseMarkupSingleToolCall(block); if (parsed) { out.push(parsed); } } } return out; } function parseMarkupSingleToolCall(block) { const attrs = parseTagAttributes(block[1]); const name = toStringSafe(attrs.name).trim(); if (!name) { return null; } const inner = toStringSafe(block[2]).trim(); if (inner) { try { const decoded = JSON.parse(inner); if (decoded && typeof decoded === 'object' && !Array.isArray(decoded)) { return { name, input: decoded.input && typeof decoded.input === 'object' && !Array.isArray(decoded.input) ? decoded.input : decoded.parameters && typeof decoded.parameters === 'object' && !Array.isArray(decoded.parameters) ? decoded.parameters : {}, }; } } catch (_err) { // Not JSON, continue with markup parsing. } } const input = {}; for (const match of inner.matchAll(PARAMETER_BLOCK_PATTERN)) { const parameterAttrs = parseTagAttributes(match[1]); const paramName = toStringSafe(parameterAttrs.name).trim(); if (!paramName) { continue; } appendMarkupValue(input, paramName, parseMarkupValue(match[2])); } if (Object.keys(input).length === 0 && inner.trim() !== '') { return null; } return { name, input }; } function parseMarkupInput(raw) { const s = toStringSafe(raw).trim(); if (!s) { return {}; } // Prioritize XML-style KV tags (e.g., val) const kv = parseMarkupKVObject(s); if (Object.keys(kv).length > 0) { return kv; } // Fallback to JSON parsing const parsed = parseToolCallInput(s); if (parsed && typeof parsed === 'object' && !Array.isArray(parsed)) { if (Object.keys(parsed).length > 0) { return parsed; } } return { _raw: extractRawTagValue(s) }; } function parseMarkupKVObject(text) { const raw = toStringSafe(text).trim(); if (!raw) { return {}; } const out = {}; for (const m of raw.matchAll(TOOL_CALL_MARKUP_KV_PATTERN)) { const key = toStringSafe(m[1]).trim(); if (!key) { continue; } const value = parseMarkupValue(m[2]); if (value === undefined || value === null) { continue; } appendMarkupValue(out, key, value); } return out; } function parseMarkupValue(raw) { const s = toStringSafe(extractRawTagValue(raw)).trim(); if (!s) { return ''; } if (s.includes('<') && s.includes('>')) { const nested = parseMarkupInput(s); if (nested && typeof nested === 'object' && !Array.isArray(nested)) { if (isOnlyRawValue(nested)) { return toStringSafe(nested._raw); } return nested; } } if (s.startsWith('{') || s.startsWith('[')) { try { return JSON.parse(s); } catch (_err) { return s; } } return s; } function extractRawTagValue(inner) { const s = toStringSafe(inner).trim(); if (!s) { return ''; } // 1. Check for CDATA const cdataMatch = s.match(CDATA_PATTERN); if (cdataMatch && cdataMatch[1] !== undefined) { return cdataMatch[1]; } // 2. Fallback to unescaping standard HTML entities // Note: we avoid broad tag stripping here to preserve user content (like < symbols in code) return unescapeHtml(inner); } function unescapeHtml(safe) { if (!safe) return ''; return safe.replace(/&/g, '&') .replace(/</g, '<') .replace(/>/g, '>') .replace(/"/g, '"') .replace(/'/g, "'") .replace(/'/g, "'"); } function parseTagAttributes(raw) { const source = toStringSafe(raw); const out = {}; if (!source) { return out; } for (const match of source.matchAll(XML_ATTR_PATTERN)) { const key = toStringSafe(match[1]).trim().toLowerCase(); if (!key) { continue; } out[key] = match[3] || match[4] || ''; } return out; } function parseToolCallInput(v) { if (v == null) { return {}; } if (typeof v === 'string') { const raw = toStringSafe(v); if (!raw) { return {}; } try { const parsed = JSON.parse(raw); if (parsed && typeof parsed === 'object' && !Array.isArray(parsed)) { return parsed; } return { _raw: raw }; } catch (_err) { return { _raw: raw }; } } if (typeof v === 'object' && !Array.isArray(v)) { return v; } try { const parsed = JSON.parse(JSON.stringify(v)); if (parsed && typeof parsed === 'object' && !Array.isArray(parsed)) { return parsed; } } catch (_err) { return {}; } return {}; } function appendMarkupValue(out, key, value) { if (Object.prototype.hasOwnProperty.call(out, key)) { const current = out[key]; if (Array.isArray(current)) { current.push(value); return; } out[key] = [current, value]; return; } out[key] = value; } function isOnlyRawValue(obj) { if (!obj || typeof obj !== 'object' || Array.isArray(obj)) { return false; } const keys = Object.keys(obj); return keys.length === 1 && keys[0] === '_raw'; } module.exports = { stripFencedCodeBlocks, parseMarkupToolCalls, };