DollhouseMCP

Official

AGPL 3.0

330

mcp-server
scripts

fix-element-formatting.ts•10.6 kB

#!/usr/bin/env ts-node
/**
 * Fix Element File Formatting
 *
 * Fixes element files (skills, personas, templates, agents) that have their markdown
 * content stored as single long lines without proper newlines.
 *
 * Issue: #1387
 *
 * Usage:
 *   npx ts-node scripts/fix-element-formatting.ts --dry-run  # Preview changes
 *   npx ts-node scripts/fix-element-formatting.ts            # Apply changes
 */

import * as fs from 'node:fs';
import * as os from 'node:os';
import * as path from 'node:path';
import * as process from 'node:process';

/** Per-directory (and accumulated) result counters. */
interface ProcessingStats {
  fixed: number;
  skipped: number;
  errors: number;
}

/** Line indices of the opening and closing `---` fence lines of the frontmatter. */
interface FrontmatterBounds {
  start: number;
  end: number;
}

/** Average body line length (in characters) above which a file is considered collapsed. */
const LONG_LINE_THRESHOLD = 200;

/** Bodies longer than this many characters are left untouched by the formatter. */
const MAX_CONTENT_LENGTH = 100000;

/**
 * Locate the frontmatter fences: the first line that trims to `---` opens the
 * frontmatter and the next such line closes it.
 *
 * @param lines - File content split on `\n`.
 * @returns The fence line indices, or `undefined` when fewer than two fences exist.
 */
function findFrontmatter(lines: readonly string[]): FrontmatterBounds | undefined {
  const isFence = (line: string): boolean => line.trim() === '---';

  const start = lines.findIndex(isFence);
  if (start === -1) {
    return undefined;
  }

  const end = lines.findIndex((line, index) => index > start && isFence(line));
  return end === -1 ? undefined : { start, end };
}

/**
 * Check if a file needs formatting based on the average line length of the
 * section that follows the frontmatter.
 *
 * @param filePath - File to inspect; only read when `content` is omitted.
 * @param content - Already-loaded file text. Passing it avoids a second read and
 *   lets the caller handle read errors itself.
 * @returns `true` when the body's average non-blank line length exceeds
 *   {@link LONG_LINE_THRESHOLD}; `false` for files without frontmatter, without
 *   body text, or (when `content` is omitted) files that cannot be read.
 */
function needsFormatting(filePath: string, content?: string): boolean {
  let text: string;
  try {
    text = content ?? fs.readFileSync(filePath, 'utf-8');
  } catch {
    // Deliberate best-effort: an unreadable file is reported as "no formatting needed".
    // Callers that must surface read errors should read the file and pass `content`.
    return false;
  }

  const lines = text.split('\n');
  const bounds = findFrontmatter(lines);
  if (bounds === undefined) {
    // No frontmatter found - file might be malformed or not an element file
    return false;
  }

  // Only the section after the closing fence is measured.
  const bodyLines = lines.slice(bounds.end + 1);
  const bodyText = bodyLines.join('\n').trim();
  if (bodyText.length === 0) {
    return false;
  }

  // Non-empty trimmed text guarantees at least one non-blank line, so no division by zero.
  const nonBlankLineCount = bodyLines.filter((line) => line.trim().length > 0).length;
  return bodyText.length / nonBlankLineCount > LONG_LINE_THRESHOLD;
}

/**
 * Format markdown content by adding proper newlines.
 *
 * The content is typically one long line with headers, code blocks, etc. all smashed together.
 * Example: "Skill## PurposeAutomated workflow...### 1. Content Ingestion..."
 *
 * Security: every pattern uses bounded quantifiers and avoids nested/overlapping
 * quantifiers, to keep matching cost predictable on maliciously-crafted element files.
 *
 * Global-flag `replace` is used throughout; with a `g` regex it is equivalent to
 * `replaceAll` and does not require the ES2021 string library.
 *
 * @param content - Markdown body (without frontmatter).
 * @returns The reformatted body ending in exactly one newline. Empty input and input
 *   longer than {@link MAX_CONTENT_LENGTH} characters are returned unchanged.
 */
function formatMarkdownContent(content: string): string {
  if (!content) {
    return content;
  }

  // Security: Guard against excessively large files that could cause performance issues
  if (content.length > MAX_CONTENT_LENGTH) {
    console.warn(` ⚠️ Content too large (${content.length} chars), skipping formatting for safety`);
    return content;
  }

  let formatted = content;

  // Step 1: Add a blank line before markdown headers glued to the preceding text.
  formatted = formatted.replace(/([^\s])(#{1,6}\s)/g, '$1\n\n$2');

  // Step 1b: Split header text from a following capitalised word
  // (e.g. "## PurposeAutomated"). The {1,500} bound and lazy match limit backtracking.
  formatted = formatted.replace(/(#{1,6}\s+[^\n]{1,500}?[a-z])([A-Z][a-z])/g, '$1\n\n$2');

  // Step 2: Add a blank line before code fences glued to the preceding text.
  formatted = formatted.replace(/([^\s])(```)/g, '$1\n\n$2');

  // Step 3: Add a blank line after a fence that is followed by a letter.
  // NOTE(review): this also matches an OPENING fence with an info string
  // ("```bash" -> "```\n\nbash"); confirm that is acceptable for the affected files.
  formatted = formatted.replace(/(```)\s{0,10}([a-zA-Z])/g, '$1\n\n$2');

  // Step 4: Split code block language labels glued to the previous word
  // (e.g. "Pipelineyaml" -> "Pipeline\n\nyaml"). Kept as two patterns to limit
  // per-regex complexity.
  // NOTE(review): any word that merely ends in one of these labels and is followed by
  // whitespace is split too (e.g. "publish " -> "publi\n\nsh ", "trust " -> "t\n\nrust ").
  formatted = formatted.replace(
    /([a-z])(yaml|json|javascript|typescript|python|bash|sh|shell|ruby|go|rust|java)(?=\s|$)/gi,
    '$1\n\n$2'
  );
  formatted = formatted.replace(
    /([a-z])(cpp|sql|css|html|xml|php|perl|swift|kotlin|scala|powershell)(?=\s|$)/gi,
    '$1\n\n$2'
  );

  // Step 5: Put bullet and numbered list items on their own paragraph.
  //   \s{0,10}  at most 10 whitespace chars before the marker
  //   \d{1,4}   at most 4 digits (lists up to 9999 items)
  //   \s{1,10}  at most 10 whitespace chars after the marker
  formatted = formatted.replace(/([^\s])\s{0,10}([-*]\s{1,10}[a-zA-Z])/g, '$1\n\n$2');
  formatted = formatted.replace(/([^\s])\s{0,10}(\d{1,4}\.\s{1,10}[a-zA-Z])/g, '$1\n\n$2');

  // Step 6: Reduce excessive newlines (max 2 consecutive)
  formatted = formatted.replace(/\n{3,}/g, '\n\n');

  // Step 7: Break after colons that are followed by 2-20 whitespace characters.
  // NOTE(review): `\s` also matches newlines, so a colon followed by the blank line
  // inserted by the steps above (":\n\n") is rewritten to ":\n " as well.
  formatted = formatted.replace(/:\s{2,20}/g, ':\n ');

  // Step 8: Ensure single trailing newline
  return formatted.trim() + '\n';
}

/**
 * Process an individual element file.
 *
 * The file is read once; everything up to and including the closing frontmatter
 * fence is written back verbatim and only the body after it is reformatted.
 *
 * @param filePath - Element file to process.
 * @param dryRun - When `true`, the file is analysed but never written.
 * @returns `true` when the file was (or, in dry-run mode, would be) rewritten.
 * @throws Propagates read/write errors so that the caller can report and count them.
 */
function processFile(filePath: string, dryRun: boolean): boolean {
  const original = fs.readFileSync(filePath, 'utf-8');
  if (!needsFormatting(filePath, original)) {
    return false;
  }

  const lines = original.split('\n');
  const bounds = findFrontmatter(lines);
  if (bounds === undefined) {
    console.log(` ⚠️ No valid frontmatter: ${path.basename(filePath)}`);
    return false;
  }

  // Keep every line through the closing fence, including anything that precedes the
  // opening fence, so the rewrite never discards text outside the body.
  const headLines = lines.slice(0, bounds.end + 1);
  const bodyText = lines.slice(bounds.end + 1).join('\n').trim();

  const formattedBody = formatMarkdownContent(bodyText);
  if (formattedBody === bodyText) {
    // Formatter declined to change anything (e.g. body too large).
    return false;
  }

  if (!dryRun) {
    fs.writeFileSync(filePath, headLines.join('\n') + '\n' + formattedBody, 'utf-8');
  }
  return true;
}

/**
 * Process all `.md` files in a directory, in sorted order.
 *
 * @param dirPath - Directory to scan (non-recursive).
 * @param dryRun - Forwarded to {@link processFile}.
 * @returns Accumulated statistics for all files processed; all zeros when the
 *   directory does not exist.
 */
function processDirectory(dirPath: string, dryRun: boolean): ProcessingStats {
  const stats: ProcessingStats = { fixed: 0, skipped: 0, errors: 0 };

  if (!fs.existsSync(dirPath)) {
    return stats;
  }

  const files = fs
    .readdirSync(dirPath)
    .filter((f: string) => f.endsWith('.md'))
    .sort();

  console.log(`\n📁 ${path.basename(dirPath)} (${files.length} files)`);

  for (const file of files) {
    try {
      if (processFile(path.join(dirPath, file), dryRun)) {
        console.log(` ✅ ${file}`);
        stats.fixed++;
      } else {
        stats.skipped++;
      }
    } catch (error) {
      // One bad file must not abort the batch: log it and count it for the summary.
      const errorMsg = error instanceof Error ? error.message : String(error);
      console.error(` ❌ ${file}: ${errorMsg}`);
      stats.errors++;
    }
  }

  return stats;
}

/**
 * Main execution: formats every element directory under `~/.dollhouse/portfolio`
 * and prints a summary. Pass `--dry-run` to preview without writing.
 */
function main(): void {
  const dryRun = process.argv.slice(2).includes('--dry-run');

  // HOME keeps precedence; os.homedir() covers platforms where HOME is not set.
  const homeDir = process.env.HOME || os.homedir();
  const portfolioPath = path.join(homeDir, '.dollhouse/portfolio');

  const rule = '═'.repeat(60);

  console.log(rule);
  console.log('🔧 Element File Formatter - Issue #1387');
  console.log(rule);

  if (dryRun) {
    console.log('\n🔍 DRY RUN MODE - No files will be modified');
  }

  if (!fs.existsSync(portfolioPath)) {
    console.error(`\n❌ Portfolio directory not found: ${portfolioPath}`);
    process.exit(1);
  }

  const elementTypes = ['skills', 'personas', 'templates', 'agents'];
  const totalStats: ProcessingStats = { fixed: 0, skipped: 0, errors: 0 };

  for (const type of elementTypes) {
    const stats = processDirectory(path.join(portfolioPath, type), dryRun);
    totalStats.fixed += stats.fixed;
    totalStats.skipped += stats.skipped;
    totalStats.errors += stats.errors;
  }

  console.log('\n' + rule);
  console.log('📊 Summary');
  console.log(rule);
  console.log(`✅ Fixed: ${totalStats.fixed} files`);
  console.log(`⏭️ Skipped: ${totalStats.skipped} files (already formatted)`);
  console.log(`❌ Errors: ${totalStats.errors} files`);

  if (totalStats.fixed > 0) {
    console.log(
      dryRun
        ? '\n💡 Run without --dry-run to apply changes'
        : '\n✨ Files have been formatted successfully!'
    );
  }

  console.log(rule);
}

main();

Latest Blog Posts

The 50MB Markdown Files That Broke Our Server
By punkpeye on December 3, 2025.
react
react-router
node-js
OpenTelemetry for Model Context Protocol (MCP) Analytics and Agent Observability
By Om-Shree-0709 on November 29, 2025.
observability
mcp
opentelemetry
Securing Enterprise AI Agents with Unique Identities in the Model Context Protocol (MCP)
By Om-Shree-0709 on November 27, 2025.

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/DollhouseMCP/mcp-server'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.