fix: improve markdown parser for tables, headings, and line breaks

2026-04-10 10:09:46 +00:00
parent 925920eee1
commit bfc85648db
2 changed files with 202 additions and 33 deletions
--- a/src/frontend/src/lib/components/ChatInterface.svelte
+++ b/src/frontend/src/lib/components/ChatInterface.svelte
@@ -124,6 +124,31 @@
 									<li>{item}</li>
 								{/each}
 							</ul>
+						{:else if segment.type === 'table' && segment.headers && segment.rows}
+							<div class="table-wrapper">
+								<table class="markdown-table">
+									<thead>
+									<tr>
+										{#each segment.headers as header}
+											<th>{header}</th>
+										{/each}
+									</tr>
+								</thead>
+								<tbody>
+									{#each segment.rows as row}
+										<tr>
+											{#each row as cell}
+												<td>{cell}</td>
+											{/each}
+									</tr>
+									{/each}
+								</tbody>
+							</table>
+							</div>
+						{:else if segment.type === 'heading'}
+							<h4 class="content-heading">{segment.content}</h4>
+						{:else if segment.type === 'lineBreak'}
+							<br />
 						{:else}
 							{segment.content}
 						{/if}
@@ -410,6 +435,52 @@
 		text-decoration: none;
 	}

+	.content-heading { /* <h4> emitted for 'heading' segments */
+		font-size: 1rem;
+		font-weight: 600;
+		margin: 1rem 0 0.5rem;
+		color: #fff;
+	}
+
+	.content-heading:first-child { /* no top gap when the heading is the first child */
+		margin-top: 0;
+	}
+
+	.table-wrapper { /* wide tables scroll horizontally inside the wrapper */
+		overflow-x: auto;
+		margin: 0.75rem 0;
+	}
+
+	.markdown-table {
+		border-collapse: collapse;
+		width: 100%;
+		font-size: 0.85rem;
+		background: rgba(0, 0, 0, 0.2);
+		border-radius: 6px; /* NOTE(review): may not take effect together with border-collapse: collapse - confirm in target browsers */
+		overflow: hidden;
+	}
+
+	.markdown-table th,
+	.markdown-table td {
+		padding: 0.5rem 0.75rem;
+		text-align: left;
+		border-bottom: 1px solid rgba(255, 255, 255, 0.1); /* row divider */
+	}
+
+	.markdown-table th {
+		background: rgba(102, 126, 234, 0.2);
+		font-weight: 600;
+		color: #667eea;
+	}
+
+	.markdown-table tr:last-child td { /* the last row needs no divider below it */
+		border-bottom: none;
+	}
+
+	.markdown-table tr:hover td { /* highlight the hovered body row */
+		background: rgba(255, 255, 255, 0.05);
+	}
+
 	a:hover {
 		text-decoration: underline;
 	}
--- a/src/frontend/src/lib/utils/markdown.ts
+++ b/src/frontend/src/lib/utils/markdown.ts
@@ -1,18 +1,23 @@
 /**
 * Simple markdown parser for rendering AI responses
- * Supports: bold, italic, code blocks, inline code, links, lists, headings
+ * Supports: bold, italic, code blocks, inline code, links, lists, tables, headings, line breaks
 */

 interface ParsedSegment {
-	type: 'text' | 'bold' | 'italic' | 'code' | 'codeBlock' | 'link' | 'list';
+	type: 'text' | 'bold' | 'italic' | 'code' | 'codeBlock' | 'link' | 'list' | 'table' | 'lineBreak' | 'heading';
 	content: string;
 	items?: string[];
+	headers?: string[]; // header cells; set on 'table' segments
+	rows?: string[][]; // body rows, each an array of cell strings; set on 'table' segments
 }

 export function parseMarkdown(text: string): ParsedSegment[] {
 	const segments: ParsedSegment[] = [];
 	
-	// Split by code blocks first (they can contain other markdown)
+	// Normalize line endings
+	text = text.replace(/\r\n/g, '\n').replace(/\r/g, '\n');
+	
+	// First, extract code blocks
 	const codeBlockRegex = /```[\s\S]*?```/g;
 	const parts = text.split(codeBlockRegex);
 	const codeBlocks = text.match(codeBlockRegex) || [];
@@ -22,9 +27,9 @@ export function parseMarkdown(text: string): ParsedSegment[] {
 	while (partIndex < parts.length) {
 		const part = parts[partIndex];
 		
-		if (part) {
-			// Process inline formatting
-			segments.push(...parseInlineMarkdown(part));
+		if (part.trim()) {
+			// Process non-code content
+			segments.push(...parseInlineContent(part));
 		}
 		
 		// Add code block if there's one after this part
@@ -39,11 +44,127 @@ export function parseMarkdown(text: string): ParsedSegment[] {
 	return segments;
 }

-function parseInlineMarkdown(text: string): ParsedSegment[] {
+/** Splits non-code text into 'table' segments and parseLines() output for the text around them. */
+function parseInlineContent(text: string): ParsedSegment[] {
 	const segments: ParsedSegment[] = [];
 	
-	// Combined regex for bold, italic, inline code, links
-	const inlineRegex = /(\*\*[^*]+\*\*|\*[^*]+\*|`[^`]+`|\\\[.*?\]\(.*?\))/g;
+	// A table is a header row, a separator row, then zero or more body rows
+	const tableRegex = /^\|.+\|\n\|[-:\s|]+\|\n((?:\|.+\|\n?)*)/gm;
+	// Offset of the first character not yet emitted. `text` is never sliced:
+	// exec() resumes from tableRegex.lastIndex, an offset into the string it
+	// was last run on, so truncating `text` mid-loop made it skip later tables.
+	let cursor = 0;
+	let tableMatch: RegExpExecArray | null;
+	while ((tableMatch = tableRegex.exec(text)) !== null) {
+		// Text between the previous table (or the start) and this one
+		const beforeTable = text.substring(cursor, tableMatch.index);
+		if (beforeTable.trim()) {
+			segments.push(...parseLines(beforeTable));
+		}
+		segments.push(...parseTable(tableMatch[0]));
+		cursor = tableMatch.index + tableMatch[0].length;
+	}
+	
+	// Whatever follows the last table (or the whole text if there was none)
+	const remaining = text.substring(cursor);
+	if (remaining.trim()) {
+		segments.push(...parseLines(remaining));
+	}
+	
+	return segments;
+}
+
+/**
+ * Converts one markdown table (header row, separator row, body rows) into a
+ * single 'table' segment. Returns [] when the second line is not a separator.
+ */
+function parseTable(tableStr: string): ParsedSegment[] {
+	const lines = tableStr.trim().split('\n').filter(line => line.trim());
+	// The separator is identified by position, and may carry alignment colons
+	// (|:---|:---:|); filtering every dash-only line would also drop body rows.
+	if (lines.length < 2 || !/^[|\s:-]+$/.test(lines[1])) return [];
+	
+	return [{
+		type: 'table',
+		content: '',
+		headers: parseTableRow(lines[0]),
+		// May be empty: a header-only table is still returned rather than discarded
+		rows: lines.slice(2).map(row => parseTableRow(row))
+	}];
+}
+
+function parseTableRow(row: string): string[] { // only the outer pipes are dropped; empty cells keep their column
+	return row.trim().replace(/^\|/, '').replace(/\|$/, '').split('|').map(cell => cell.trim());
+}
+
+/**
+ * Converts a run of text into segments, one source line at a time.
+ *
+ * - blank line         -> 'lineBreak'
+ * - `# ` .. `###### `  -> 'heading' with the marker stripped
+ * - `- `, `* `, `1. `  -> item added to the 'list' segment at the tail, or a new list
+ * - anything else      -> inline segments, then a 'lineBreak' unless it is the last line
+ *
+ * List items and headings are stored as raw strings; inline formatting inside
+ * them is not parsed.
+ *
+ * @param text - Text to convert; lines are split on '\n'.
+ * @returns Segments in source order.
+ */
+function parseLines(text: string): ParsedSegment[] {
+	const segments: ParsedSegment[] = [];
+	const lines = text.split('\n');
+	
+	// Adds an item to the list segment at the tail, starting a new list when
+	// the previous segment is anything else (bulleted and numbered items share
+	// the single 'list' type).
+	const addListItem = (item: string): void => {
+		const lastSeg = segments[segments.length - 1];
+		if (lastSeg && lastSeg.type === 'list') {
+			lastSeg.items?.push(item);
+		} else {
+			segments.push({ type: 'list', content: '', items: [item] });
+		}
+	};
+	
+	for (let i = 0; i < lines.length; i++) {
+		const line = lines[i];
+		
+		if (!line.trim()) {
+			// Empty line - add line break for paragraph separation
+			segments.push({ type: 'lineBreak', content: '' });
+			continue;
+		}
+		
+		// Check for headings
+		if (/^#{1,6}\s/.test(line)) {
+			segments.push({ type: 'heading', content: line.replace(/^#+\s/, '') });
+			continue;
+		}
+		
+		// Bulleted (`- ` / `* `) or numbered (`1. `) list item
+		const listMatch = line.match(/^(?:[-*]|\d+\.)\s(.*)/);
+		if (listMatch) {
+			addListItem(listMatch[1]);
+			continue;
+		}
+		
+		// Process inline formatting
+		segments.push(...parseInlineElements(line));
+		
+		// Separate consecutive lines; the final line gets no trailing break
+		if (i < lines.length - 1) {
+			segments.push({ type: 'lineBreak', content: '' });
+		}
+	}
+	
+	return segments;
+}
+
+function parseInlineElements(text: string): ParsedSegment[] {
+	const segments: ParsedSegment[] = [];
+	
+	const inlineRegex = /(\*\*[^*]+\*\*|\*[^*]+\*|`[^`]+`|\[.*?\]\(.*?\))/g;
 	const parts = text.split(inlineRegex);
 	
 	for (const part of parts) {
@@ -60,30 +181,7 @@ function parseInlineMarkdown(text: string): ParsedSegment[] {
 			if (linkMatch) {
 				segments.push({ type: 'link', content: linkMatch[1] });
 			}
-		} else if (part.includes('\n')) {
-			// Handle newlines and lists
-			const lines = part.split('\n');
-			for (let i = 0; i < lines.length; i++) {
-				const line = lines[i];
-				if (line.match(/^[\-\*]\s/)) {
-					// List item
-					if (segments.length > 0 && segments[segments.length - 1].type === 'list') {
-						segments[segments.length - 1].items?.push(line.slice(2));
-					} else {
-						segments.push({ type: 'list', content: '', items: [line.slice(2)] });
-					}
-				} else if (line.match(/^#{1,6}\s/)) {
-					// Heading
-					segments.push({ type: 'text', content: line });
-				} else if (line) {
-					if (i > 0) {
-						segments.push({ type: 'text', content: '\n' + line });
-					} else {
-						segments.push({ type: 'text', content: line });
-					}
-				}
-			}
-		} else {
+		} else if (part) {
 			segments.push({ type: 'text', content: part });
 		}
 	}