Files
radzen-blazor/RadzenBlazorDemos.Tools/Program.cs
Vladimir Enchev 739ebde6a8 Llmtxt generation added (#2379)
* RadzenBlazorDemos.Tools added

* GenerateLlmsTxt Condition update to Release

* GenerateLlmsTxt updated again

* code fixed

* content generation cleaned

* razor/html tags removed from example descriptions and the code is now inside codeblock

* more fixes
2025-12-05 10:14:15 +02:00

690 lines
26 KiB
C#

using System.Text;
using System.Text.RegularExpressions;
namespace RadzenBlazorDemos.Tools;
class Program
{
static int Main(string[] args)
{
if (args.Length < 2)
{
Console.Error.WriteLine("Usage: GenerateLlmsTxt <outputPath> <pagesPath> [servicesPath] [modelsPath]");
return 1;
}
var outputPath = args[0];
var pagesPath = args[1];
var servicesPath = args.Length > 2 && !string.IsNullOrWhiteSpace(args[2]) ? args[2] : null;
var modelsPath = args.Length > 3 && !string.IsNullOrWhiteSpace(args[3]) ? args[3] : null;
if (!Directory.Exists(pagesPath))
{
Console.Error.WriteLine($"Pages path does not exist: {pagesPath}");
return 1;
}
try
{
Generate(outputPath, pagesPath, servicesPath, modelsPath);
Console.WriteLine($"Successfully generated llms.txt at: {outputPath}");
return 0;
}
catch (Exception ex)
{
Console.Error.WriteLine($"Error generating llms.txt: {ex.Message}");
Console.Error.WriteLine(ex.StackTrace);
return 1;
}
}
static void Generate(string outputPath, string pagesPath, string servicesPath, string modelsPath)
{
var sb = new StringBuilder();
sb.AppendLine("# Radzen Blazor Components - Demo Application");
sb.AppendLine();
sb.AppendLine("This file contains all demo pages and examples from the Radzen Blazor Components demo application.");
sb.AppendLine($"Generated: {DateTime.UtcNow:yyyy-MM-dd HH:mm:ss UTC}");
sb.AppendLine();
sb.AppendLine("## Table of Contents");
sb.AppendLine();
// Collect all demo files
var allPages = Directory.GetFiles(pagesPath, "*.razor", SearchOption.AllDirectories)
.Where(f => !Path.GetFileName(f).StartsWith("_"))
.ToList();
// Separate main pages (with @page directive) from example components
var mainPages = new List<string>();
var examplePages = new List<string>();
foreach (var page in allPages)
{
var content = File.ReadAllText(page, Encoding.UTF8);
// Check if it has @page directive - main pages have routes
if (Regex.IsMatch(content, @"^\s*@page\s+", RegexOptions.Multiline | RegexOptions.IgnoreCase))
{
mainPages.Add(page);
}
else
{
examplePages.Add(page);
}
}
// Sort main pages ascending by filename
mainPages = mainPages.OrderBy(p => Path.GetFileName(p)).ToList();
// Keep all pages for content generation (sorted ascending)
var pages = allPages.OrderBy(p => Path.GetFileName(p)).ToList();
var pageCs = Directory.GetFiles(pagesPath, "*.cs", SearchOption.AllDirectories)
.OrderBy(f => Path.GetFileName(f))
.ToList();
var services = !string.IsNullOrEmpty(servicesPath) && Directory.Exists(servicesPath)
? Directory.GetFiles(servicesPath, "*.cs", SearchOption.AllDirectories).OrderBy(f => Path.GetFileName(f)).ToList()
: Enumerable.Empty<string>();
var models = !string.IsNullOrEmpty(modelsPath) && Directory.Exists(modelsPath)
? Directory.GetFiles(modelsPath, "*.cs", SearchOption.AllDirectories).OrderBy(f => Path.GetFileName(f)).ToList()
: Enumerable.Empty<string>();
// Generate table of contents - only include main pages
sb.AppendLine("### Demo Pages");
foreach (var page in mainPages)
{
var relativePath = Path.GetRelativePath(pagesPath, page).Replace('\\', '/');
var fileName = Path.GetFileNameWithoutExtension(page);
sb.AppendLine($"- [{fileName}](#{SanitizeAnchor(fileName)}) - `{relativePath}`");
}
if (pageCs.Any())
{
sb.AppendLine();
sb.AppendLine("### Code-Behind Files");
foreach (var csFile in pageCs)
{
var fileName = Path.GetFileNameWithoutExtension(csFile);
sb.AppendLine($"- [{fileName}](#{SanitizeAnchor(fileName)}-code-behind)");
}
}
sb.AppendLine();
sb.AppendLine("---");
sb.AppendLine();
// Add demo pages
sb.AppendLine("## Demo Pages");
sb.AppendLine();
foreach (var page in pages)
{
var relativePath = Path.GetRelativePath(pagesPath, page).Replace('\\', '/');
var fileName = Path.GetFileNameWithoutExtension(page);
var fileContent = File.ReadAllText(page, Encoding.UTF8);
var extractedContent = ExtractDescriptionsAndExamples(fileContent, page);
if (string.IsNullOrWhiteSpace(extractedContent))
continue;
// Add explicit HTML anchor to ensure TOC links work across all markdown parsers
var anchor = SanitizeAnchor(fileName);
sb.AppendLine($"<a id=\"{anchor}\"></a>");
sb.AppendLine($"### {fileName}");
sb.AppendLine();
sb.AppendLine($"**Path:** `{relativePath}`");
sb.AppendLine();
sb.AppendLine(extractedContent);
sb.AppendLine();
sb.AppendLine("---");
sb.AppendLine();
}
// Add C# code-behind files
if (pageCs.Any())
{
sb.AppendLine("## Code-Behind Files");
sb.AppendLine();
foreach (var csFile in pageCs)
{
var relativePath = Path.GetRelativePath(pagesPath, csFile).Replace('\\', '/');
var fileName = Path.GetFileNameWithoutExtension(csFile);
var fileContent = File.ReadAllText(csFile, Encoding.UTF8);
var codeBehindAnchor = SanitizeAnchor($"{fileName}-code-behind");
sb.AppendLine($"<a id=\"{codeBehindAnchor}\"></a>");
sb.AppendLine($"### {fileName} (Code-Behind)");
sb.AppendLine();
sb.AppendLine($"**Path:** `{relativePath}`");
sb.AppendLine();
sb.AppendLine("```csharp");
sb.AppendLine(fileContent);
sb.AppendLine("```");
sb.AppendLine();
sb.AppendLine("---");
sb.AppendLine();
}
}
// Add services
if (services.Any())
{
sb.AppendLine("## Services");
sb.AppendLine();
foreach (var service in services)
{
var relativePath = Path.GetRelativePath(servicesPath, service).Replace('\\', '/');
var fileName = Path.GetFileNameWithoutExtension(service);
var fileContent = File.ReadAllText(service, Encoding.UTF8);
sb.AppendLine($"### {fileName}");
sb.AppendLine();
sb.AppendLine($"**Path:** `{relativePath}`");
sb.AppendLine();
sb.AppendLine("```csharp");
sb.AppendLine(fileContent);
sb.AppendLine("```");
sb.AppendLine();
sb.AppendLine("---");
sb.AppendLine();
}
}
// Add models
if (models.Any())
{
sb.AppendLine("## Data Models");
sb.AppendLine();
foreach (var model in models)
{
var relativePath = Path.GetRelativePath(modelsPath, model).Replace('\\', '/');
var fileName = Path.GetFileNameWithoutExtension(model);
var fileContent = File.ReadAllText(model, Encoding.UTF8);
sb.AppendLine($"### {fileName}");
sb.AppendLine();
sb.AppendLine($"**Path:** `{relativePath}`");
sb.AppendLine();
sb.AppendLine("```csharp");
sb.AppendLine(fileContent);
sb.AppendLine("```");
sb.AppendLine();
sb.AppendLine("---");
sb.AppendLine();
}
}
// Write to file
var outputDir = Path.GetDirectoryName(outputPath);
if (!string.IsNullOrEmpty(outputDir))
{
Directory.CreateDirectory(outputDir);
}
File.WriteAllText(outputPath, sb.ToString(), Encoding.UTF8);
}
static string SanitizeAnchor(string text)
{
if (string.IsNullOrWhiteSpace(text))
return "";
// Markdown heading anchors are generated by:
// 1. Convert to lowercase
// 2. Replace spaces and special chars with hyphens
// 3. Remove multiple consecutive hyphens
// 4. Trim hyphens from start/end
var anchor = text.ToLower()
.Replace(" ", "-")
.Replace("_", "-")
.Replace(".", "-")
.Replace("(", "")
.Replace(")", "")
.Replace("[", "")
.Replace("]", "")
.Replace("{", "")
.Replace("}", "")
.Replace("&", "")
.Replace(":", "")
.Replace(";", "")
.Replace("!", "")
.Replace("?", "")
.Replace("*", "")
.Replace("/", "-")
.Replace("\\", "-")
.Replace("+", "-")
.Replace("=", "-")
.Replace("@", "")
.Replace("#", "")
.Replace("%", "")
.Replace("$", "")
.Replace("^", "")
.Replace("~", "")
.Replace("`", "")
.Replace("'", "")
.Replace("\"", "");
// Remove multiple consecutive hyphens
anchor = Regex.Replace(anchor, @"-+", "-");
// Trim hyphens from start and end
anchor = anchor.Trim('-');
return anchor;
}
static string ExtractDescriptionsAndExamples(string razorContent, string pagePath)
{
var result = new StringBuilder();
var pagesDirectory = Path.GetDirectoryName(pagePath) ?? "";
// Remove @code blocks entirely
razorContent = Regex.Replace(razorContent,
@"@code\s*\{[^{}]*(?:\{[^{}]*\}[^{}]*)*\}",
"",
RegexOptions.Singleline | RegexOptions.IgnoreCase);
// Remove @page, @inject, @layout directives
razorContent = Regex.Replace(razorContent,
@"@(page|inject|layout|using|namespace|implements)[^\r\n]*",
"",
RegexOptions.IgnoreCase | RegexOptions.Multiline);
// Split content into lines to process sequentially
var lines = razorContent.Split(new[] { "\r\n", "\r", "\n" }, StringSplitOptions.None);
for (int i = 0; i < lines.Length; i++)
{
var line = lines[i];
// Check for RadzenText
if (line.Contains("<RadzenText"))
{
var textContent = ExtractRadzenTextContent(lines, ref i);
if (!string.IsNullOrWhiteSpace(textContent.Content))
{
// Format as heading if it's a heading style
if (textContent.IsHeading)
{
result.AppendLine();
result.AppendLine(textContent.Content);
result.AppendLine();
}
else
{
result.AppendLine(textContent.Content);
}
}
}
// Check for RadzenExample
else if (line.Contains("<RadzenExample"))
{
var exampleContent = ExtractRadzenExampleContent(lines, ref i, pagesDirectory);
if (!string.IsNullOrWhiteSpace(exampleContent))
{
result.AppendLine();
result.AppendLine("Example:");
result.AppendLine("```razor");
result.AppendLine(exampleContent);
result.AppendLine("```");
result.AppendLine();
}
}
}
return result.ToString().Trim();
}
static (string Content, bool IsHeading) ExtractRadzenTextContent(string[] lines, ref int index)
{
var fullTag = new StringBuilder();
var inTag = false;
var depth = 0;
// Collect the complete RadzenText tag (may span multiple lines)
for (int i = index; i < lines.Length; i++)
{
var line = lines[i];
fullTag.AppendLine(line);
// Count opening and closing tags
var openMatches = Regex.Matches(line, @"<RadzenText", RegexOptions.IgnoreCase);
var closeMatches = Regex.Matches(line, @"</RadzenText>", RegexOptions.IgnoreCase);
depth += openMatches.Count - closeMatches.Count;
if (closeMatches.Count > 0 && depth == 0)
{
index = i;
break;
}
}
var tagContent = fullTag.ToString();
// Extract attributes - check both TextStyle and TagName for heading detection
var textStyleMatch = Regex.Match(tagContent, @"TextStyle=""TextStyle\.(H[2-6])""", RegexOptions.IgnoreCase);
var tagNameMatch = Regex.Match(tagContent, @"TagName=""TagName\.(H[1-6])""", RegexOptions.IgnoreCase);
bool isHeading = false;
int headingLevel = 0;
// Prefer TextStyle for heading level, but also check TagName
if (textStyleMatch.Success)
{
var hMatch = Regex.Match(textStyleMatch.Groups[1].Value, @"H(\d)");
if (hMatch.Success)
{
headingLevel = int.Parse(hMatch.Groups[1].Value);
isHeading = headingLevel >= 2 && headingLevel <= 6;
}
}
// If no TextStyle heading but TagName suggests heading, use that
if (!isHeading && tagNameMatch.Success)
{
var hMatch = Regex.Match(tagNameMatch.Groups[1].Value, @"H(\d)");
if (hMatch.Success)
{
var tagLevel = int.Parse(hMatch.Groups[1].Value);
if (tagLevel >= 2 && tagLevel <= 6)
{
headingLevel = tagLevel;
isHeading = true;
}
}
}
// Extract inner content
var contentMatch = Regex.Match(tagContent, @"<RadzenText[^>]*>([\s\S]*?)</RadzenText>", RegexOptions.IgnoreCase);
if (!contentMatch.Success)
return (string.Empty, false);
var content = contentMatch.Groups[1].Value.Trim();
// Convert <code> tags to markdown inline code BEFORE converting links
content = ConvertCodeTagsToMarkdown(content);
// Convert RadzenLink to markdown links BEFORE removing HTML tags
content = ConvertRadzenLinksToMarkdown(content);
// Remove all HTML tags (except markdown links which are already converted)
content = Regex.Replace(content, @"<[^>]+>", "");
// Remove @ expressions
content = Regex.Replace(content, @"@[A-Za-z0-9_.()]+", "");
// Clean up whitespace
content = Regex.Replace(content, @"\s+", " ").Trim();
// Format as heading if needed
if (isHeading && !string.IsNullOrWhiteSpace(content))
{
// Map heading levels: H2 -> ####, H4 -> ####, H5 -> #####, H6 -> ######
int markdownLevel = 4; // Default to ####
if (headingLevel == 4) markdownLevel = 4; // H4 -> ####
else if (headingLevel == 5) markdownLevel = 5; // H5 -> #####
else if (headingLevel == 6) markdownLevel = 6; // H6 -> ######
else if (headingLevel == 2) markdownLevel = 4; // H2 -> ####
content = new string('#', markdownLevel) + " " + content;
}
return (content, isHeading);
}
static string ConvertCodeTagsToMarkdown(string content)
{
// Match <code>...</code> tags
var codeMatches = Regex.Matches(content,
@"<code>([\s\S]*?)</code>",
RegexOptions.IgnoreCase);
// Process in reverse to maintain indices
var matchesArray = new Match[codeMatches.Count];
for (int i = 0; i < codeMatches.Count; i++)
{
matchesArray[i] = codeMatches[i];
}
for (int i = matchesArray.Length - 1; i >= 0; i--)
{
var match = matchesArray[i];
var codeContent = match.Groups[1].Value.Trim();
// Remove nested HTML tags from code content
codeContent = Regex.Replace(codeContent, @"<[^>]+>", "");
// Clean up @("@bind-Selected") to @bind-Selected (remove extra quotes and parentheses)
// Match: @("...") pattern and extract the content inside quotes
// Pattern: @("@bind-Selected") -> @bind-Selected
// Use non-verbatim string to avoid quote escaping issues
codeContent = Regex.Replace(codeContent, "@\\(\"([^\"]+)\"\\)", "$1");
codeContent = Regex.Replace(codeContent, "@\\('([^']+)'\\)", "$1");
if (!string.IsNullOrWhiteSpace(codeContent))
{
var markdownCode = $"`{codeContent}`";
content = content.Substring(0, match.Index) + markdownCode +
content.Substring(match.Index + match.Length);
}
}
return content;
}
static string ConvertRadzenLinksToMarkdown(string content)
{
// Handle both self-closing and opening/closing RadzenLink tags
// Match the entire tag first, then extract attributes
// Pattern for self-closing: <RadzenLink ... />
var selfClosingPattern = @"<RadzenLink([^>]*?)\s*/>";
// Pattern for opening/closing: <RadzenLink ...>...</RadzenLink>
var openClosePattern = @"<RadzenLink([^>]*?)>([\s\S]*?)</RadzenLink>";
// Process self-closing tags
var selfClosingMatches = Regex.Matches(content, selfClosingPattern, RegexOptions.IgnoreCase);
var selfClosingArray = new Match[selfClosingMatches.Count];
for (int i = 0; i < selfClosingMatches.Count; i++)
{
selfClosingArray[i] = selfClosingMatches[i];
}
for (int i = selfClosingArray.Length - 1; i >= 0; i--)
{
var match = selfClosingArray[i];
var attributes = match.Groups[1].Value;
var (path, text) = ExtractLinkAttributes(attributes, "");
if (!string.IsNullOrWhiteSpace(path))
{
string linkText = !string.IsNullOrWhiteSpace(text) ? text : path;
var markdownLink = $"[{linkText}]({path})";
content = content.Substring(0, match.Index) + markdownLink +
content.Substring(match.Index + match.Length);
}
}
// Process opening/closing tags
var linkMatches = Regex.Matches(content, openClosePattern, RegexOptions.IgnoreCase);
var matchesArray = new Match[linkMatches.Count];
for (int i = 0; i < linkMatches.Count; i++)
{
matchesArray[i] = linkMatches[i];
}
for (int i = matchesArray.Length - 1; i >= 0; i--)
{
var match = matchesArray[i];
var attributes = match.Groups[1].Value;
var innerContent = match.Groups[2].Value.Trim();
var (path, text) = ExtractLinkAttributes(attributes, innerContent);
if (!string.IsNullOrWhiteSpace(path))
{
string linkText = !string.IsNullOrWhiteSpace(text) ? text :
(!string.IsNullOrWhiteSpace(innerContent) ? Regex.Replace(innerContent, @"<[^>]+>", "").Trim() : path);
if (string.IsNullOrWhiteSpace(linkText))
linkText = path;
var markdownLink = $"[{linkText}]({path})";
content = content.Substring(0, match.Index) + markdownLink +
content.Substring(match.Index + match.Length);
}
}
return content;
}
static (string Path, string Text) ExtractLinkAttributes(string attributes, string innerContent)
{
string path = "";
string text = "";
// Extract Path attribute (can be in any order)
var pathMatch = Regex.Match(attributes, @"Path=[""]?([^""\s>]+)[""]?", RegexOptions.IgnoreCase);
if (pathMatch.Success)
{
path = pathMatch.Groups[1].Value;
}
// Extract Text attribute
var textMatch = Regex.Match(attributes, @"Text=[""]?([^""]+)[""]?", RegexOptions.IgnoreCase);
if (textMatch.Success)
{
text = textMatch.Groups[1].Value.Trim();
}
// If no Text attribute and there's inner content, use that
if (string.IsNullOrWhiteSpace(text) && !string.IsNullOrWhiteSpace(innerContent))
{
text = Regex.Replace(innerContent, @"<[^>]+>", "").Trim();
}
return (path, text);
}
static string ExtractRadzenExampleContent(string[] lines, ref int index, string pagesDirectory)
{
var fullTag = new StringBuilder();
var depth = 0;
// Collect the complete RadzenExample tag
for (int i = index; i < lines.Length; i++)
{
var line = lines[i];
fullTag.AppendLine(line);
var openMatches = Regex.Matches(line, @"<RadzenExample", RegexOptions.IgnoreCase);
var closeMatches = Regex.Matches(line, @"</RadzenExample>", RegexOptions.IgnoreCase);
depth += openMatches.Count - closeMatches.Count;
if (closeMatches.Count > 0 && depth == 0)
{
index = i;
break;
}
}
var tagContent = fullTag.ToString();
// Extract Example attribute
var exampleMatch = Regex.Match(tagContent, @"Example=[""]?([^""\s>]+)[""]?", RegexOptions.IgnoreCase);
if (exampleMatch.Success)
{
var exampleName = exampleMatch.Groups[1].Value.Trim();
var exampleFilePath = Path.Combine(pagesDirectory, $"{exampleName}.razor");
if (File.Exists(exampleFilePath))
{
var exampleContent = File.ReadAllText(exampleFilePath, Encoding.UTF8);
return CleanExampleFile(exampleContent);
}
}
// Fallback: extract inline content
var inlineMatch = Regex.Match(tagContent, @"<RadzenExample[^>]*>([\s\S]*?)</RadzenExample>", RegexOptions.IgnoreCase);
if (inlineMatch.Success)
{
return CleanExampleContent(inlineMatch.Groups[1].Value);
}
return string.Empty;
}
static string CleanTextContent(string content)
{
if (string.IsNullOrWhiteSpace(content))
return string.Empty;
var result = content;
// Remove all HTML tags (including <strong>, <code>, <Radzen*>, etc.)
result = Regex.Replace(result, @"<[^>]+>", "");
// Remove @ expressions (like @variable, @ExampleService)
result = Regex.Replace(result, @"@[A-Za-z0-9_.()]+", "");
// Clean up multiple spaces but preserve single newlines for readability
result = Regex.Replace(result, @"[ \t]+", " ");
// Clean up multiple newlines (max 2 consecutive)
result = Regex.Replace(result, @"(\r?\n){3,}", Environment.NewLine + Environment.NewLine);
return result.Trim();
}
static string CleanExampleContent(string content)
{
if (string.IsNullOrWhiteSpace(content))
return string.Empty;
var result = content;
// Remove nested RadzenExample tags if any
result = Regex.Replace(result,
@"<RadzenExample[^>]*>[\s\S]*?</RadzenExample>",
"",
RegexOptions.IgnoreCase);
// Trim each line and remove empty lines
var lines = result.Split(new[] { "\r\n", "\r", "\n" }, StringSplitOptions.None)
.Select(l => l.Trim())
.Where(l => !string.IsNullOrWhiteSpace(l))
.ToList();
return string.Join(Environment.NewLine, lines);
}
static string CleanExampleFile(string content)
{
if (string.IsNullOrWhiteSpace(content))
return string.Empty;
var result = content;
// Remove @code blocks
result = Regex.Replace(result,
@"@code\s*\{[^{}]*(?:\{[^{}]*\}[^{}]*)*\}",
"",
RegexOptions.Singleline | RegexOptions.IgnoreCase);
// Remove @using, @inject, @page directives
result = Regex.Replace(result,
@"@(using|inject|page|layout|namespace|implements)[^\r\n]*",
"",
RegexOptions.IgnoreCase | RegexOptions.Multiline);
// Clean up multiple blank lines
result = Regex.Replace(result, @"(\r?\n\s*){3,}", Environment.NewLine + Environment.NewLine);
return result.Trim();
}
}