Convert HTML to Text string in C# and .NET


Complete code

using System;
using System.IO;
using SautinSoft;

namespace Sample
{
    /// <summary>
    /// Console sample: converts the HTML held in a string to a plain-text string
    /// with SautinSoft.HtmlToRtf, entirely in memory.
    /// </summary>
    class Test
    {
        static void Main(string[] args)
        {
            // Get your free 30-day key here:
            // https://sautinsoft.com/start-for-free/

            // Convert HTML string to Text string.
            // If you need more information about "HTML to RTF .Net"
            // Email us at: support@sautinsoft.com.
            ConvertHtmlToTextString();
        }

        /// <summary>
        /// Reads <c>..\..\..\Sample.html</c> into a string, converts it to a text string,
        /// saves the text to <c>Result.txt</c> and launches that file through the
        /// operating-system shell.
        /// </summary>
        /// <remarks>
        /// Both paths are relative, so they are resolved against the current working directory.
        /// A failed conversion is reported on the standard error stream instead of being
        /// silently ignored. Exceptions from the file read/write are not caught here.
        /// </remarks>
        public static void ConvertHtmlToTextString()
        {
            SautinSoft.HtmlToRtf h = new SautinSoft.HtmlToRtf();
            HtmlConvertOptions opt = new HtmlConvertOptions();
            opt.OutputFormat = HtmlToRtf.OutputFormat.TextUTF8WithBOM;

            string inputFile = @"..\..\..\Sample.html";
            string outputFile = "Result.txt";

            // Read our HTML file as a string.
            string htmlString = File.ReadAllText(inputFile);
            byte[] textBytes = null;

            // The converter works on bytes, so the HTML string is handed over as UTF-8.
            bool converted = h.Convert(System.Text.Encoding.UTF8.GetBytes(htmlString), out textBytes, opt);
            if (!converted || textBytes == null)
            {
                // Previously a failed conversion produced no output at all; tell the user.
                Console.Error.WriteLine("Failed to convert '" + inputFile + "' to text.");
                return;
            }

            // Encoding.UTF8.GetString does not remove a byte order mark: with the
            // TextUTF8WithBOM output format the decoded string would presumably start with an
            // invisible U+FEFF character. Strip it so the string holds only the text
            // (and so the emptiness check below is meaningful).
            string textString = System.Text.Encoding.UTF8.GetString(textBytes).TrimStart('\uFEFF');

            if (String.IsNullOrEmpty(textString))
            {
                return;
            }

            // Write the BOM explicitly so the saved file is still "UTF-8 with BOM".
            File.WriteAllText(outputFile, textString, new System.Text.UTF8Encoding(true));

            // Open the result for demonstration purposes.
            System.Diagnostics.Process.Start(new System.Diagnostics.ProcessStartInfo(outputFile) { UseShellExecute = true });
        }
    }
}

Download

Imports System
Imports System.IO
Imports SautinSoft

Namespace Sample
	''' <summary>
	''' Console sample: converts the HTML held in a string to a plain-text string
	''' with SautinSoft.HtmlToRtf, entirely in memory.
	''' </summary>
	Friend Class Test
		Shared Sub Main(ByVal args() As String)
			' Get your free 30-day key here:
			' https://sautinsoft.com/start-for-free/

			' Convert HTML string to Text string.
			' If you need more information about "HTML to RTF .Net"
			' Email us at: support@sautinsoft.com.
			ConvertHtmlToTextString()
		End Sub

		''' <summary>
		''' Reads ..\..\..\Sample.html into a string, converts it to a text string,
		''' saves the text to Result.txt and launches that file through the
		''' operating-system shell.
		''' </summary>
		''' <remarks>
		''' Both paths are relative, so they are resolved against the current working directory.
		''' A failed conversion is reported on the standard error stream instead of being
		''' silently ignored. Exceptions from the file read/write are not caught here.
		''' </remarks>
		Public Shared Sub ConvertHtmlToTextString()
			Dim h As New SautinSoft.HtmlToRtf()
			Dim opt As New HtmlConvertOptions()
			opt.OutputFormat = HtmlToRtf.OutputFormat.TextUTF8WithBOM

			Dim inputFile As String = "..\..\..\Sample.html"
			Dim outputFile As String = "Result.txt"

			' Read our HTML file as a string.
			Dim htmlString As String = File.ReadAllText(inputFile)
			Dim textBytes() As Byte = Nothing

			' The converter works on bytes, so the HTML string is handed over as UTF-8.
			Dim converted As Boolean = h.Convert(System.Text.Encoding.UTF8.GetBytes(htmlString), textBytes, opt)
			If Not converted OrElse textBytes Is Nothing Then
				' Previously a failed conversion produced no output at all; tell the user.
				Console.Error.WriteLine("Failed to convert '" & inputFile & "' to text.")
				Return
			End If

			' Encoding.UTF8.GetString does not remove a byte order mark: with the
			' TextUTF8WithBOM output format the decoded string would presumably start with an
			' invisible U+FEFF character. Strip it so the string holds only the text
			' (and so the emptiness check below is meaningful).
			Dim textString As String = System.Text.Encoding.UTF8.GetString(textBytes).TrimStart(ChrW(&HFEFF))

			If String.IsNullOrEmpty(textString) Then
				Return
			End If

			' Write the BOM explicitly so the saved file is still "UTF-8 with BOM".
			File.WriteAllText(outputFile, textString, New System.Text.UTF8Encoding(True))

			' Open the result for demonstration purposes.
			System.Diagnostics.Process.Start(New System.Diagnostics.ProcessStartInfo(outputFile) With {.UseShellExecute = True})
		End Sub
	End Class
End Namespace

Download


If you need a new code example or have a question, email us at support@sautinsoft.com, ask in the Online Chat (bottom-right corner of this page), or use the form below:



Questions and suggestions from you are always welcome!

We have been developing .NET components since 2002. We know the PDF, DOCX, RTF, HTML, XLSX and image formats. If you need any assistance with creating, modifying or converting documents in various formats, we can help you. We will write any code example for you absolutely free.