Load a document

Document .Net supports these formats:

PDF DOCX RTF HTML
Create/Read/Write Create/Read/Write Create/Read/Write Create/Read/Write

To load a document from a file, a single line is enough:

 
            //It's easy to load any document.
            DocumentCore dc = DocumentCore.Load(@"d:\Book.pdf");

DocumentCore is root class, it represents a document itself.

In this example, the method Load detects that a loadable document is PDF from the extension ".pdf".

You can also explicitly set the type of loadable document as second parameter. For example, PdfLoadOptions or DocxLoadOptions or another:


            DocumentCore dc = DocumentCore.Load(@"d:\Book.pdf", new PdfLoadOptions()
            {
                DetectTables=true,
                RasterizeVectorGraphics = false
            });

All load options are derived from the base abstract class LoadOptions.

After loading you get the full Tree Of Objects and can do anything you want: Find, Replace, Remove, Insert, Modify, Save to another format.

Document .Net provides you by the full tree of its objects after the loading document.
 

Load from a Stream is also straightforward:


            // Let us say we already have a DOCX document as array of bytes.        
            DocumentCore dc = null;
            using (MemoryStream docxStream = new MemoryStream(docxBytes))
            {
                dc = DocumentCore.Load(docxStream, new DocxLoadOptions());
            }
            // Here we can do with our document 'dc' anything we need.
 

Complete code

using System.IO;
using SautinSoft.Document;
using System;

namespace Example
{
    class Program
    {

        static void Main(string[] args)
        {
            LoadFromFile();
        }

        // From a file
        static void LoadFromFile()
        {
            string filePath = @"..\..\example.docx";
            // The file format is detected automatically from the file extension: ".docx".
            // But as shown in the example below, we can specify DocxLoadOptions as 2nd parameter
            // to explicitly set that a loadable document has Docx format.
            DocumentCore dc = DocumentCore.Load(filePath);
        }

        // From a Stream
        static void LoadFromStream()
        {

            // We've knowingly created an empty DocumentCore instance before "Using {}"
            // to continue work with it after stream will be closed.
            DocumentCore dc = null;
            using (FileStream fs = new FileStream(@"..\..\example.docx", FileMode.Open))
            {

                // Here we explicitly set that a loadable document is Docx.
                dc = DocumentCore.Load(fs, new DocxLoadOptions());
            }
        }

        // From an array of bytes
        static void LoadFromBytes()
        {

            // Get document bytes from a file.
            byte[] fileBytes = File.ReadAllBytes(@"..\..\example.pdf");

            DocumentCore dc = null;
            using (MemoryStream ms = new MemoryStream(fileBytes))
            {

                // With PdfLoadOptions we explicitly set that a loadable document is PDF.
                PdfLoadOptions pdfLO = new PdfLoadOptions()
                {

                    // Leave a vector graphics as is.
                    RasterizeVectorGraphics = false,

                    // Load only first 2 pages from document.
                    PageCount = 2
                };
                dc = DocumentCore.Load(ms, pdfLO);
            }
        }
    }
}

Download.

        
            Imports System.IO
Imports SautinSoft.Document

Module ExampleVB

    Sub Main()
        LoadFromFile()
    End Sub

    ' From a file
    Public Sub LoadFromFile()
        Dim filePath As String = "..\example.docx"

        ' The file format is detected automatically from the file extension: ".docx".
        ' But as shown in the example below, we can specify DocxLoadOptions as 2nd parameter
        ' to explicitly set that a loadable document has Docx format.
        Dim dc As DocumentCore = DocumentCore.Load(filePath)
    End Sub

    ' From a Stream
    Public Sub LoadFromStream()

        ' We've knowingly created an empty DocumentCore instance before "Using {}"
        ' to continue work with it after stream will be closed.
        Dim dc As DocumentCore = Nothing
        Using fs As New FileStream("..\example.docx", FileMode.Open)

            ' Here we explicitly set that a loadable document is Docx.
            dc = DocumentCore.Load(fs, New DocxLoadOptions())
        End Using
    End Sub

    ' From an array of bytes
    Public Sub LoadFromBytes()

        ' Get document bytes from a file.
        Dim fileBytes() As Byte = File.ReadAllBytes("..\example.pdf")

        Dim dc As DocumentCore = Nothing
        Using ms As New MemoryStream(fileBytes)

            ' With PdfLoadOptions we explicitly set that a loadable document is PDF.
            Dim pdfLO As New PdfLoadOptions() With {
                    .RasterizeVectorGraphics = False,
                    .PageCount = 2
                }
            dc = DocumentCore.Load(ms, pdfLO)
        End Using
    End Sub
End Module

Download.

© SautinSoft 2019