GuilhermeStracini/POC-dotnet-ExtractPdfContent

View on GitHub
Src/POCExtractPdfContent/Extractors/DocNetExtractor.cs

Summary

Maintainability
A
0 mins
Test Coverage
using Docnet.Core;
using Docnet.Core.Models;

namespace POCExtractPdfContent.Extractors;

/// <summary>
/// <see cref="IPdfExtractor"/> implementation that reads PDF text through the Docnet.Core library.
/// </summary>
public class DocNetExtractor : IPdfExtractor
{
    /// <summary>
    /// Extracts the text of the page at index 0 of the supplied document.
    /// </summary>
    /// <remarks>
    /// Only the page at index 0 is read; any further pages in the document are not visited.
    /// </remarks>
    /// <param name="data">The raw bytes of the document to read.</param>
    /// <returns>The text Docnet reports for the page at index 0.</returns>
    public string Extract(byte[] data)
    {
        using var docReader = DocLib.Instance.GetDocReader(data, new PageDimensions());

        // The page reader is disposable too. Declaring it with `using` after the document
        // reader guarantees it is released first (using declarations dispose in reverse order),
        // instead of being leaked on every call.
        using var pageReader = docReader.GetPageReader(0);

        return pageReader.GetText();
    }
}