Class PdfToHtmlConverter
java.lang.Object
com.flowable.platform.pdf.converter.PdfToHtmlConverter
Experimental
Converts a PDF to an HTML file.
-
Field Summary
Modifier and Type | Field | Description
protected PdfToHtmlConverterConfig configuration
protected Set<com.aspose.pdf.MarkupSection> headers
protected Set<com.aspose.pdf.MarkupSection> pageNumbers
protected Set<com.aspose.pdf.MarkupSection> (field name missing from this extract)
protected com.aspose.pdf.ParagraphAbsorber paragraphAbsorber
protected com.aspose.pdf.Document pdfDocument
-
Constructor Summary
-
Method Summary
Modifier and Type | Method | Description
protected com.aspose.pdf.Document cleanupContent(SortedSet<com.flowable.platform.pdf.converter.PdfToHtmlConverter.ConverterFilter> filters)
protected com.aspose.pdf.HtmlSaveOptions configureHtmlSaveOptions()
InputStream convert(InputStream pdfInputStream, SortedSet<com.flowable.platform.pdf.converter.PdfToHtmlConverter.ConverterFilter> filters)
findBottomMargin(List<com.aspose.pdf.MarkupSection> pageSections, Set<com.aspose.pdf.MarkupSection> footersOnThePage)
protected Set<com.aspose.pdf.MarkupSection> findDocumentNameOnTopCorner(com.aspose.pdf.PageMarkup pageMarkup)
protected Set<com.aspose.pdf.MarkupSection> findFootersByPosition(com.aspose.pdf.MarkupSection markupSection)
protected Set<com.aspose.pdf.MarkupSection> findFootersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup)
protected Set<com.aspose.pdf.MarkupSection> findHeadersByPosition(com.aspose.pdf.MarkupSection markupSection)
protected Set<com.aspose.pdf.MarkupSection> findHeadersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup)
protected Set<com.aspose.pdf.MarkupSection> findPageNumbersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup)
findTopMargin(List<com.aspose.pdf.MarkupSection> pageSections, Set<com.aspose.pdf.MarkupSection> headersOnThePage)
protected String getFragmentText(com.aspose.pdf.TextFragment textFragment)
getPageIndex(com.aspose.pdf.MarkupSection markupSection)
getPageIndex(List<com.aspose.pdf.TextFragment> textFragments)
protected String getSectionText(com.aspose.pdf.MarkupSection section)
protected boolean matchesFooterRegexp(com.aspose.pdf.MarkupSection markupSection)
protected boolean matchesHeaderRegexp(com.aspose.pdf.MarkupSection markupSection)
protected boolean matchesPageNumberRegexp(com.aspose.pdf.MarkupSection markupSection)
protected Predicate<com.aspose.pdf.MarkupSection> matchingSectionsByPosition(com.aspose.pdf.MarkupSection markupSection)
protected void removeBottomMargin()
protected void removeEmptyAndTransparentSections()
protected void removeEmptyPages()
protected void removeHeaders()
protected void removePageNumbers()
protected void removePagesWithSingleRotatedSection()
protected void (one further no-argument method; its name is missing from this extract)
protected void removeSections(Collection<com.aspose.pdf.MarkupSection> sectionsToRemove)
protected void removeTextFragment(com.aspose.pdf.TextFragment fragmentToRemove)
protected void removeTextFragmentsContainingPageNumber(com.aspose.pdf.MarkupSection markupSection)
protected void removeTopMargin()
protected void setPageSize(com.aspose.pdf.Page page, com.aspose.pdf.Rectangle rectangle)
-
Field Details
-
configuration
-
pdfDocument
protected com.aspose.pdf.Document pdfDocument -
paragraphAbsorber
protected com.aspose.pdf.ParagraphAbsorber paragraphAbsorber -
headers
-
pageNumbers
-
-
Constructor Details
-
PdfToHtmlConverter
-
-
Method Details
-
convert
public InputStream convert(InputStream pdfInputStream, SortedSet<com.flowable.platform.pdf.converter.PdfToHtmlConverter.ConverterFilter> filters) throws IOException
Throws:
IOException
-
cleanupContent
protected com.aspose.pdf.Document cleanupContent(SortedSet<com.flowable.platform.pdf.converter.PdfToHtmlConverter.ConverterFilter> filters) throws IOException
Throws:
IOException
-
configureHtmlSaveOptions
protected com.aspose.pdf.HtmlSaveOptions configureHtmlSaveOptions() -
removeEmptyAndTransparentSections
protected void removeEmptyAndTransparentSections() -
removePagesWithSingleRotatedSection
protected void removePagesWithSingleRotatedSection() -
removeHeaders
protected void removeHeaders() -
removePageNumbers
protected void removePageNumbers() -
removeEmptyPages
protected void removeEmptyPages() -
removeTopMargin
protected void removeTopMargin() -
removeBottomMargin
protected void removeBottomMargin() -
findHeadersOnSinglePage
protected Set<com.aspose.pdf.MarkupSection> findHeadersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup) -
findPageNumbersOnSinglePage
protected Set<com.aspose.pdf.MarkupSection> findPageNumbersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup) -
findTopMargin
-
findBottomMargin
-
findHeadersByPosition
protected Set<com.aspose.pdf.MarkupSection> findHeadersByPosition(com.aspose.pdf.MarkupSection markupSection) -
matchesHeaderRegexp
protected boolean matchesHeaderRegexp(com.aspose.pdf.MarkupSection markupSection) -
matchesPageNumberRegexp
protected boolean matchesPageNumberRegexp(com.aspose.pdf.MarkupSection markupSection) -
findDocumentNameOnTopCorner
protected Set<com.aspose.pdf.MarkupSection> findDocumentNameOnTopCorner(com.aspose.pdf.PageMarkup pageMarkup) -
matchingSectionsByPosition
protected Predicate<com.aspose.pdf.MarkupSection> matchingSectionsByPosition(com.aspose.pdf.MarkupSection markupSection) -
removeTextFragmentsContainingPageNumber
protected void removeTextFragmentsContainingPageNumber(com.aspose.pdf.MarkupSection markupSection) -
setPageSize
protected void setPageSize(com.aspose.pdf.Page page, com.aspose.pdf.Rectangle rectangle) -
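getFragmentText
protected String getFragmentText(com.aspose.pdf.TextFragment textFragment) -
getSectionText
protected String getSectionText(com.aspose.pdf.MarkupSection section) -
removeSections
protected void removeSections(Collection<com.aspose.pdf.MarkupSection> sectionsToRemove) -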
removeTextFragment
protected void removeTextFragment(com.aspose.pdf.TextFragment fragmentToRemove) -
getPageIndex
-
getPageIndex
-