Class PdfToHtmlConverter
java.lang.Object
com.flowable.platform.pdf.converter.PdfToHtmlConverter
Experimental
Converts a PDF to an HTML file.
-
Field Summary
Fields
Modifier and Type | Field | Description
protected PdfToHtmlConverterConfig configuration
protected Set<com.aspose.pdf.MarkupSection> headers
protected Set<com.aspose.pdf.MarkupSection> pageNumbers
protected Set<com.aspose.pdf.MarkupSection> [field name missing from this extract]
protected com.aspose.pdf.ParagraphAbsorber paragraphAbsorber
protected com.aspose.pdf.Document pdfDocument -
Constructor Summary
Constructors -
Method Summary
Modifier and Type | Method | Description
protected com.aspose.pdf.Document cleanupContent(SortedSet<com.flowable.platform.pdf.converter.PdfToHtmlConverter.ConverterFilter> filters)
protected com.aspose.pdf.HtmlSaveOptions configureHtmlSaveOptions()
InputStream convert(InputStream pdfInputStream, SortedSet<com.flowable.platform.pdf.converter.PdfToHtmlConverter.ConverterFilter> filters)
findBottomMargin(List<com.aspose.pdf.MarkupSection> pageSections, Set<com.aspose.pdf.MarkupSection> footersOnThePage)
protected Set<com.aspose.pdf.MarkupSection> findDocumentNameOnTopCorner(com.aspose.pdf.PageMarkup pageMarkup)
protected Set<com.aspose.pdf.MarkupSection> findFootersByPosition(com.aspose.pdf.MarkupSection markupSection)
protected Set<com.aspose.pdf.MarkupSection> findFootersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup)
protected Set<com.aspose.pdf.MarkupSection> findHeadersByPosition(com.aspose.pdf.MarkupSection markupSection)
protected Set<com.aspose.pdf.MarkupSection> findHeadersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup)
protected Set<com.aspose.pdf.MarkupSection> findPageNumbersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup)
findTopMargin(List<com.aspose.pdf.MarkupSection> pageSections, Set<com.aspose.pdf.MarkupSection> headersOnThePage)
protected String getFragmentText(com.aspose.pdf.TextFragment textFragment)
getPageIndex(com.aspose.pdf.MarkupSection markupSection)
getPageIndex(List<com.aspose.pdf.TextFragment> textFragments)
protected String getSectionText(com.aspose.pdf.MarkupSection section)
protected boolean matchesFooterRegexp(com.aspose.pdf.MarkupSection markupSection)
protected boolean matchesHeaderRegexp(com.aspose.pdf.MarkupSection markupSection)
protected boolean matchesPageNumberRegexp(com.aspose.pdf.MarkupSection markupSection)
protected Predicate<com.aspose.pdf.MarkupSection> matchingSectionsByPosition(com.aspose.pdf.MarkupSection markupSection)
protected void removeBottomMargin()
protected void removeEmptyAndTransparentSections()
protected void removeEmptyPages()
protected void removeHeaders()
protected void removePageNumbers()
protected void removePagesWithSingleRotatedSection()
protected void [method name missing from this extract]
protected void removeSections(Collection<com.aspose.pdf.MarkupSection> sectionsToRemove)
protected void removeTextFragment(com.aspose.pdf.TextFragment fragmentToRemove)
protected void removeTextFragmentsContainingPageNumber(com.aspose.pdf.MarkupSection markupSection)
protected void removeTopMargin()
protected void setPageSize(com.aspose.pdf.Page page, com.aspose.pdf.Rectangle rectangle)
-
Field Details
-
configuration
-
pdfDocument
protected com.aspose.pdf.Document pdfDocument -
paragraphAbsorber
protected com.aspose.pdf.ParagraphAbsorber paragraphAbsorber -
headers
-
pageNumbers
-
-
Constructor Details
-
PdfToHtmlConverter
-
-
Method Details
-
convert
public InputStream convert(InputStream pdfInputStream, SortedSet<com.flowable.platform.pdf.converter.PdfToHtmlConverter.ConverterFilter> filters) throws IOException - Throws:
IOException
-
cleanupContent
protected com.aspose.pdf.Document cleanupContent(SortedSet<com.flowable.platform.pdf.converter.PdfToHtmlConverter.ConverterFilter> filters) throws IOException - Throws:
IOException
-
configureHtmlSaveOptions
protected com.aspose.pdf.HtmlSaveOptions configureHtmlSaveOptions() -
removeEmptyAndTransparentSections
protected void removeEmptyAndTransparentSections() -
removePagesWithSingleRotatedSection
protected void removePagesWithSingleRotatedSection() -
removeHeaders
protected void removeHeaders() -
removePageNumbers
protected void removePageNumbers() -
removeEmptyPages
protected void removeEmptyPages() -
removeTopMargin
protected void removeTopMargin() -
removeBottomMargin
protected void removeBottomMargin() -
findHeadersOnSinglePage
protected Set<com.aspose.pdf.MarkupSection> findHeadersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup) -
findPageNumbersOnSinglePage
protected Set<com.aspose.pdf.MarkupSection> findPageNumbersOnSinglePage(com.aspose.pdf.PageMarkup pageMarkup) -
findTopMargin
-
findBottomMargin
-
findHeadersByPosition
protected Set<com.aspose.pdf.MarkupSection> findHeadersByPosition(com.aspose.pdf.MarkupSection markupSection) -
matchesHeaderRegexp
protected boolean matchesHeaderRegexp(com.aspose.pdf.MarkupSection markupSection) -
matchesPageNumberRegexp
protected boolean matchesPageNumberRegexp(com.aspose.pdf.MarkupSection markupSection) -
findDocumentNameOnTopCorner
protected Set<com.aspose.pdf.MarkupSection> findDocumentNameOnTopCorner(com.aspose.pdf.PageMarkup pageMarkup) -
matchingSectionsByPosition
protected Predicate<com.aspose.pdf.MarkupSection> matchingSectionsByPosition(com.aspose.pdf.MarkupSection markupSection) -
removeTextFragmentsContainingPageNumber
protected void removeTextFragmentsContainingPageNumber(com.aspose.pdf.MarkupSection markupSection) -
setPageSize
protected void setPageSize(com.aspose.pdf.Page page, com.aspose.pdf.Rectangle rectangle) -
getFragmentText
protected String getFragmentText(com.aspose.pdf.TextFragment textFragment) -
getSectionText
protected String getSectionText(com.aspose.pdf.MarkupSection section) -
removeSections
protected void removeSections(Collection<com.aspose.pdf.MarkupSection> sectionsToRemove) -
removeTextFragment
protected void removeTextFragment(com.aspose.pdf.TextFragment fragmentToRemove) -
getPageIndex
-
getPageIndex
-