[mod] rename
This commit is contained in:
		
							parent
							
								
									3ba5b52227
								
							
						
					
					
						commit
						e1c74c9608
					
				
					 2 changed files with 41 additions and 58 deletions
				
			
		| 
						 | 
				
			
			@ -1,5 +1,6 @@
 | 
			
		|||
xquery version '3.1';
 | 
			
		||||
(:~ pdfbox 3.0 https://pdfbox.apache.org/ interface library, 
 | 
			
		||||
(:~ 
 | 
			
		||||
pdfbox 3.0 https://pdfbox.apache.org/ interface library, 
 | 
			
		||||
requires pdfbox jar on classpath
 | 
			
		||||
3.02 required tested with pdfbox-app-3.0.2-20240121.184204-66.jar
 | 
			
		||||
@see https://lists.apache.org/list?users@pdfbox.apache.org:lte=1M:loader
 | 
			
		||||
| 
						 | 
				
			
			@ -60,41 +61,8 @@ as xs:integer{
 | 
			
		|||
  PDDocument:getNumberOfPages($doc)
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
(:~ @TODO 
 | 
			
		||||
  PDOutlineItem current = bookmark.getFirstChild();
 | 
			
		||||
    while (current != null) {
 | 
			
		||||
        PDPage currentPage = current.findDestinationPage(document);
 | 
			
		||||
        Integer pageNumber = document.getDocumentCatalog().getPages().indexOf(currentPage) + 1;
 | 
			
		||||
        System.out.println(current.getTitle() + "-------->" + pageNumber);
 | 
			
		||||
        getOutlines(document, current, indentation);
 | 
			
		||||
        current = current.getNextSibling();
 | 
			
		||||
    }
 | 
			
		||||
:)
 | 
			
		||||
declare function pdfbox:siblings($acc as item()*,$outlineItem ,$doc as item())
 | 
			
		||||
as map(*)*{
 | 
			
		||||
   if(empty($outlineItem))
 | 
			
		||||
  then $acc
 | 
			
		||||
  else let $next:=  PDOutlineItem:getNextSibling($outlineItem)=>trace("next: ")
 | 
			
		||||
       return pdfbox:siblings($acc,pdfbox:bookmark($outlineItem ,$doc),
 | 
			
		||||
                      $next
 | 
			
		||||
                    )
 | 
			
		||||
  
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
(: return bookmark info for children of $outlineItem :)
 | 
			
		||||
declare function pdfbox:sibs($outlineItem,$doc )
 | 
			
		||||
as map(*)*
 | 
			
		||||
{
 | 
			
		||||
  hof:until(
 | 
			
		||||
    function($output) { empty($output?this) },
 | 
			
		||||
    function($input ) { map{
 | 
			
		||||
                       "list":($input?list,pdfbox:bookmark($input?this,$doc)),
 | 
			
		||||
                       "this":  PDOutlineItem:getNextSibling($input?this)}
 | 
			
		||||
                            },
 | 
			
		||||
    map{"list":(),"this":$outlineItem}
 | 
			
		||||
  )
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
(:~ outline for $doc as map()* :)
 | 
			
		||||
declare function pdfbox:outline($doc as item())
 | 
			
		||||
as map(*)*{
 | 
			
		||||
  (# db:wrapjava some #) {
 | 
			
		||||
| 
						 | 
				
			
			@ -103,29 +71,47 @@ as map(*)*{
 | 
			
		|||
                =>PDDocumentCatalog:getDocumentOutline()
 | 
			
		||||
                =>PDOutlineItem:getFirstChild()=>trace("cur")
 | 
			
		||||
 | 
			
		||||
 
 | 
			
		||||
  (: let $bk:=pdfbox:siblings((),$bookmark ,$doc) :)
 | 
			
		||||
let $bk:=pdfbox:sibs($bookmark ,$doc)?list
 | 
			
		||||
  (: let $bookmark := PDOutlineItem:getNextSibling($bookmark)
 | 
			
		||||
  let $bk := ($bk, pdfbox:bookmark($bookmark, $doc))
 | 
			
		||||
  let $bookmark := PDOutlineItem:getNextSibling($bookmark)
 | 
			
		||||
  let $bk := ($bk, pdfbox:bookmark($bookmark, $doc))
 | 
			
		||||
  let $bookmark := PDOutlineItem:getNextSibling($bookmark)
 | 
			
		||||
  let $bk := ($bk, pdfbox:bookmark($bookmark, $doc))
 | 
			
		||||
  let $bookmark := PDOutlineItem:getNextSibling($bookmark) 
 | 
			
		||||
  let $bk := ($bk, pdfbox:bookmark($bookmark, $doc))
 | 
			
		||||
let $bookmark := PDOutlineItem:getNextSibling($bookmark) => trace("EMP")
 | 
			
		||||
  let $bk := ($bk, if(exists($bookmark)) then pdfbox:bookmark($bookmark, $doc)) :)
 | 
			
		||||
  let $bk:=pdfbox:outline($bookmark ,$doc) 
 | 
			
		||||
  return  $bk
 | 
			
		||||
  }
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
(: return bookmark info for children of $outlineItem :)
 | 
			
		||||
declare function pdfbox:outline($outlineItem,$doc )
 | 
			
		||||
as map(*)*
 | 
			
		||||
{
 | 
			
		||||
  let $find:=hof:until(
 | 
			
		||||
            function($output) { empty($output?this) },
 | 
			
		||||
            function($input ) { 
 | 
			
		||||
                      let $bk:= pdfbox:bookmark($input?this,$doc)
 | 
			
		||||
                      let $bk:= if($bk?hasChildren)
 | 
			
		||||
                                then let $kids:=pdfbox:outline(PDOutlineItem:getFirstChild($input?this), $doc)
 | 
			
		||||
                                     return map:merge(($bk,map:entry("children",$kids)))
 | 
			
		||||
                                else $bk 
 | 
			
		||||
                      return map{
 | 
			
		||||
                            "list": ($input?list, $bk),
 | 
			
		||||
                            "this":  PDOutlineItem:getNextSibling($input?this)}
 | 
			
		||||
                          },
 | 
			
		||||
            map{"list":(),"this":$outlineItem}
 | 
			
		||||
        )
 | 
			
		||||
  return $find?list      
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
declare function pdfbox:outline-XML($outline as map(*)*)
 | 
			
		||||
as element(*){
 | 
			
		||||
 element outline { 
 | 
			
		||||
  for $bookmark in $outline
 | 
			
		||||
  return <bookmark title="{$bookmark?title}" index="{$bookmark?index}">
 | 
			
		||||
    {$bookmark?children!pdfbox:outline-XML(.)}
 | 
			
		||||
  </bookmark>
 | 
			
		||||
 }
 | 
			
		||||
};
 | 
			
		||||
 | 
			
		||||
(: return bookmark info for children of $outlineItem :)
 | 
			
		||||
declare function pdfbox:bookmark($bookmark as item(),$doc as item())
 | 
			
		||||
as map(*){
 | 
			
		||||
  let $currentPage := PDOutlineItem:findDestinationPage($bookmark,$doc)
 | 
			
		||||
  (: return hof:until(empty#1,pdfbox:outx(?,$doc),()) :)
 | 
			
		||||
  return map{ 
 | 
			
		||||
  "index":  pdfbox:pageIndex($currentPage,$doc),
 | 
			
		||||
 map{ 
 | 
			
		||||
  "index":  PDOutlineItem:findDestinationPage($bookmark,$doc)=>pdfbox:pageIndex($doc),
 | 
			
		||||
  "title": PDOutlineItem:getTitle($bookmark),
 | 
			
		||||
  "hasChildren": PDOutlineItem:hasChildren($bookmark)
 | 
			
		||||
  }
 | 
			
		||||
| 
						 | 
				
			
			@ -1,7 +1,7 @@
 | 
			
		|||
(: PDFBOX experiments
 | 
			
		||||
:)
 | 
			
		||||
 | 
			
		||||
import module namespace pdfbox="urn:expkg-zone58:pdfbox:3" at "../lib/pdfbox-lib.xqm";
 | 
			
		||||
import module namespace pdfbox="urn:expkg-zone58:pdfbox:3" at "../lib/pdfbox3.xqm";
 | 
			
		||||
 | 
			
		||||
 | 
			
		||||
declare variable $samples:= map{
 | 
			
		||||
| 
						 | 
				
			
			@ -15,11 +15,8 @@ declare variable $base:= "C:\Users\mrwhe\git\bloomsbury\content-architecture\xqu
 | 
			
		|||
(:~ resolve :)
 | 
			
		||||
declare variable $PDF:= $samples?climate=>file:resolve-path($base);
 | 
			
		||||
 | 
			
		||||
(: women pdfs :)
 | 
			
		||||
(: let $pdfdoc:="data\drop-01d\set\2-6-1\A6229C_1\outputs\9798216172628\2798216172625\pdfs\chunks-docbook.xml"
 | 
			
		||||
=>file:resolve-path(file:base-dir())
 | 
			
		||||
=>doc() :)
 | 
			
		||||
 | 
			
		||||
 | 
			
		||||
let $doc:=pdfbox:open($PDF)
 | 
			
		||||
return pdfbox:outline($doc)
 | 
			
		||||
return pdfbox:outline($doc)=>pdfbox:outline-XML()
 | 
			
		||||
(: return pdfbox:extract($doc,"c:\tmp\junk3.pdf",1,pdfbox:page-count($doc)) :)
 | 
			
		||||
		Loading…
	
	Add table
		
		Reference in a new issue