Difference between revisions of "Cognitive PDF/A"

From OpenKM Documentation
Jump to: navigation, search
m
 
(2 intermediate revisions by 2 users not shown)
Line 3: Line 3:
 
Description:
 
Description:
 
* Input server folder where images are stored '''systemFolder = "c:\\samples"'''
 
* Input server folder where images are stored '''systemFolder = "c:\\samples"'''
* Compressimo server path '''cognitiveCompressimo'''
+
* Cognitive PDF/A server path '''cognitivePdfa'''
 
* OpenKM path where compressimo files are imported '''String path = "/okm:root/imported" + "/" + uploadFile.getName()'''
 
* OpenKM path where compressimo files are imported '''String path = "/okm:root/imported" + "/" + uploadFile.getName()'''
  
Line 17: Line 17:
 
String token = DbSessionManager.getInstance().getSystemToken();
 
String token = DbSessionManager.getInstance().getSystemToken();
 
String systemFolder = "c:\\samples";
 
String systemFolder = "c:\\samples";
String cognitiveCompressimo = "C:\\Users\\jllort\\Desktop\\cpdfa-1.4.4-dev-win32-1month\\cpdfa\\bin\\cpdfacli.exe splitdummy eng ";
+
String cognitivePdfa = "C:\\Users\\jllort\\Desktop\\cpdfa-1.4.4-dev-win32-1month\\cpdfa\\bin\\cpdfacli.exe splitdummy eng ";
 
Logger log = LoggerFactory.getLogger("com.openkm.compressimo");
 
Logger log = LoggerFactory.getLogger("com.openkm.compressimo");
  
Line 27: Line 27:
 
for (int i=0; i<listOfFiles.length; i++) {
 
for (int i=0; i<listOfFiles.length; i++) {
 
     File file = listOfFiles[i];
 
     File file = listOfFiles[i];
 +
 
     if (file.isFile() && file.getName().toLowerCase().endsWith(".tif")) {
 
     if (file.isFile() && file.getName().toLowerCase().endsWith(".tif")) {
       
 
 
         // Converting tif file to pdf
 
         // Converting tif file to pdf
 
         String tifFile =  systemFolder + "\\" + file.getName();
 
         String tifFile =  systemFolder + "\\" + file.getName();
 
         String pdfFile =  systemFolder + "\\" + file.getName().toLowerCase().replace(".tif", ".pdf");
 
         String pdfFile =  systemFolder + "\\" + file.getName().toLowerCase().replace(".tif", ".pdf");
 
         log.info("Converting file:" + tifFile+" to:"+pdfFile);
 
         log.info("Converting file:" + tifFile+" to:"+pdfFile);
         String command = cognitiveCompressimo + tifFile + " " + pdfFile;
+
         String command = cognitivePdfa + tifFile + " " + pdfFile;
 
         Process process = Runtime.getRuntime().exec(command);
 
         Process process = Runtime.getRuntime().exec(command);
 
          
 
          
Line 39: Line 39:
 
         String line = null;
 
         String line = null;
  
         while ((line=input.readLine())!=null) {
+
         while ((line=input.readLine()) != null) {
 
             log.info(line);
 
             log.info(line);
 
         }
 
         }

Latest revision as of 13:42, 11 February 2013

Cognitive PDF/A is a powerful Cognitive Forms tool which it makes PDF/A ISO standard documents from scanned document images. OpenKM integrate Compressimo transparently using automation or crontab utilities.

Description:

  • Input server folder where images are stored systemFolder = "c:\\samples"
  • Cognitive PDF/A server path cognitivePdfa
  • OpenKM path where compressimo files are imported String path = "/okm:root/imported" + "/" + uploadFile.getName()
import java.io.*;
import java.util.*;
import com.openkm.module.db.stuff.DbSessionManager;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import com.openkm.bean.Document;
import com.openkm.api.OKMDocument;

String token = DbSessionManager.getInstance().getSystemToken();
String systemFolder = "c:\\samples";
String cognitivePdfa = "C:\\Users\\jllort\\Desktop\\cpdfa-1.4.4-dev-win32-1month\\cpdfa\\bin\\cpdfacli.exe splitdummy eng ";
Logger log = LoggerFactory.getLogger("com.openkm.compressimo");

// Loading files
log.info("***** Process BEGIN *****");
File folder = new File(systemFolder);
File[] listOfFiles = folder.listFiles();

for (int i=0; i<listOfFiles.length; i++) {
    File file = listOfFiles[i];

    if (file.isFile() && file.getName().toLowerCase().endsWith(".tif")) {
        // Converting tif file to pdf
        String tifFile =  systemFolder + "\\" + file.getName();
        String pdfFile =  systemFolder + "\\" + file.getName().toLowerCase().replace(".tif", ".pdf");
        log.info("Converting file:" + tifFile+" to:"+pdfFile);
        String command = cognitivePdfa + tifFile + " " + pdfFile;
        Process process = Runtime.getRuntime().exec(command);
        
        BufferedReader input = new BufferedReader(new InputStreamReader(process.getInputStream()));
        String line = null;

        while ((line=input.readLine()) != null) {
            log.info(line);
        }

        int exitVal = process.waitFor();
        log.info("Exit code " + exitVal);
        
        // Uploading pdf file
        File uploadFile = new File(pdfFile);
        Document doc = new Document();
	String path = "/okm:root/imported" + "/" + uploadFile.getName();
        log.info("Importing file:"+ pdfFile + " to:"+path);
	doc.setPath(path);
        FileInputStream fis = new FileInputStream(uploadFile);
	doc = OKMDocument.getInstance().create(token, doc, fis);
        
	// Deleting pdf File
        uploadFile.delete();
    }
}

log.info("***** Process END *****");

Example

Scanned files: Red square remark initial document size.

Okm user guide 360.png


Crontab compressimo importer task:

Okm user guide 361.png


OpenKM log execution server output:

Okm user guide 362.png


Imported files: Red square remark final document size.

Okm user guide 363.png


PDF/A compliance:

Okm user guide 364.png


Search engine search by content:

Okm user guide 365.png


For more information: