From e6defcc13d71dd28d886b22365e5a4d020163d10 Mon Sep 17 00:00:00 2001 From: Yokozuna Date: Sat, 19 Oct 2019 16:04:23 +0200 Subject: [PATCH] dification recadragePdf --- src/recadragePdf/CorrectionPdf.java | 10 + src/recadragePdf/DetectionPdf.java | 53 +++++ src/recadragePdf/LoadingExistingDocument.java | 38 ++++ src/recadragePdf/PdfAnalyzer.java | 195 ++++++++++++++++++ src/recadragePdf/PdfToImage.java | 102 +++++++++ 5 files changed, 398 insertions(+) create mode 100644 src/recadragePdf/CorrectionPdf.java create mode 100644 src/recadragePdf/DetectionPdf.java create mode 100644 src/recadragePdf/LoadingExistingDocument.java create mode 100644 src/recadragePdf/PdfAnalyzer.java create mode 100644 src/recadragePdf/PdfToImage.java diff --git a/src/recadragePdf/CorrectionPdf.java b/src/recadragePdf/CorrectionPdf.java new file mode 100644 index 0000000..7d380d2 --- /dev/null +++ b/src/recadragePdf/CorrectionPdf.java @@ -0,0 +1,10 @@ +package RecadragePdf; + +public class CorrectionPdf { + + public static void main(String[] args) { + // TODO Auto-generated method stub + + } + +} diff --git a/src/recadragePdf/DetectionPdf.java b/src/recadragePdf/DetectionPdf.java new file mode 100644 index 0000000..97bb839 --- /dev/null +++ b/src/recadragePdf/DetectionPdf.java @@ -0,0 +1,53 @@ +package RecadragePdf; + +import java.awt.Color; +import java.awt.image.BufferedImage; +import java.io.File; +import java.io.IOException; +import javax.imageio.ImageIO; + +public class DetectionPdf { + String dir=""; + String filename=""; + BufferedImage img; + + + public DetectionPdf(String directory,String file) { + dir=directory; + filename=file; + File f =new File(dir+filename); + + try { + img=ImageIO.read(f); + } catch (IOException e) { + System.out.println(e); + } + } + + public boolean estDroite() { //determine si l'image png/jpg du pdf est droite + int count=0; + boolean stop=false; + for (int ty=0; ty<100 && !stop;ty++) { + for (int tx=0;tximg.getWidth()/5.4 && count convertPagesToBWJPG(PDDocument document) { + ArrayList images = new ArrayList(); + PDFRenderer pdfRenderer = new PDFRenderer(document); + try { + int pageCounter = 0; + for (PDPage page : document.getPages()) { + System.out.println("page.getRotation() : " + page.getRotation()); + System.out.println("pageCounter : " + pageCounter); + BufferedImage bim = pdfRenderer.renderImageWithDPI(pageCounter++, 300, ImageType.BINARY); // BINARY = + // noir et + // blanc + images.add(bim); + System.out.println("Ajout n°" + pageCounter); + } + // document.close(); + } catch (IOException ioe) { + ioe.printStackTrace(); + } + return images; + } + + public void saveOnDisk(ArrayList images, String originalFileName) { + int pageCounter = 0; + try { + for (BufferedImage img : images) { + ImageIO.write(img, "JPEG", new File(originalFileName + pageCounter++ + ".jpg")); + } + } catch (IOException ioe) { + ioe.printStackTrace(); + } + } + + // public void drawRectangle(int x, int y) + + public static void main(String args[]) throws IOException { + + /* + * Pattern p = Pattern.compile("\\d{1,16}"); Matcher m = p.matcher("123456789"); + * boolean b = m.matches(); + */ + + PdfAnalyzer pdfAnalyzer = new PdfAnalyzer(); + File pdfFile; + PDDocument document = null; + ArrayList images = new ArrayList(); + BufferedImage img = null; + // File f = null; + + // CONVERT PAGES TO IMAGES + try { + String pdfFilename = "C:\\Users\\Nico\\Desktop\\M3302 - Sujet S3T 2019.pdf"; + pdfFile = new File(pdfFilename); + document = PDDocument.load(pdfFile); + images = pdfAnalyzer.convertPagesToBWJPG(document); + pdfAnalyzer.saveOnDisk(images, "C:\\Users\\Nico\\Desktop\\M3302 - Sujet S3T 2019.pdf"); + } catch (IOException e) { + System.out.println(e); + } /* + * if (!pdfAnalyzer.isBlackWhite(img)) { BufferedImage bw_image = + * pdfAnalyzer.blackWhiteConvert(img); } + */ + // DRAW RECTANGLE ON X,Y + // Create a Document object. + PDDocument pdDocument = new PDDocument(); + + // Create a Page object + PDPage pdPage = new PDPage(PDRectangle.A4); + int height = (int) pdPage.getMediaBox().getHeight(); + int width = (int) pdPage.getMediaBox().getWidth(); + System.out.println(height + " " + width); + // Add the page to the document and save the document to a desired file. + pdDocument.addPage(pdPage); + try { + // Create a Content Stream + PDPageContentStream pdPageContentStream = new PDPageContentStream(pdDocument, pdPage); + + // Set a Color for the Rectangle + pdPageContentStream.setNonStrokingColor(Color.BLACK); + // Give the X, Y coordinates and height and width + + PDFont font = PDType1Font.HELVETICA_BOLD; + + pdPageContentStream.setNonStrokingColor(0, 0, 0); // black text + pdPageContentStream.setFont(font, 9); + + String title = "Evaluation Pattern"; + + pdPageContentStream.beginText(); + pdPageContentStream.newLineAtOffset((width / 2) - title.length(), height - 10); + pdPageContentStream.showText(title); + pdPageContentStream.endText(); + + int count = 0; + for (int y = height - 50; y > (height / 2); y -= 25) { + // write some text + String enonce = "Question " + count + " : ..."; + pdPageContentStream.beginText(); + pdPageContentStream.newLineAtOffset(10, y); + pdPageContentStream.showText(enonce); + pdPageContentStream.endText(); + // draw an empty rectangle + pdPageContentStream.addRect(50, y - 15, 10, 10); // X (lower left x corner), Y (lower left y corner), + // Width, + // Height + pdPageContentStream.closeAndStroke(); + // write some text + pdPageContentStream.beginText(); + pdPageContentStream.newLineAtOffset(70, y - 15); + pdPageContentStream.showText("Question non cochée " + count); + pdPageContentStream.endText(); + // draw a filled rectangle + pdPageContentStream.addRect(200, y - 15, 10, 10); + pdPageContentStream.fill(); + // write some text + pdPageContentStream.beginText(); + pdPageContentStream.newLineAtOffset(220, y - 15); + pdPageContentStream.showText("Question cochée " + count++); + pdPageContentStream.endText(); + } + + // pdPageContentStream.fill(); + + // Once all the content is written, close the stream + pdPageContentStream.close(); + + pdDocument.save("C:\\Users\\Nico\\Desktop\\testPDFRect.pdf"); + pdDocument.close(); + System.out.println("PDF saved to the location !!!"); + + } catch (IOException ioe) { + System.out.println("Error while saving pdf" + ioe.getMessage()); + } + } +} diff --git a/src/recadragePdf/PdfToImage.java b/src/recadragePdf/PdfToImage.java new file mode 100644 index 0000000..4dac2ac --- /dev/null +++ b/src/recadragePdf/PdfToImage.java @@ -0,0 +1,102 @@ +package RecadragePdf; + +import java.awt.image.BufferedImage; +import java.io.File; +import java.io.IOException; +import java.util.ArrayList; + +import javax.imageio.ImageIO; + +import org.apache.pdfbox.pdmodel.PDDocument; +import org.apache.pdfbox.pdmodel.PDPage; +import org.apache.pdfbox.rendering.ImageType; +import org.apache.pdfbox.rendering.PDFRenderer; + +public class PdfToImage { + public BufferedImage blackWhiteConvert(BufferedImage image) { + // Convertit une image en image en noir et blanc + // TODO : voir recursivite + int width = image.getWidth(); + int height = image.getHeight(); + for (int x = 0; x < width; x++) { + for (int y = 0; y < height; y++) { + if (image.getRGB(x, y) < 128) { + image.setRGB(x, y, 0); + } else { + image.setRGB(x, y, 255); + } + } + } + return image; + } + + public boolean isBlackWhite(BufferedImage image) { + // verifie si une image est en noir et blanc + // TODO : voir recursivite + int width = image.getWidth(); + int height = image.getHeight(); + for (int x = 0; x < width; x++) { + for (int y = 0; y < height; y++) { + if ((image.getRGB(x, y) != 0) || (image.getRGB(x, y) != 255)) { + return false; + } + } + } + return true; + } + + public ArrayList convertPagesToBWJPG(PDDocument document) { + // convertit chaque page d'un document pdf en image noir et blanc + // retourne une array liste d'images + ArrayList images = new ArrayList(); + PDFRenderer pdfRenderer = new PDFRenderer(document); + try { + int pageCounter = 0; + for (PDPage page : document.getPages()) { + System.out.println("page.getRotation() : " + page.getRotation()); + System.out.println("pageCounter : " + pageCounter); + BufferedImage bim = pdfRenderer.renderImageWithDPI(pageCounter++, 300, ImageType.BINARY); // BINARY = + // noir et + // blanc + images.add(bim); + System.out.println("Ajout n°" + pageCounter); + } + // document.close(); + } catch (IOException ioe) { + ioe.printStackTrace(); + } + return images; + } + + public void saveOnDisk(ArrayList images, String originalFileDir) { + // sauvegarde sur le disque les images + int pageCounter = 0; + try { + for (BufferedImage img : images) { + ImageIO.write(img, "JPEG", new File(originalFileDir + "img_" + pageCounter++ + ".jpg")); + } + } catch (IOException ioe) { + ioe.printStackTrace(); + } + } + + public static void main(String args[]) throws IOException { + + PdfAnalyzer pdfAnalyzer = new PdfAnalyzer(); + File pdfFile; + PDDocument document = null; + ArrayList images = new ArrayList(); // stockera les images (resultat) + + // CONVERT PAGES TO IMAGES + try { + String pdfFilename = "DOC-sujet.pdf"; // nom du fichier pdf à ouvrir (TODO: changer le chemin) + pdfFile = new File(pdfFilename); // cree un fichier pdf (non sauvegarde sur le disque) + document = PDDocument.load(pdfFile); // charge le fichier pdf cree pour le traiter + images = pdfAnalyzer.convertPagesToBWJPG(document); // appelle la methode qui convertit les pages en images + // (jpg) noir et blanches + pdfAnalyzer.saveOnDisk(images, "C:\\Users\\kg403211\\eclipse-workspace\\QCM\\src\\RecadragePdf\\Pdf"); // sauvegarde les images au chemin specifie (TODO: changer le chemin) + } catch (IOException e) { + System.out.println(e); + } + } +}