mirror of
https://github.com/Frooodle/Stirling-PDF.git
synced 2026-04-06 03:19:39 +02:00
Remove images (#5966)
This commit is contained in:
@@ -0,0 +1,137 @@
|
||||
package stirling.software.SPDF.controller.api.misc;
|
||||
|
||||
import java.io.ByteArrayOutputStream;
|
||||
import java.io.IOException;
|
||||
import java.util.ArrayList;
|
||||
import java.util.List;
|
||||
|
||||
import org.apache.pdfbox.cos.COSDictionary;
|
||||
import org.apache.pdfbox.cos.COSName;
|
||||
import org.apache.pdfbox.pdmodel.PDDocument;
|
||||
import org.apache.pdfbox.pdmodel.PDPage;
|
||||
import org.apache.pdfbox.pdmodel.PDResources;
|
||||
import org.apache.pdfbox.pdmodel.graphics.PDXObject;
|
||||
import org.apache.pdfbox.pdmodel.graphics.form.PDFormXObject;
|
||||
import org.apache.pdfbox.pdmodel.graphics.image.PDImageXObject;
|
||||
import org.springframework.http.MediaType;
|
||||
import org.springframework.http.ResponseEntity;
|
||||
import org.springframework.web.bind.annotation.ModelAttribute;
|
||||
import org.springframework.web.multipart.MultipartFile;
|
||||
|
||||
import io.swagger.v3.oas.annotations.Operation;
|
||||
|
||||
import lombok.RequiredArgsConstructor;
|
||||
import lombok.extern.slf4j.Slf4j;
|
||||
|
||||
import stirling.software.common.annotations.AutoJobPostMapping;
|
||||
import stirling.software.common.annotations.api.GeneralApi;
|
||||
import stirling.software.common.model.api.PDFFile;
|
||||
import stirling.software.common.service.CustomPDFDocumentFactory;
|
||||
import stirling.software.common.util.ExceptionUtils;
|
||||
import stirling.software.common.util.GeneralUtils;
|
||||
import stirling.software.common.util.WebResponseUtils;
|
||||
|
||||
@GeneralApi
|
||||
@Slf4j
|
||||
@RequiredArgsConstructor
|
||||
public class RemoveImagesController {
|
||||
|
||||
private final CustomPDFDocumentFactory pdfDocumentFactory;
|
||||
|
||||
@AutoJobPostMapping(consumes = MediaType.MULTIPART_FORM_DATA_VALUE, value = "/remove-image-pdf")
|
||||
@Operation(
|
||||
summary = "Remove images from PDF",
|
||||
description =
|
||||
"This endpoint removes all embedded images from a PDF file and returns the"
|
||||
+ " modified document. Input:PDF Output:PDF Type:SISO")
|
||||
public ResponseEntity<byte[]> removeImages(@ModelAttribute PDFFile request)
|
||||
throws IOException {
|
||||
|
||||
MultipartFile inputFile = request.getFileInput();
|
||||
|
||||
try (PDDocument pdfDoc = pdfDocumentFactory.load(request)) {
|
||||
|
||||
int totalPages = pdfDoc.getNumberOfPages();
|
||||
int imagesRemoved = 0;
|
||||
|
||||
for (int pageIndex = 0; pageIndex < totalPages; pageIndex++) {
|
||||
PDPage currentPage = pdfDoc.getPage(pageIndex);
|
||||
imagesRemoved += removeImagesFromPage(currentPage);
|
||||
}
|
||||
|
||||
log.info("Removed {} images from PDF with {} pages", imagesRemoved, totalPages);
|
||||
|
||||
ByteArrayOutputStream baos = new ByteArrayOutputStream();
|
||||
pdfDoc.save(baos);
|
||||
byte[] pdfContent = baos.toByteArray();
|
||||
|
||||
return WebResponseUtils.bytesToWebResponse(
|
||||
pdfContent,
|
||||
GeneralUtils.generateFilename(
|
||||
inputFile.getOriginalFilename(), "_images_removed.pdf"));
|
||||
|
||||
} catch (IOException e) {
|
||||
throw ExceptionUtils.handlePdfException(e, "during image removal");
|
||||
}
|
||||
}
|
||||
|
||||
private int removeImagesFromPage(PDPage page) throws IOException {
|
||||
int imagesRemoved = 0;
|
||||
|
||||
PDResources resources = page.getResources();
|
||||
if (resources == null) {
|
||||
return imagesRemoved;
|
||||
}
|
||||
|
||||
imagesRemoved += removeImagesFromResources(resources);
|
||||
return imagesRemoved;
|
||||
}
|
||||
|
||||
private int removeImagesFromFormXObject(PDFormXObject formXObject) throws IOException {
|
||||
PDResources resources = formXObject.getResources();
|
||||
if (resources == null) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
return removeImagesFromResources(resources);
|
||||
}
|
||||
|
||||
private int removeImagesFromResources(PDResources resources) throws IOException {
|
||||
if (resources == null) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
COSDictionary xObjects = resources.getCOSObject().getCOSDictionary(COSName.XOBJECT);
|
||||
if (xObjects == null) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
int imagesRemoved = 0;
|
||||
// Create snapshot to safely iterate while removing
|
||||
List<COSName> names = new ArrayList<>(xObjects.keySet());
|
||||
|
||||
for (COSName name : names) {
|
||||
try {
|
||||
PDXObject xObject = resources.getXObject(name);
|
||||
if (xObject == null) {
|
||||
continue;
|
||||
}
|
||||
|
||||
// Remove direct images
|
||||
if (xObject instanceof PDImageXObject) {
|
||||
xObjects.removeItem(name);
|
||||
imagesRemoved++;
|
||||
log.debug("Removed image: {}", name.getName());
|
||||
}
|
||||
// Recursively process nested form XObjects
|
||||
else if (xObject instanceof PDFormXObject form) {
|
||||
imagesRemoved += removeImagesFromResources(form.getResources());
|
||||
}
|
||||
} catch (IOException e) {
|
||||
log.warn("Error processing XObject {}: {}", name.getName(), e.getMessage());
|
||||
}
|
||||
}
|
||||
|
||||
return imagesRemoved;
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user