mirror of
https://github.com/Stirling-Tools/Stirling-PDF.git
synced 2025-06-14 03:25:02 +00:00
164 lines
6.4 KiB
Java
164 lines
6.4 KiB
Java
package stirling.software.SPDF.controller.api;
|
|
|
|
import java.io.ByteArrayOutputStream;
|
|
import java.io.IOException;
|
|
import java.nio.file.Files;
|
|
import java.nio.file.Path;
|
|
import java.util.ArrayList;
|
|
import java.util.List;
|
|
import java.util.stream.Collectors;
|
|
import java.util.zip.ZipEntry;
|
|
import java.util.zip.ZipOutputStream;
|
|
|
|
import org.apache.pdfbox.pdmodel.PDDocument;
|
|
import org.apache.pdfbox.pdmodel.PDPage;
|
|
import org.springframework.http.MediaType;
|
|
import org.springframework.http.ResponseEntity;
|
|
import org.springframework.web.bind.annotation.ModelAttribute;
|
|
import stirling.software.common.annotations.AutoJobPostMapping;
|
|
import org.springframework.web.bind.annotation.RequestMapping;
|
|
import org.springframework.web.bind.annotation.RestController;
|
|
import org.springframework.web.multipart.MultipartFile;
|
|
|
|
import io.github.pixee.security.Filenames;
|
|
import io.swagger.v3.oas.annotations.Operation;
|
|
import io.swagger.v3.oas.annotations.tags.Tag;
|
|
|
|
import lombok.RequiredArgsConstructor;
|
|
import lombok.extern.slf4j.Slf4j;
|
|
|
|
import stirling.software.SPDF.model.api.PDFWithPageNums;
|
|
import stirling.software.common.service.CustomPDFDocumentFactory;
|
|
import stirling.software.common.util.WebResponseUtils;
|
|
|
|
@RestController
|
|
@RequestMapping("/api/v1/general")
|
|
@Slf4j
|
|
@Tag(name = "General", description = "General APIs")
|
|
@RequiredArgsConstructor
|
|
public class SplitPDFController {
|
|
|
|
private final CustomPDFDocumentFactory pdfDocumentFactory;
|
|
|
|
@AutoJobPostMapping(consumes = "multipart/form-data", value = "/split-pages")
|
|
@Operation(
|
|
summary = "Split a PDF file into separate documents",
|
|
description =
|
|
"This endpoint splits a given PDF file into separate documents based on the"
|
|
+ " specified page numbers or ranges. Users can specify pages using"
|
|
+ " individual numbers, ranges, or 'all' for every page. Input:PDF"
|
|
+ " Output:PDF Type:SIMO")
|
|
public ResponseEntity<byte[]> splitPdf(@ModelAttribute PDFWithPageNums request)
|
|
throws IOException {
|
|
|
|
PDDocument document = null;
|
|
Path zipFile = null;
|
|
List<ByteArrayOutputStream> splitDocumentsBoas = new ArrayList<>();
|
|
|
|
try {
|
|
|
|
MultipartFile file = request.getFileInput();
|
|
String pages = request.getPageNumbers();
|
|
// open the pdf document
|
|
|
|
document = pdfDocumentFactory.load(file);
|
|
// PdfMetadata metadata = PdfMetadataService.extractMetadataFromPdf(document);
|
|
int totalPages = document.getNumberOfPages();
|
|
List<Integer> pageNumbers = request.getPageNumbersList(document, false);
|
|
if (!pageNumbers.contains(totalPages - 1)) {
|
|
// Create a mutable ArrayList so we can add to it
|
|
pageNumbers = new ArrayList<>(pageNumbers);
|
|
pageNumbers.add(totalPages - 1);
|
|
}
|
|
|
|
log.info(
|
|
"Splitting PDF into pages: {}",
|
|
pageNumbers.stream().map(String::valueOf).collect(Collectors.joining(",")));
|
|
|
|
// split the document
|
|
splitDocumentsBoas = new ArrayList<>();
|
|
int previousPageNumber = 0;
|
|
for (int splitPoint : pageNumbers) {
|
|
try (PDDocument splitDocument =
|
|
pdfDocumentFactory.createNewDocumentBasedOnOldDocument(document)) {
|
|
for (int i = previousPageNumber; i <= splitPoint; i++) {
|
|
PDPage page = document.getPage(i);
|
|
splitDocument.addPage(page);
|
|
log.info("Adding page {} to split document", i);
|
|
}
|
|
previousPageNumber = splitPoint + 1;
|
|
|
|
// Transfer metadata to split pdf
|
|
// PdfMetadataService.setMetadataToPdf(splitDocument, metadata);
|
|
|
|
ByteArrayOutputStream baos = new ByteArrayOutputStream();
|
|
splitDocument.save(baos);
|
|
|
|
splitDocumentsBoas.add(baos);
|
|
} catch (Exception e) {
|
|
log.error("Failed splitting documents and saving them", e);
|
|
throw e;
|
|
}
|
|
}
|
|
|
|
// closing the original document
|
|
document.close();
|
|
|
|
zipFile = Files.createTempFile("split_documents", ".zip");
|
|
|
|
String filename =
|
|
Filenames.toSimpleFileName(file.getOriginalFilename())
|
|
.replaceFirst("[.][^.]+$", "");
|
|
try (ZipOutputStream zipOut = new ZipOutputStream(Files.newOutputStream(zipFile))) {
|
|
// loop through the split documents and write them to the zip file
|
|
for (int i = 0; i < splitDocumentsBoas.size(); i++) {
|
|
String fileName = filename + "_" + (i + 1) + ".pdf";
|
|
ByteArrayOutputStream baos = splitDocumentsBoas.get(i);
|
|
byte[] pdf = baos.toByteArray();
|
|
|
|
// Add PDF file to the zip
|
|
ZipEntry pdfEntry = new ZipEntry(fileName);
|
|
zipOut.putNextEntry(pdfEntry);
|
|
zipOut.write(pdf);
|
|
zipOut.closeEntry();
|
|
|
|
log.info("Wrote split document {} to zip file", fileName);
|
|
}
|
|
} catch (Exception e) {
|
|
log.error("Failed writing to zip", e);
|
|
throw e;
|
|
}
|
|
|
|
log.info("Successfully created zip file with split documents: {}", zipFile.toString());
|
|
byte[] data = Files.readAllBytes(zipFile);
|
|
Files.deleteIfExists(zipFile);
|
|
|
|
// return the Resource in the response
|
|
return WebResponseUtils.bytesToWebResponse(
|
|
data, filename + ".zip", MediaType.APPLICATION_OCTET_STREAM);
|
|
|
|
} finally {
|
|
try {
|
|
// Close the main document
|
|
if (document != null) {
|
|
document.close();
|
|
}
|
|
|
|
// Close all ByteArrayOutputStreams
|
|
for (ByteArrayOutputStream baos : splitDocumentsBoas) {
|
|
if (baos != null) {
|
|
baos.close();
|
|
}
|
|
}
|
|
|
|
// Delete temporary zip file
|
|
if (zipFile != null) {
|
|
Files.deleteIfExists(zipFile);
|
|
}
|
|
} catch (Exception e) {
|
|
log.error("Error while cleaning up resources", e);
|
|
}
|
|
}
|
|
}
|
|
}
|