diff --git a/.github/workflows/licenses-update.yml b/.github/workflows/licenses-update.yml index 8c1e1c29..409735c0 100644 --- a/.github/workflows/licenses-update.yml +++ b/.github/workflows/licenses-update.yml @@ -52,7 +52,7 @@ jobs: - name: Create Pull Request id: cpr if: env.CHANGES_DETECTED == 'true' - uses: peter-evans/create-pull-request@c5a7806660adbe173f04e3e038b0ccdcd758773c # v6.1.0 + uses: peter-evans/create-pull-request@5e914681df9dc83aa4e4905692ca88beb2f9e91f # v7.0.5 with: token: ${{ secrets.GITHUB_TOKEN }} commit-message: "Update 3rd Party Licenses" @@ -65,9 +65,10 @@ jobs: Auto-generated by [create-pull-request][1] [1]: https://github.com/peter-evans/create-pull-request - labels: licenses + labels: licenses,github-actions draft: false delete-branch: true + sign-commits: true - name: Auto approve if: steps.cpr.outputs.pull-request-operation == 'created' diff --git a/.github/workflows/multiOSReleases.yml b/.github/workflows/multiOSReleases.yml index 2792a909..e445dc2b 100644 --- a/.github/workflows/multiOSReleases.yml +++ b/.github/workflows/multiOSReleases.yml @@ -99,6 +99,6 @@ jobs: if-no-files-found: error - name: Upload binaries to release - uses: softprops/action-gh-release@7b4da11513bf3f43f9999e90eabced41ab8bb048 # v2.2.0 + uses: softprops/action-gh-release@01570a1f39cb168c169c802c3bceb9e93fb10974 # v2.1.0 with: files: ./Stirling-PDF-${{ matrix.platform }}-installer.${{ matrix.ext }} diff --git a/.github/workflows/pre_commit.yml b/.github/workflows/pre_commit.yml new file mode 100644 index 00000000..b8948ded --- /dev/null +++ b/.github/workflows/pre_commit.yml @@ -0,0 +1,55 @@ +name: Pre-commit + +on: + push: + branches: [main] + +permissions: read-all + +jobs: + update: + if: ${{ github.event.pull_request.user.login != 'dependabot[bot]' }} + runs-on: ubuntu-latest + permissions: + contents: write + pull-requests: write + steps: + - name: Checkout repository + uses: actions/checkout@v4 + with: + token: ${{ secrets.GITHUB_TOKEN }} + - name: Set up Python + uses: actions/setup-python@v5 + with: + python-version: 3.12 + - name: Set up git config + run: | + git config --global user.name "github-actions[bot]" + git config --global user.email "github-actions[bot]@users.noreply.github.com" + - name: Install Dependencies + run: | + pip install pre-commit==4.0.1 + - name: Run pre-commit and git add + run: | + pre-commit run -c .pre-commit-config.yaml || true + git add . + git diff --staged --quiet || git commit -m ":file_folder: pre-commit + > Made via .github/workflows/pre_commit.yml" || echo "pre-commit: no changes" + - name: Create Pull Request + uses: peter-evans/create-pull-request@5e914681df9dc83aa4e4905692ca88beb2f9e91f # v7.0.5 + with: + token: ${{ secrets.GITHUB_TOKEN }} + commit-message: Update files + committer: GitHub Action + author: GitHub Action + signoff: true + branch: pre-commit + title: "🔨 [pre-commit] Update files by " + body: | + Auto-generated by [create-pull-request][1] + + [1]: https://github.com/peter-evans/create-pull-request + draft: false + delete-branch: true + labels: github-actions + sign-commits: true diff --git a/.github/workflows/push-docker.yml b/.github/workflows/push-docker.yml index a36aec1a..590e90cf 100644 --- a/.github/workflows/push-docker.yml +++ b/.github/workflows/push-docker.yml @@ -7,7 +7,10 @@ on: - master - main -permissions: read-all +permissions: + contents: read + packages: write + id-token: write jobs: push: @@ -37,6 +40,11 @@ jobs: env: DOCKER_ENABLE_SECURITY: false + - name: Install cosign + uses: sigstore/cosign-installer@v3.7.0 + with: + cosign-release: 'v2.4.1' + - name: Set up Docker Buildx id: buildx uses: docker/setup-buildx-action@6524bf65af31da8d45b59e8c27de4bd072b392f5 # v3.8.0 @@ -80,6 +88,7 @@ jobs: type=raw,value=alpha,enable=${{ github.ref == 'refs/heads/main' }} - name: Build and push main Dockerfile + id: build-push-regular uses: docker/build-push-action@48aba3b46d1b1fec4febb7c5d0c644b249a11355 # v6.10.0 with: builder: ${{ steps.buildx.outputs.name }} @@ -92,6 +101,35 @@ jobs: labels: ${{ steps.meta.outputs.labels }} build-args: VERSION_TAG=${{ steps.versionNumber.outputs.versionNumber }} platforms: linux/amd64,linux/arm64/v8 + provenance: true + sbom: true + + - name: Sign regular images + env: + DIGEST: ${{ steps.build-push-regular.outputs.digest }} + TAGS: ${{ steps.meta.outputs.tags }} + COSIGN_PRIVATE_KEY: ${{ secrets.COSIGN_PRIVATE_KEY }} + COSIGN_PASSWORD: ${{ secrets.COSIGN_PASSWORD }} + run: | + # Always sign images regardless of branch + echo "$TAGS" | tr ',' '\n' | while read -r tag; do + cosign sign --yes \ + --key env://COSIGN_PRIVATE_KEY \ + "${tag}@${DIGEST}" + done + + # For alpha builds specifically, we want to ensure they're marked as development builds + if [[ "${{ github.ref }}" == "refs/heads/main" ]]; then + echo "Signing alpha build with development attestation" + echo "$TAGS" | tr ',' '\n' | while read -r tag; do + if [[ $tag == *":alpha" ]]; then + cosign attest --key env://COSIGN_PRIVATE_KEY \ + --predicate <(echo '{"type":"development"}') \ + --yes "${tag}@${DIGEST}" + fi + done + fi + - name: Generate tags ultra-lite id: meta2 @@ -108,11 +146,12 @@ jobs: type=raw,value=latest-ultra-lite,enable=${{ github.ref == 'refs/heads/master' }} - name: Build and push Dockerfile-ultra-lite + id: build-push-lite uses: docker/build-push-action@48aba3b46d1b1fec4febb7c5d0c644b249a11355 # v6.10.0 if: github.ref != 'refs/heads/main' with: context: . - file: ./Dockerfile-ultra-lite + file: ./Dockerfile.ultra-lite push: true cache-from: type=gha cache-to: type=gha,mode=max @@ -120,6 +159,20 @@ jobs: labels: ${{ steps.meta2.outputs.labels }} build-args: VERSION_TAG=${{ steps.versionNumber.outputs.versionNumber }} platforms: linux/amd64,linux/arm64/v8 + provenance: true + sbom: true + + - name: Sign ultra-lite images + if: github.ref != 'refs/heads/main' + env: + DIGEST: ${{ steps.build-push-lite.outputs.digest }} + TAGS: ${{ steps.meta2.outputs.tags }} + COSIGN_PRIVATE_KEY: ${{ secrets.COSIGN_PRIVATE_KEY }} + COSIGN_PASSWORD: ${{ secrets.COSIGN_PASSWORD }} + run: | + echo "$TAGS" | tr ',' '\n' | while read -r tag; do + cosign sign --key env://COSIGN_PRIVATE_KEY --yes "${tag}@${DIGEST}" + done - name: Generate tags fat id: meta3 @@ -136,12 +189,13 @@ jobs: type=raw,value=latest-fat,enable=${{ github.ref == 'refs/heads/master' }} - name: Build and push main Dockerfile fat + id: build-push-fat uses: docker/build-push-action@48aba3b46d1b1fec4febb7c5d0c644b249a11355 # v6.10.0 if: github.ref != 'refs/heads/main' with: builder: ${{ steps.buildx.outputs.name }} context: . - file: ./Dockerfile-fat + file: ./Dockerfile.fat push: true cache-from: type=gha cache-to: type=gha,mode=max @@ -149,3 +203,17 @@ jobs: labels: ${{ steps.meta3.outputs.labels }} build-args: VERSION_TAG=${{ steps.versionNumber.outputs.versionNumber }} platforms: linux/amd64,linux/arm64/v8 + provenance: true + sbom: true + + - name: Sign fat images + if: github.ref != 'refs/heads/main' + env: + DIGEST: ${{ steps.build-push-fat.outputs.digest }} + TAGS: ${{ steps.meta3.outputs.tags }} + COSIGN_PRIVATE_KEY: ${{ secrets.COSIGN_PRIVATE_KEY }} + COSIGN_PASSWORD: ${{ secrets.COSIGN_PASSWORD }} + run: | + echo "$TAGS" | tr ',' '\n' | while read -r tag; do + cosign sign --key env://COSIGN_PRIVATE_KEY --yes "${tag}@${DIGEST}" + done diff --git a/.github/workflows/releaseArtifacts.yml b/.github/workflows/releaseArtifacts.yml index ceaa1d0f..21f2fb14 100644 --- a/.github/workflows/releaseArtifacts.yml +++ b/.github/workflows/releaseArtifacts.yml @@ -62,7 +62,7 @@ jobs: if-no-files-found: error - name: Upload binaries to release - uses: softprops/action-gh-release@7b4da11513bf3f43f9999e90eabced41ab8bb048 # v2.2.0 + uses: softprops/action-gh-release@01570a1f39cb168c169c802c3bceb9e93fb10974 # v2.1.0 with: files: ./build/launch4j/Stirling-PDF-Server${{ matrix.file_suffix }}.exe @@ -79,6 +79,6 @@ jobs: if-no-files-found: error - name: Upload jar binaries to release - uses: softprops/action-gh-release@7b4da11513bf3f43f9999e90eabced41ab8bb048 # v2.2.0 + uses: softprops/action-gh-release@01570a1f39cb168c169c802c3bceb9e93fb10974 # v2.1.0 with: files: ./build/libs/Stirling-PDF${{ matrix.file_suffix }}.jar diff --git a/.github/workflows/sync_files.yml b/.github/workflows/sync_files.yml index fc4a2fce..fbbb56ab 100644 --- a/.github/workflows/sync_files.yml +++ b/.github/workflows/sync_files.yml @@ -42,7 +42,7 @@ jobs: git diff --staged --quiet || git commit -m ":memo: Sync README > Made via sync_files.yml" || echo "no changes" - name: Create Pull Request - uses: peter-evans/create-pull-request@c5a7806660adbe173f04e3e038b0ccdcd758773c # v6.1.0 + uses: peter-evans/create-pull-request@5e914681df9dc83aa4e4905692ca88beb2f9e91f # v7.0.5 with: token: ${{ secrets.GITHUB_TOKEN }} commit-message: Update files @@ -58,3 +58,4 @@ jobs: draft: false delete-branch: true labels: Documentation,Translation,github-actions + sign-commits: true diff --git a/.github/workflows/update-translations.yml b/.github/workflows/update-translations.yml index 141d9a72..c6b408c3 100644 --- a/.github/workflows/update-translations.yml +++ b/.github/workflows/update-translations.yml @@ -65,7 +65,7 @@ jobs: Auto-generated by [create-pull-request][1] [1]: https://github.com/peter-evans/create-pull-request - labels: Translation draft: false delete-branch: true + labels: Translation,github-actions sign-commits: true diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index 47f6215c..463cb433 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -18,9 +18,9 @@ For a detailed pull request tutorial, see [this guide](https://www.digitalocean. Please make sure your Pull Request adheres to the following guidelines: - Use the PR template provided. -- Keep your Pull Request title succinct, detailed and to the point. +- Keep your Pull Request title succinct, detailed, and to the point. - Keep commits atomic. One commit should contain one change. If you want to make multiple changes, submit multiple Pull Requests. -- Commits should be clear, concise and easy to understand. +- Commits should be clear, concise, and easy to understand. - References to the Issue number in the Pull Request and/or Commit message. ## Translations @@ -29,15 +29,15 @@ If you would like to add or modify a translation, please see [How to add new lan ## Docs -Documentation for Stirling-PDF is handled in a separate repository. Please see [Docs repository](https://github.com/Stirling-Tools/Stirling-Tools.github.io) or use "edit this page"-button at the bottom of each page at [https://docs.stirlingpdf.com/](https://docs.stirlingpdf.com/). +Documentation for Stirling-PDF is handled in a separate repository. Please see [Docs repository](https://github.com/Stirling-Tools/Stirling-Tools.github.io) or use the "edit this page"-button at the bottom of each page at [https://docs.stirlingpdf.com/](https://docs.stirlingpdf.com/). ## Fixing Bugs or Adding a New Feature First, make sure you've read the section [Pull Requests](#pull-requests). -To build from source, please follow this [Guide](LocalRunGuide.md). +To build from the source, please follow this [Guide](LocalRunGuide.md). -If, at any point of time, you have a question, please feel free to ask in the same issue thread or in our [Discord](https://discord.gg/FJUSXUSYec). +If, at any point in time, you have a question, please feel free to ask in the same issue thread or in our [Discord](https://discord.gg/FJUSXUSYec). ## License diff --git a/DeveloperGuide.md b/DeveloperGuide.md index 66b1751e..ac0004ff 100644 --- a/DeveloperGuide.md +++ b/DeveloperGuide.md @@ -2,7 +2,7 @@ ## 1. Introduction -Stirling-PDF is a robust, locally hosted web-based PDF manipulation tool. This guide focuses on Docker-based development and testing, which is the recommended approach for working with the full version of Stirling-PDF. +Stirling-PDF is a robust, locally hosted, web-based PDF manipulation tool. This guide focuses on Docker-based development and testing, which is the recommended approach for working with the full version of Stirling-PDF. ## 2. Project Overview @@ -25,7 +25,7 @@ Stirling-PDF is built using: - Docker - Git - Java JDK 17 or later -- Gradle 7.0 or later (Included within repo) +- Gradle 7.0 or later (Included within the repo) ### Setup Steps @@ -38,14 +38,14 @@ Stirling-PDF is built using: 2. Install Docker and JDK17 if not already installed. -3. Install a recommended Java IDE such as Eclipse, IntelliJ or VSCode +3. Install a recommended Java IDE such as Eclipse, IntelliJ, or VSCode 4. Lombok Setup Stirling-PDF uses Lombok to reduce boilerplate code. Some IDEs, like Eclipse, don't support Lombok out of the box. To set up Lombok in your development environment: Visit the [Lombok website](https://projectlombok.org/setup/) for installation instructions specific to your IDE. 5. Add environment variable -For local testing you should generally be testing the full 'Security' version of Stirling-PDF to do this you must add the environment flag DOCKER_ENABLE_SECURITY=true to your system and/or IDE build/run step +For local testing, you should generally be testing the full 'Security' version of Stirling-PDF. To do this, you must add the environment flag DOCKER_ENABLE_SECURITY=true to your system and/or IDE build/run step. ## 4. Project Structure @@ -86,8 +86,8 @@ Stirling-PDF/ │ └── SPDF/ ├── build.gradle # Gradle build configuration ├── Dockerfile # Main Dockerfile -├── Dockerfile-ultra-lite # Dockerfile for ultra-lite version -├── Dockerfile-fat # Dockerfile for fat version +├── Dockerfile.ultra-lite # Dockerfile for ultra-lite version +├── Dockerfile.fat # Dockerfile for fat version ├── docker-compose.yml # Docker Compose configuration └── test.sh # Test script to deploy all docker versions and run cuke tests ``` @@ -102,7 +102,7 @@ Stirling-PDF offers several Docker versions: ### Example Docker Compose Files -Stirling-PDF provides several example Docker Compose files in the `exampleYmlFiles` directory such as : +Stirling-PDF provides several example Docker Compose files in the `exampleYmlFiles` directory, such as: - `docker-compose-latest.yml`: Latest version without security features - `docker-compose-latest-security.yml`: Latest version with security features enabled @@ -179,14 +179,14 @@ Stirling-PDF uses different Docker images for various configurations. The build For the ultra-lite version: ```bash - docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-ultra-lite -f ./Dockerfile-ultra-lite . + docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-ultra-lite -f ./Dockerfile.ultra-lite . ``` For the fat version (with security enabled): ```bash export DOCKER_ENABLE_SECURITY=true - docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-fat -f ./Dockerfile-fat . + docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-fat -f ./Dockerfile.fat . ``` Note: The `--no-cache` and `--pull` flags ensure that the build process uses the latest base images and doesn't use cached layers, which is useful for testing and ensuring reproducible builds. however to improve build times these can often be removed depending on your usecase @@ -205,9 +205,9 @@ To run the test script: This script performs the following actions: -1. Builds all Docker images (full, ultra-lite, fat) -2. Runs each version to ensure it starts correctly -3. Executes Cucumber tests against main version and ensures feature compatibility, in the event these tests fail your PR will not be merged +1. Builds all Docker images (full, ultra-lite, fat). +2. Runs each version to ensure it starts correctly. +3. Executes Cucumber tests against the main version and ensures feature compatibility. In the event these tests fail, your PR will not be merged. Note: The `test.sh` script will run automatically when you raise a PR. However, it's recommended to run it locally first to save resources and catch any issues early. @@ -229,7 +229,7 @@ For quick iterations and development of Java backend, JavaScript, and UI compone To run Stirling-PDF locally: -1. Compile and run the project using built in IDE methods or by running: +1. Compile and run the project using built-in IDE methods or by running: ```bash ./gradlew bootRun @@ -261,7 +261,7 @@ Important notes: 6. Push your changes to your fork. 7. Submit a pull request to the main repository. -8. See additional [contributing guidelines](https://github.com/Stirling-Tools/Stirling-PDF/blob/main/CONTRIBUTING.md) +8. See additional [contributing guidelines](https://github.com/Stirling-Tools/Stirling-PDF/blob/main/CONTRIBUTING.md). When you raise a PR: @@ -317,7 +317,7 @@ Remember to test your changes thoroughly to ensure they don't break any existing ### Overview of Thymeleaf -Thymeleaf is a server-side Java HTML template engine. It is used in Stirling-PDF to render dynamic web pages. Thymeleaf integrates heavily with Spring Boot +Thymeleaf is a server-side Java HTML template engine. It is used in Stirling-PDF to render dynamic web pages. Thymeleaf integrates heavily with Spring Boot. ### Thymeleaf overview @@ -327,22 +327,24 @@ Some examples of this are: ```html +``` or +```html ``` -Where it uses the th:block, th: indicating its a special thymeleaf element to be used serverside in generating the html, and block being the actual element type. -In this case we are inserting the ``navbar`` entry within the ``fragments/navbar.html`` fragment into the ``th:block`` element. +Where it uses the `th:block`, `th:` indicating it's a special Thymeleaf element to be used server-side in generating the HTML, and block being the actual element type. +In this case, we are inserting the `navbar` entry within the `fragments/navbar.html` fragment into the `th:block` element. -They can be more complex such as: +They can be more complex, such as: ```html ``` -Which is the same as above but passes the parameters title and header into the fragment common.html to be used in its HTML generation +Which is the same as above but passes the parameters title and header into the fragment `common.html` to be used in its HTML generation. -Thymeleaf can also be used to loop through objects or pass things from java side into html side. +Thymeleaf can also be used to loop through objects or pass things from the Java side into the HTML side. ```java @GetMapping @@ -352,7 +354,7 @@ Thymeleaf can also be used to loop through objects or pass things from java side } ``` -in above example if exampleData is a list of plain java objects of class Person and within it you had id, name, age etc. You can reference it like so +In the above example, if exampleData is a list of plain java objects of class Person and within it, you had id, name, age, etc. You can reference it like so ```html @@ -452,7 +454,7 @@ This would generate n entries of tr for each person in exampleData 1. **Create a New Thymeleaf Template:** - Create a new HTML file in the `src/main/resources/templates` directory. - Use Thymeleaf attributes to dynamically generate content. - - Use `extract-page.html` as a base example for the HTML template, useful to ensure importing of the general layout, navbar and footer. + - Use `extract-page.html` as a base example for the HTML template, which is useful to ensure importing of the general layout, navbar, and footer. ```html diff --git a/Dockerfile b/Dockerfile index 9577c9ca..900f4a40 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,5 +1,5 @@ # Main stage -FROM alpine:3.20.3@sha256:1e42bbe2508154c9126d48c2b8a75420c3544343bf86fd041fb7527e017a4b4a +FROM alpine:3.20.3 # Copy necessary files COPY scripts /scripts @@ -10,6 +10,18 @@ COPY build/libs/*.jar app.jar ARG VERSION_TAG +LABEL org.opencontainers.image.title="Stirling-PDF" +LABEL org.opencontainers.image.description="A powerful locally hosted web-based PDF manipulation tool supporting 50+ operations including merging, splitting, conversion, OCR, watermarking, and more." +LABEL org.opencontainers.image.source="https://github.com/Stirling-Tools/Stirling-PDF" +LABEL org.opencontainers.image.licenses="MIT" +LABEL org.opencontainers.image.vendor="Stirling-Tools" +LABEL org.opencontainers.image.url="https://www.stirlingpdf.com" +LABEL org.opencontainers.image.documentation="https://docs.stirlingpdf.com" +LABEL maintainer="Stirling-Tools" +LABEL org.opencontainers.image.authors="Stirling-Tools" +LABEL org.opencontainers.image.version="${VERSION_TAG}" +LABEL org.opencontainers.image.keywords="PDF, manipulation, merge, split, convert, OCR, watermark" + # Set Environment Variables ENV DOCKER_ENABLE_SECURITY=false \ VERSION_TAG=$VERSION_TAG \ @@ -19,6 +31,7 @@ ENV DOCKER_ENABLE_SECURITY=false \ PGID=1000 \ UMASK=022 + # JDK for app RUN echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/main" | tee -a /etc/apk/repositories && \ echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/community" | tee -a /etc/apk/repositories && \ @@ -57,8 +70,7 @@ RUN echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/main" | tee -a /et # User permissions addgroup -S stirlingpdfgroup && adduser -S stirlingpdfuser -G stirlingpdfgroup && \ chown -R stirlingpdfuser:stirlingpdfgroup $HOME /scripts /usr/share/fonts/opentype/noto /configs /customFiles /pipeline && \ - chown stirlingpdfuser:stirlingpdfgroup /app.jar && \ - tesseract --list-langs + chown stirlingpdfuser:stirlingpdfgroup /app.jar EXPOSE 8080/tcp diff --git a/Dockerfile-fat b/Dockerfile.fat similarity index 95% rename from Dockerfile-fat rename to Dockerfile.fat index c9641590..1ee20176 100644 --- a/Dockerfile-fat +++ b/Dockerfile.fat @@ -1,5 +1,5 @@ # Build the application -FROM gradle:8.12-jdk17 AS build +FROM gradle:8.11-jdk17 AS build # Set the working directory WORKDIR /app @@ -73,8 +73,7 @@ RUN echo "@testing https://dl-cdn.alpinelinux.org/alpine/edge/main" | tee -a /et # User permissions addgroup -S stirlingpdfgroup && adduser -S stirlingpdfuser -G stirlingpdfgroup && \ chown -R stirlingpdfuser:stirlingpdfgroup $HOME /scripts /usr/share/fonts/opentype/noto /configs /customFiles /pipeline && \ - chown stirlingpdfuser:stirlingpdfgroup /app.jar && \ - tesseract --list-langs + chown stirlingpdfuser:stirlingpdfgroup /app.jar EXPOSE 8080/tcp diff --git a/Dockerfile-ultra-lite b/Dockerfile.ultra-lite similarity index 94% rename from Dockerfile-ultra-lite rename to Dockerfile.ultra-lite index 09e4a5a3..4953f338 100644 --- a/Dockerfile-ultra-lite +++ b/Dockerfile.ultra-lite @@ -1,5 +1,5 @@ # use alpine -FROM alpine:3.21.0 +FROM alpine:3.21.0@sha256:21dc6063fd678b478f57c0e13f47560d0ea4eeba26dfc947b2a4f81f686b9f45 ARG VERSION_TAG diff --git a/HowToUseOCR.md b/HowToUseOCR.md index 0a5cc94c..f529b72c 100644 --- a/HowToUseOCR.md +++ b/HowToUseOCR.md @@ -92,8 +92,9 @@ Verify installation: ``tesseract --list-langs`` You must then edit your ``/configs/settings.yml`` and change the system.tessdataDir to match the directory containing lang files + ``` system: tessdataDir: C:/Program Files/Tesseract-OCR/tessdata # path to the directory containing the Tessdata files. This setting is relevant for Windows systems. For Windows users, this path should be adjusted to point to the appropriate directory where the Tessdata files are stored. ``` - + \ No newline at end of file diff --git a/LocalRunGuide.md b/LocalRunGuide.md index 124cff9b..177299c6 100644 --- a/LocalRunGuide.md +++ b/LocalRunGuide.md @@ -13,7 +13,7 @@ You could theoretically use a Distrobox/Toolbox if your distribution has old or Install the following software, if not already installed: - Java 17 or later (21 recommended) -- Gradle 7.0 or later (included within repo so not needed on server) +- Gradle 7.0 or later (included within the repo, so not needed on the server) - Git - Python 3.8 (with pip) - Make @@ -32,7 +32,7 @@ sudo apt-get update sudo apt-get install -y git automake autoconf libtool libleptonica-dev pkg-config zlib1g-dev make g++ openjdk-21-jdk python3 python3-pip ``` -For Fedora-based systems use this command: +For Fedora-based systems, use this command: ```bash sudo dnf install -y git automake autoconf libtool leptonica-devel pkg-config zlib-devel make gcc-c++ java-21-openjdk python3 python3-pip @@ -68,7 +68,7 @@ nix-env -iA nixpkgs.jbig2enc ### Step 3: Install Additional Software -Next we need to install LibreOffice for conversions, qpdf for OCR, and OpenCV for pattern recognition functionality. +Next, we need to install LibreOffice for conversions, qpdf for OCR, and OpenCV for pattern recognition functionality. Install the following software: @@ -232,7 +232,7 @@ Terminal=true; EOF ``` -Note: Currently the app will run in the background until manually closed. +Note: Currently, the app will run in the background until it is manually closed. ### Optional: Changing the Host and Port of the Application @@ -251,7 +251,7 @@ server: ### Optional: Run Stirling-PDF as a Service (requires root) -First create a `.env` file, where you can store environment variables: +First, create a `.env` file, where you can store environment variables: ```bash touch /opt/Stirling-PDF/.env @@ -265,7 +265,7 @@ Create a new file where we store our service settings and open it with the nano nano /etc/systemd/system/stirlingpdf.service ``` -Paste this content, make sure to update the filename of the jar file. Press `Ctrl+S` and `Ctrl+X` to save and exit the nano editor: +Paste this content, and make sure to update the filename of the jar file. Press `Ctrl+S` and `Ctrl+X` to save and exit the nano editor: ```ini [Unit] diff --git a/README.md b/README.md index 5b879378..662fcb77 100644 --- a/README.md +++ b/README.md @@ -26,12 +26,11 @@ All files and PDFs exist either exclusively on the client side, reside in server - Optional Login and Authentication support (see [here](https://github.com/Stirling-Tools/Stirling-PDF/tree/main#login-authentication) for documentation) - Database Backup and Import (see [here](https://github.com/Stirling-Tools/Stirling-PDF/blob/main/DATABASE.md) for documentation) - ## PDF Features ### Page Operations -- View and modify PDFs - View multi-page PDFs with custom viewing, sorting, and searching. Plus on-page edit features like annotate, draw, and adding text and images. (Using PDF.js with Joxit and Liberation fonts) +- View and modify PDFs - View multi-page PDFs with custom viewing, sorting, and searching. Plus, on-page edit features like annotating, drawing, and adding text and images. (Using PDF.js with Joxit and Liberation fonts) - Full interactive GUI for merging/splitting/rotating/moving PDFs and their pages - Merge multiple PDFs into a single resultant file - Split PDFs into multiple files at specified page numbers or extract all pages as individual files @@ -42,11 +41,11 @@ All files and PDFs exist either exclusively on the client side, reside in server - Scale page contents size by set percentage - Adjust contrast - Crop PDF -- Auto split PDF (with physically scanned page dividers) +- Auto-split PDF (with physically scanned page dividers) - Extract page(s) - Convert PDF to a single page - Overlay PDFs on top of each other -- PDF to single page +- PDF to a single page - Split PDF by sections ### Conversion Operations @@ -55,7 +54,7 @@ All files and PDFs exist either exclusively on the client side, reside in server - Convert any common file to PDF (using LibreOffice) - Convert PDF to Word/PowerPoint/others (using LibreOffice) - Convert HTML to PDF -- Convert PDF to xml +- Convert PDF to XML - Convert PDF to CSV - URL to PDF - Markdown to PDF @@ -83,9 +82,9 @@ All files and PDFs exist either exclusively on the client side, reside in server - Extract images from scans - Remove annotations - Add page numbers -- Auto rename file by detecting PDF header text -- OCR on PDF (using tesseract) -- PDF/A conversion (using libreoffice) +- Auto-rename files by detecting PDF header text +- OCR on PDF (using Tesseract OCR) +- PDF/A conversion (using LibreOffice) - Edit metadata - Flatten PDFs - Get all information on a PDF to view or export as JSON @@ -121,7 +120,7 @@ Please view the [LocalRunGuide](https://github.com/Stirling-Tools/Stirling-PDF/b > [!NOTE] > -Stirling-PDF has three different versions: a full version, an ultra-lite version, and a 'fat' version. Depending on the types of features you use, you may want a smaller image to save on space. To see what the different versions offer, please look at our [version mapping](https://github.com/Stirling-Tools/Stirling-PDF/blob/main/Version-groups.md). For people that don't mind space optimization, just use the latest tag. +Stirling-PDF has three different versions: a full version, an ultra-lite version, and a 'fat' version. Depending on the types of features you use, you may want a smaller image to save on space. To see what the different versions offer, please look at our [version mapping](https://github.com/Stirling-Tools/Stirling-PDF/blob/main/Version-groups.md). For people who don't mind space optimization, just use the latest tag. ![Docker Image Size (tag)](https://img.shields.io/docker/image-size/stirlingtools/stirling-pdf/latest?label=Stirling-PDF%20Full) ![Docker Image Size (tag)](https://img.shields.io/docker/image-size/stirlingtools/stirling-pdf/latest-ultra-lite?label=Stirling-PDF%20Ultra-Lite) @@ -178,7 +177,7 @@ Please view the [HowToUseOCR.md](https://github.com/Stirling-Tools/Stirling-PDF/ ## Reuse Stored Files -Certain functionality like `Sign` supports pre-saved files stored at `/customFiles/signatures/`. Image files placed within here will be accessible to be used via the web UI. Currently, this supports two folder types: +Certain functionality like `Sign` supports pre-saved files stored at `/customFiles/signatures/`. Image files placed here will be accessible via the web UI. Currently, this supports two folder types: - `/customFiles/signatures/ALL_USERS`: Accessible to all users, useful for organizations where many users use the same files or for users not using authentication - `/customFiles/signatures/{username}`: Such as `/customFiles/signatures/froodle`, accessible only to the `froodle` username, private for all others @@ -234,11 +233,11 @@ Please see our [Contributing Guide](CONTRIBUTING.md). ## Stirling PDF Enterprise -Stirling PDF offers a Enterprise edition of its software, This is the same great software but with added features and comforts +Stirling PDF offers an Enterprise edition of its software. This is the same great software but with added features and comforts. -### Whats included +### What's included -- Prioritised Support tickets via support@stirlingpdf.com to reach directly to Stirling-PDF team for support and 1:1 meetings where applicable (Provided they come from same email domain registered with us) +- Prioritized Support tickets via support@stirlingpdf.com to reach directly to Stirling-PDF team for support and 1:1 meetings where applicable (Provided they come from the same email domain registered with us) - Prioritised Enhancements to Stirling-PDF where applicable - Base SSO support - Advanced SSO such as automated login handling (Coming very soon) @@ -247,7 +246,7 @@ Stirling PDF offers a Enterprise edition of its software, This is the same great - Advanced user configurations (Coming soon) - Plus other exciting features to come -Check out of [docs](https://docs.stirlingpdf.com/Enterprise%20Edition) on it or our official [website](https://www.stirlingpdf.com) +Check out our [docs](https://docs.stirlingpdf.com/Enterprise%20Edition) on it or our official [website](https://www.stirlingpdf.com) ## Customization @@ -365,8 +364,6 @@ AutomaticallyGenerated: There is an additional config file `/configs/custom_settings.yml` where users familiar with Java and Spring `application.properties` can input their own settings on top of Stirling-PDF's existing ones. - - ### Extra Notes - **Endpoints**: Currently, the `ENDPOINTS_TO_REMOVE` and `GROUPS_TO_REMOVE` endpoints can include comma-separated lists of endpoints and groups to disable. For example, `ENDPOINTS_TO_REMOVE=img-to-pdf,remove-pages` would disable both image-to-pdf and remove pages, while `GROUPS_TO_REMOVE=LibreOffice` would disable all things that use LibreOffice. You can see a list of all endpoints and groups [here](https://github.com/Stirling-Tools/Stirling-PDF/blob/main/Endpoint-groups.md). @@ -401,7 +398,7 @@ When you log in to Stirling-PDF, you will be redirected to the `/login` page to To access your account settings, go to Account Settings in the settings cog menu (top right in the navbar). This Account Settings menu is also where you find your API key. -To add new users, go to the bottom of Account Settings and hit 'Admin Settings'. Here you can add new users. The different roles mentioned within this are for rate limiting. This is a work in progress and will be expanded on more in the future. +To add new users, go to the bottom of Account Settings and hit 'Admin Settings'. Here, you can add new users. The different roles mentioned within this are for rate limiting. This is a work in progress and will be expanded on more in the future. For API usage, you must provide a header with `X-API-KEY` and the associated API key for that user. @@ -417,9 +414,9 @@ For API usage, you must provide a header with `X-API-KEY` and the associated API - Multi-page layout (stitch PDF pages together) support x rows y columns and custom page sizing - Fill forms manually or automatically -### Q2: Why is my application downloading .htm files? Why am i getting HTTP error 413? +### Q2: Why is my application downloading .htm files? Why am I getting HTTP error 413? -This is an issue commonly caused by your NGINX configuration. The default file upload size for NGINX is 1MB. You need to add the following in your Nginx sites-available file: `client_max_body_size SIZE;` (where "SIZE" is 50M for example for 50MB files). +This is an issue commonly caused by your NGINX configuration. The default file upload size for NGINX is 1MB. You need to add the following in your Nginx sites-available file: `client_max_body_size SIZE;` (where "SIZE" is 50M, for example, for 50MB files). ### Q3: Why is my download timing out? diff --git a/SECURITY.md b/SECURITY.md index e67cdce4..5f532aa7 100644 --- a/SECURITY.md +++ b/SECURITY.md @@ -8,7 +8,7 @@ The Stirling-PDF team takes security vulnerabilities seriously. We appreciate yo You can report security vulnerabilities through two channels: -1. **GitHub Security Advisory**: +1. **GitHub Security Advisory**: - Navigate to the [Security tab](https://github.com/Stirling-Tools/Stirling-PDF/security) in our repository - Click on "Report a vulnerability" - Provide a detailed description of the vulnerability diff --git a/Version-groups.md b/Version-groups.md index e7f5536c..c8f3aff8 100644 --- a/Version-groups.md +++ b/Version-groups.md @@ -1,14 +1,14 @@ -|All versions in a Docker environment can download Calibre as a optional extra at runtime to support `book-to-pdf` and `pdf-to-book` using parameter ``INSTALL_BOOK_AND_ADVANCED_HTML_OPS``. +All versions in a Docker environment can download Calibre as a optional extra at runtime to support `book-to-pdf` and `pdf-to-book` using parameter ``INSTALL_BOOK_AND_ADVANCED_HTML_OPS``. The 'Fat' container contains all those found in 'Full' with security jar along with this Calibre install. | Technology | Ultra-Lite | Full | | ---------- | :--------: | :---: | -| Java | ✔️ | ✔️ | -| JavaScript | ✔️ | ✔️ | +| Java | ✔️ | ✔️ | +| JavaScript | ✔️ | ✔️ | | Libre | | ✔️ | | Python | | ✔️ | | OpenCV | | ✔️ | -| qpdf | | ✔️ | +| qpdf | | ✔️ | | Operation | Ultra-Lite | Full | | ---------------------- | ---------- | ---- | @@ -54,15 +54,15 @@ The 'Fat' container contains all those found in 'Full' with security jar along w | ocr-pdf | | ✔️ | | pdf-to-pdfa | | ✔️ | | remove-blanks | | ✔️ | -pdf-to-text | ✔️ | ✔️ -pdf-to-html | | ✔️ -pdf-to-word | | ✔️ -pdf-to-presentation | | ✔️ -pdf-to-xml | | ✔️ -remove-annotations | ✔️ | ✔️ -remove-cert-sign | ✔️ | ✔️ -remove-image-pdf | ✔️ | ✔️ -file-to-pdf | | ✔️ -html-to-pdf | | ✔️ -url-to-pdf | | ✔️ -repair | | ✔️ +| pdf-to-text | ✔️ | ✔️ | +| pdf-to-html | | ✔️ | +| pdf-to-word | | ✔️ | +| pdf-to-presentation | | ✔️ | +| pdf-to-xml | | ✔️ | +| remove-annotations | ✔️ | ✔️ | +| remove-cert-sign | ✔️ | ✔️ | +| remove-image-pdf | ✔️ | ✔️ | +| file-to-pdf | | ✔️ | +| html-to-pdf | | ✔️ | +| url-to-pdf | | ✔️ | +| repair | | ✔️ | diff --git a/test.sh b/test.sh index 2ad25905..d789c6be 100644 --- a/test.sh +++ b/test.sh @@ -74,7 +74,7 @@ main() { # Building Docker images # docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest -f ./Dockerfile . - # docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-ultra-lite -f ./Dockerfile-ultra-lite . + # docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-ultra-lite -f ./Dockerfile.ultra-lite . # Test each configuration #run_tests "Stirling-PDF-Ultra-Lite" "./exampleYmlFiles/docker-compose-latest-ultra-lite.yml" @@ -94,8 +94,8 @@ main() { # Building Docker images with security enabled # docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest -f ./Dockerfile . - # docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-ultra-lite -f ./Dockerfile-ultra-lite . - docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-fat -f ./Dockerfile-fat . + # docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-ultra-lite -f ./Dockerfile.ultra-lite . + docker build --no-cache --pull --build-arg VERSION_TAG=alpha -t stirlingtools/stirling-pdf:latest-fat -f ./Dockerfile.fat . # Test each configuration with security diff --git a/test2.sh b/test2.sh index 61db7993..b33d2df8 100644 --- a/test2.sh +++ b/test2.sh @@ -65,7 +65,7 @@ build_and_test() { dockerfile_name="./Dockerfile" ;; ultra-lite) - dockerfile_name="./Dockerfile-ultra-lite" + dockerfile_name="./Dockerfile.ultra-lite" ;; esac