Compare commits
38 Commits
Author | SHA1 | Date | |
---|---|---|---|
|
a4c3415838 | ||
f535eacd97 | |||
9908897aa2 | |||
29d3cbb0b6 | |||
babc20649a | |||
1188643c4b | |||
6b74301588 | |||
168527573c | |||
3d7bb37849 | |||
12a581ced9 | |||
857e1717a5 | |||
186bfb9d12 | |||
c5bc354f65 | |||
c48bb0428f | |||
46fbb615a0 | |||
3df4e103f9 | |||
addff418c6 | |||
14d653e701 | |||
040bac5256 | |||
bf44901a0a | |||
b4d0f4e949 | |||
b2b47b1f6a | |||
1b1398653b | |||
1f61dcb115 | |||
1476fc9174 | |||
d157a3acd9 | |||
fe6be928a9 | |||
8e537be454 | |||
6947529e02 | |||
b6d78929b9 | |||
e997189a64 | |||
31940deb7a | |||
922c6da234 | |||
aa8fb165eb | |||
4cd4431565 | |||
826183be8c | |||
6d9b7ee0e4 | |||
3c66acb653 |
66
.gitea/workflows/default_nottags.yaml
Normal file
66
.gitea/workflows/default_nottags.yaml
Normal file
@@ -0,0 +1,66 @@
|
|||||||
|
name: Default (not tags)
|
||||||
|
|
||||||
|
on:
|
||||||
|
push:
|
||||||
|
tags-ignore:
|
||||||
|
- '**'
|
||||||
|
|
||||||
|
env:
|
||||||
|
IMAGE: registry.gitlab.com/hosttoday/ht-docker-node:npmci
|
||||||
|
NPMCI_COMPUTED_REPOURL: https://${{gitea.repository_owner}}:${{secrets.GITEA_TOKEN}}@gitea.lossless.digital/${{gitea.repository}}.git
|
||||||
|
NPMCI_TOKEN_NPM: ${{secrets.NPMCI_TOKEN_NPM}}
|
||||||
|
NPMCI_TOKEN_NPM2: ${{secrets.NPMCI_TOKEN_NPM2}}
|
||||||
|
NPMCI_GIT_GITHUBTOKEN: ${{secrets.NPMCI_GIT_GITHUBTOKEN}}
|
||||||
|
NPMCI_URL_CLOUDLY: ${{secrets.NPMCI_URL_CLOUDLY}}
|
||||||
|
|
||||||
|
jobs:
|
||||||
|
security:
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
continue-on-error: true
|
||||||
|
container:
|
||||||
|
image: ${{ env.IMAGE }}
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- uses: actions/checkout@v3
|
||||||
|
|
||||||
|
- name: Install pnpm and npmci
|
||||||
|
run: |
|
||||||
|
pnpm install -g pnpm
|
||||||
|
pnpm install -g @shipzone/npmci
|
||||||
|
|
||||||
|
- name: Run npm prepare
|
||||||
|
run: npmci npm prepare
|
||||||
|
|
||||||
|
- name: Audit production dependencies
|
||||||
|
run: |
|
||||||
|
npmci command npm config set registry https://registry.npmjs.org
|
||||||
|
npmci command pnpm audit --audit-level=high --prod
|
||||||
|
continue-on-error: true
|
||||||
|
|
||||||
|
- name: Audit development dependencies
|
||||||
|
run: |
|
||||||
|
npmci command npm config set registry https://registry.npmjs.org
|
||||||
|
npmci command pnpm audit --audit-level=high --dev
|
||||||
|
continue-on-error: true
|
||||||
|
|
||||||
|
test:
|
||||||
|
if: ${{ always() }}
|
||||||
|
needs: security
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
container:
|
||||||
|
image: ${{ env.IMAGE }}
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- uses: actions/checkout@v3
|
||||||
|
|
||||||
|
- name: Test stable
|
||||||
|
run: |
|
||||||
|
npmci node install stable
|
||||||
|
npmci npm install
|
||||||
|
npmci npm test
|
||||||
|
|
||||||
|
- name: Test build
|
||||||
|
run: |
|
||||||
|
npmci node install stable
|
||||||
|
npmci npm install
|
||||||
|
npmci npm build
|
124
.gitea/workflows/default_tags.yaml
Normal file
124
.gitea/workflows/default_tags.yaml
Normal file
@@ -0,0 +1,124 @@
|
|||||||
|
name: Default (tags)
|
||||||
|
|
||||||
|
on:
|
||||||
|
push:
|
||||||
|
tags:
|
||||||
|
- '*'
|
||||||
|
|
||||||
|
env:
|
||||||
|
IMAGE: registry.gitlab.com/hosttoday/ht-docker-node:npmci
|
||||||
|
NPMCI_COMPUTED_REPOURL: https://${{gitea.repository_owner}}:${{secrets.GITEA_TOKEN}}@gitea.lossless.digital/${{gitea.repository}}.git
|
||||||
|
NPMCI_TOKEN_NPM: ${{secrets.NPMCI_TOKEN_NPM}}
|
||||||
|
NPMCI_TOKEN_NPM2: ${{secrets.NPMCI_TOKEN_NPM2}}
|
||||||
|
NPMCI_GIT_GITHUBTOKEN: ${{secrets.NPMCI_GIT_GITHUBTOKEN}}
|
||||||
|
NPMCI_URL_CLOUDLY: ${{secrets.NPMCI_URL_CLOUDLY}}
|
||||||
|
|
||||||
|
jobs:
|
||||||
|
security:
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
continue-on-error: true
|
||||||
|
container:
|
||||||
|
image: ${{ env.IMAGE }}
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- uses: actions/checkout@v3
|
||||||
|
|
||||||
|
- name: Prepare
|
||||||
|
run: |
|
||||||
|
pnpm install -g pnpm
|
||||||
|
pnpm install -g @shipzone/npmci
|
||||||
|
npmci npm prepare
|
||||||
|
|
||||||
|
- name: Audit production dependencies
|
||||||
|
run: |
|
||||||
|
npmci command npm config set registry https://registry.npmjs.org
|
||||||
|
npmci command pnpm audit --audit-level=high --prod
|
||||||
|
continue-on-error: true
|
||||||
|
|
||||||
|
- name: Audit development dependencies
|
||||||
|
run: |
|
||||||
|
npmci command npm config set registry https://registry.npmjs.org
|
||||||
|
npmci command pnpm audit --audit-level=high --dev
|
||||||
|
continue-on-error: true
|
||||||
|
|
||||||
|
test:
|
||||||
|
if: ${{ always() }}
|
||||||
|
needs: security
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
container:
|
||||||
|
image: ${{ env.IMAGE }}
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- uses: actions/checkout@v3
|
||||||
|
|
||||||
|
- name: Prepare
|
||||||
|
run: |
|
||||||
|
pnpm install -g pnpm
|
||||||
|
pnpm install -g @shipzone/npmci
|
||||||
|
npmci npm prepare
|
||||||
|
|
||||||
|
- name: Test stable
|
||||||
|
run: |
|
||||||
|
npmci node install stable
|
||||||
|
npmci npm install
|
||||||
|
npmci npm test
|
||||||
|
|
||||||
|
- name: Test build
|
||||||
|
run: |
|
||||||
|
npmci node install stable
|
||||||
|
npmci npm install
|
||||||
|
npmci npm build
|
||||||
|
|
||||||
|
release:
|
||||||
|
needs: test
|
||||||
|
if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/')
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
container:
|
||||||
|
image: ${{ env.IMAGE }}
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- uses: actions/checkout@v3
|
||||||
|
|
||||||
|
- name: Prepare
|
||||||
|
run: |
|
||||||
|
pnpm install -g pnpm
|
||||||
|
pnpm install -g @shipzone/npmci
|
||||||
|
npmci npm prepare
|
||||||
|
|
||||||
|
- name: Release
|
||||||
|
run: |
|
||||||
|
npmci node install stable
|
||||||
|
npmci npm publish
|
||||||
|
|
||||||
|
metadata:
|
||||||
|
needs: test
|
||||||
|
if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/')
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
container:
|
||||||
|
image: ${{ env.IMAGE }}
|
||||||
|
continue-on-error: true
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- uses: actions/checkout@v3
|
||||||
|
|
||||||
|
- name: Prepare
|
||||||
|
run: |
|
||||||
|
pnpm install -g pnpm
|
||||||
|
pnpm install -g @shipzone/npmci
|
||||||
|
npmci npm prepare
|
||||||
|
|
||||||
|
- name: Code quality
|
||||||
|
run: |
|
||||||
|
npmci command npm install -g typescript
|
||||||
|
npmci npm install
|
||||||
|
|
||||||
|
- name: Trigger
|
||||||
|
run: npmci trigger
|
||||||
|
|
||||||
|
- name: Build docs and upload artifacts
|
||||||
|
run: |
|
||||||
|
npmci node install stable
|
||||||
|
npmci npm install
|
||||||
|
pnpm install -g @git.zone/tsdoc
|
||||||
|
npmci command tsdoc
|
||||||
|
continue-on-error: true
|
128
.gitlab-ci.yml
128
.gitlab-ci.yml
@@ -1,128 +0,0 @@
|
|||||||
# gitzone ci_default
|
|
||||||
image: registry.gitlab.com/hosttoday/ht-docker-node:npmci
|
|
||||||
|
|
||||||
cache:
|
|
||||||
paths:
|
|
||||||
- .npmci_cache/
|
|
||||||
key: '$CI_BUILD_STAGE'
|
|
||||||
|
|
||||||
stages:
|
|
||||||
- security
|
|
||||||
- test
|
|
||||||
- release
|
|
||||||
- metadata
|
|
||||||
|
|
||||||
before_script:
|
|
||||||
- pnpm install -g pnpm
|
|
||||||
- pnpm install -g @shipzone/npmci
|
|
||||||
- npmci npm prepare
|
|
||||||
|
|
||||||
# ====================
|
|
||||||
# security stage
|
|
||||||
# ====================
|
|
||||||
# ====================
|
|
||||||
# security stage
|
|
||||||
# ====================
|
|
||||||
auditProductionDependencies:
|
|
||||||
image: registry.gitlab.com/hosttoday/ht-docker-node:npmci
|
|
||||||
stage: security
|
|
||||||
script:
|
|
||||||
- npmci command npm config set registry https://registry.npmjs.org
|
|
||||||
- npmci command pnpm audit --audit-level=high --prod
|
|
||||||
tags:
|
|
||||||
- lossless
|
|
||||||
- docker
|
|
||||||
allow_failure: true
|
|
||||||
|
|
||||||
auditDevDependencies:
|
|
||||||
image: registry.gitlab.com/hosttoday/ht-docker-node:npmci
|
|
||||||
stage: security
|
|
||||||
script:
|
|
||||||
- npmci command npm config set registry https://registry.npmjs.org
|
|
||||||
- npmci command pnpm audit --audit-level=high --dev
|
|
||||||
tags:
|
|
||||||
- lossless
|
|
||||||
- docker
|
|
||||||
allow_failure: true
|
|
||||||
|
|
||||||
# ====================
|
|
||||||
# test stage
|
|
||||||
# ====================
|
|
||||||
|
|
||||||
testStable:
|
|
||||||
stage: test
|
|
||||||
script:
|
|
||||||
- npmci node install stable
|
|
||||||
- npmci npm install
|
|
||||||
- npmci npm test
|
|
||||||
coverage: /\d+.?\d+?\%\s*coverage/
|
|
||||||
tags:
|
|
||||||
- docker
|
|
||||||
|
|
||||||
testBuild:
|
|
||||||
stage: test
|
|
||||||
script:
|
|
||||||
- npmci node install stable
|
|
||||||
- npmci npm install
|
|
||||||
- npmci command npm run build
|
|
||||||
coverage: /\d+.?\d+?\%\s*coverage/
|
|
||||||
tags:
|
|
||||||
- docker
|
|
||||||
|
|
||||||
release:
|
|
||||||
stage: release
|
|
||||||
script:
|
|
||||||
- npmci node install stable
|
|
||||||
- npmci npm publish
|
|
||||||
only:
|
|
||||||
- tags
|
|
||||||
tags:
|
|
||||||
- lossless
|
|
||||||
- docker
|
|
||||||
- notpriv
|
|
||||||
|
|
||||||
# ====================
|
|
||||||
# metadata stage
|
|
||||||
# ====================
|
|
||||||
codequality:
|
|
||||||
stage: metadata
|
|
||||||
allow_failure: true
|
|
||||||
only:
|
|
||||||
- tags
|
|
||||||
script:
|
|
||||||
- npmci command npm install -g typescript
|
|
||||||
- npmci npm prepare
|
|
||||||
- npmci npm install
|
|
||||||
tags:
|
|
||||||
- lossless
|
|
||||||
- docker
|
|
||||||
- priv
|
|
||||||
|
|
||||||
trigger:
|
|
||||||
stage: metadata
|
|
||||||
script:
|
|
||||||
- npmci trigger
|
|
||||||
only:
|
|
||||||
- tags
|
|
||||||
tags:
|
|
||||||
- lossless
|
|
||||||
- docker
|
|
||||||
- notpriv
|
|
||||||
|
|
||||||
pages:
|
|
||||||
stage: metadata
|
|
||||||
script:
|
|
||||||
- npmci node install stable
|
|
||||||
- npmci npm install
|
|
||||||
- npmci command npm run buildDocs
|
|
||||||
tags:
|
|
||||||
- lossless
|
|
||||||
- docker
|
|
||||||
- notpriv
|
|
||||||
only:
|
|
||||||
- tags
|
|
||||||
artifacts:
|
|
||||||
expire_in: 1 week
|
|
||||||
paths:
|
|
||||||
- public
|
|
||||||
allow_failure: true
|
|
142
changelog.md
Normal file
142
changelog.md
Normal file
@@ -0,0 +1,142 @@
|
|||||||
|
# Changelog
|
||||||
|
|
||||||
|
## 2025-08-01 - 3.3.0 - feat(smartpdf)
|
||||||
|
Add automatic port allocation and multi-instance support
|
||||||
|
|
||||||
|
- Added ISmartPdfOptions interface with port configuration options
|
||||||
|
- Implemented automatic port allocation between 20000-30000 by default
|
||||||
|
- Added support for custom port ranges via portRangeStart/portRangeEnd options
|
||||||
|
- Added support for specific port assignment via port option
|
||||||
|
- Fixed resource cleanup when port allocation fails
|
||||||
|
- Multiple SmartPdf instances can now run simultaneously without port conflicts
|
||||||
|
- Updated readme with comprehensive documentation for all features
|
||||||
|
|
||||||
|
## 2025-02-25 - 3.2.2 - fix(SmartPdf)
|
||||||
|
Fix buffer handling for PDF conversion and text extraction
|
||||||
|
|
||||||
|
- Ensure Uint8Array is converted to Node Buffer for PDF conversion.
|
||||||
|
- Correct the PDF page viewport handling by using document dimensions.
|
||||||
|
- Fix extractTextFromPdfBuffer argument type from Uint8Array to Buffer.
|
||||||
|
|
||||||
|
## 2025-02-25 - 3.2.1 - fix(SmartPdf)
|
||||||
|
Fix type for extractTextFromPdfBuffer function
|
||||||
|
|
||||||
|
- Corrected the parameter type from Buffer to Uint8Array for extractTextFromPdfBuffer function.
|
||||||
|
|
||||||
|
## 2025-02-25 - 3.2.0 - feat(smartpdf)
|
||||||
|
Improve dependency versions and optimize PDF to PNG conversion.
|
||||||
|
|
||||||
|
- Update several dependencies to newer versions for better stability and performance.
|
||||||
|
- Refactor tests to enhance readability and add directory creation validations.
|
||||||
|
- Optimize PDF to PNG conversion by switching to a more efficient Puppeteer and PDF.js-based method.
|
||||||
|
- Add checks for presence of required dependencies (GraphicsMagick and Ghostscript).
|
||||||
|
- Fix media emulation issue by properly awaiting the emulateMediaType function.
|
||||||
|
|
||||||
|
## 2024-11-30 - 3.1.8 - fix(core)
|
||||||
|
Fix candidate handling in PDF generation
|
||||||
|
|
||||||
|
- Added error handling for missing PDF candidates in server requests.
|
||||||
|
- Updated devDependencies and dependencies to latest versions for better stability and new features.
|
||||||
|
- Patched header retrieval logic during PDF generation for security check.
|
||||||
|
|
||||||
|
## 2024-09-27 - 3.1.7 - fix(dependencies)
|
||||||
|
Update dependencies to latest versions
|
||||||
|
|
||||||
|
- Updated @git.zone/tsbuild to version ^2.1.84
|
||||||
|
- Updated @git.zone/tsdoc to version ^1.3.12
|
||||||
|
- Updated @git.zone/tsrun to version ^1.2.49
|
||||||
|
- Updated @push.rocks/tapbundle to version ^5.3.0
|
||||||
|
- Updated @types/node to version ^22.7.4
|
||||||
|
- Updated @push.rocks/smartfile to version ^11.0.21
|
||||||
|
- Updated @push.rocks/smartpromise to version ^4.0.4
|
||||||
|
- Updated @tsclass/tsclass to version ^4.1.2
|
||||||
|
- Updated express to version ^4.21.0
|
||||||
|
- Updated pdf2pic to version ^3.1.3
|
||||||
|
|
||||||
|
## 2024-05-29 - 3.1.6 - Core
|
||||||
|
Updated description
|
||||||
|
|
||||||
|
- Minor changes to documentation and internal text.
|
||||||
|
|
||||||
|
## 2024-04-25 to 2024-04-30 - 3.1.0 to 3.1.5 - Core
|
||||||
|
Fixes and updates to core functionality
|
||||||
|
|
||||||
|
- Fixes and updates to core functionality in versions 3.1.0 to 3.1.5.
|
||||||
|
|
||||||
|
## 2024-04-25 - 3.0.17 - Feature
|
||||||
|
Now supports PDF to JPG conversion
|
||||||
|
|
||||||
|
- Added support for converting PDF files to JPG format.
|
||||||
|
|
||||||
|
## 2024-03-19 to 2024-04-14 - 3.0.17 - Maintenance
|
||||||
|
Various updates to project configuration files
|
||||||
|
|
||||||
|
- Updated `tsconfig`.
|
||||||
|
- Updated `npmextra.json`.
|
||||||
|
|
||||||
|
## 2023-07-11 to 2024-03-19 - 3.0.15 to 3.0.16 - Organization
|
||||||
|
Switch to new organization scheme and core updates
|
||||||
|
|
||||||
|
- Switched to new organization scheme.
|
||||||
|
- Applied core updates and bug fixes.
|
||||||
|
|
||||||
|
## 2022-11-07 to 2023-07-10 - 3.0.13 to 3.0.14 - Core
|
||||||
|
Fixes and updates to core functionality
|
||||||
|
|
||||||
|
- Various minor bug fixes and updates to core components.
|
||||||
|
|
||||||
|
## 2022-09-13 to 2022-11-07 - 3.0.10 to 3.0.12 - Core
|
||||||
|
Ongoing core updates and maintenance
|
||||||
|
|
||||||
|
- Regular fixes and operational improvements in core functionalities.
|
||||||
|
|
||||||
|
## 2022-06-12 to 2022-09-13 - 3.0.7 to 3.0.9 - Core
|
||||||
|
Continued focus on high-priority bug fixes and core functionalities
|
||||||
|
|
||||||
|
- Regular fixes for critical bugs and enhancements.
|
||||||
|
|
||||||
|
## 2022-03-24 to 2022-06-29 - 3.0.3 to 3.0.6 - Core
|
||||||
|
Further optimization and maintenance releases
|
||||||
|
|
||||||
|
- Further improvements and refinements of issues in core functionalities.
|
||||||
|
|
||||||
|
## 2022-01-05 to 2022-03-25 - 3.0.0 to 3.0.2 - Major Version Release
|
||||||
|
Major release for version 3.0.x, including core fixes
|
||||||
|
|
||||||
|
- Increased version from 2.x to 3.0. New significant changes and fixes.
|
||||||
|
|
||||||
|
## 2022-01-05 to 2022-03-24 - 2.0.13 to 2.0.19 - Core
|
||||||
|
Routine core updates and bug fixes
|
||||||
|
|
||||||
|
- Regular bug fixes in core components.
|
||||||
|
|
||||||
|
## 2019-11-19 to 2022-01-06 - 2.0.0 to 2.0.11 - Core
|
||||||
|
Multiple core updates and a few performance improvements
|
||||||
|
|
||||||
|
- Some performance enhancements and multiple bug fixes.
|
||||||
|
|
||||||
|
## 2019-11-16 to 2019-11-19 - 1.0.27 to 1.0.29 - API
|
||||||
|
Breaking change in API
|
||||||
|
|
||||||
|
- Naming PDF results to better represent their content.
|
||||||
|
|
||||||
|
## 2019-05-29 to 2019-11-15 - 1.0.13 to 1.0.26 - Core
|
||||||
|
Core functional updates and some major restructuring
|
||||||
|
|
||||||
|
- Introduced multiple updates to the core, addressing bugs and improving stability.
|
||||||
|
|
||||||
|
## 2019-04-10 to 2019-05-28 - 1.0.4 to 1.0.12 - Core
|
||||||
|
Fixes and updates in the core
|
||||||
|
|
||||||
|
- Implementation of multiple essential fixes for core components.
|
||||||
|
|
||||||
|
## 2018-10-06 - 1.0.1 to 1.0.3 - Core and Typings
|
||||||
|
Initial implementation and core fixes
|
||||||
|
|
||||||
|
- Initial implementation of the project.
|
||||||
|
- Fixed compilation problems in typings.
|
||||||
|
|
||||||
|
## 2016-01-29 - unknown - Initial
|
||||||
|
Initial commit
|
||||||
|
|
||||||
|
- Initial commit for the project setup.
|
@@ -6,12 +6,29 @@
|
|||||||
"gitzone": {
|
"gitzone": {
|
||||||
"projectType": "npm",
|
"projectType": "npm",
|
||||||
"module": {
|
"module": {
|
||||||
"githost": "gitlab.com",
|
"githost": "code.foss.global",
|
||||||
"gitscope": "pushrocks",
|
"gitscope": "push.rocks",
|
||||||
"gitrepo": "smartpdf",
|
"gitrepo": "smartpdf",
|
||||||
"description": "Create PDFs fast and smoothly",
|
"description": "A library for creating PDFs dynamically from HTML or websites with additional features like merging PDFs.",
|
||||||
"npmPackagename": "@pushrocks/smartpdf",
|
"npmPackagename": "@push.rocks/smartpdf",
|
||||||
"license": "MIT"
|
"license": "MIT",
|
||||||
|
"keywords": [
|
||||||
|
"PDF generation",
|
||||||
|
"HTML to PDF",
|
||||||
|
"website to PDF",
|
||||||
|
"PDF manipulation",
|
||||||
|
"puppeteer",
|
||||||
|
"express",
|
||||||
|
"node.js",
|
||||||
|
"typescript",
|
||||||
|
"automation",
|
||||||
|
"PDF merging",
|
||||||
|
"text extraction",
|
||||||
|
"PDF management"
|
||||||
|
]
|
||||||
}
|
}
|
||||||
|
},
|
||||||
|
"tsdoc": {
|
||||||
|
"legal": "\n## License and Legal Information\n\nThis repository contains open-source code that is licensed under the MIT License. A copy of the MIT License can be found in the [license](license) file within this repository. \n\n**Please note:** The MIT License does not grant permission to use the trade names, trademarks, service marks, or product names of the project, except as required for reasonable and customary use in describing the origin of the work and reproducing the content of the NOTICE file.\n\n### Trademarks\n\nThis project is owned and maintained by Task Venture Capital GmbH. The names and logos associated with Task Venture Capital GmbH and any related products or services are trademarks of Task Venture Capital GmbH and are not included within the scope of the MIT license granted herein. Use of these trademarks must comply with Task Venture Capital GmbH's Trademark Guidelines, and any usage must be approved in writing by Task Venture Capital GmbH.\n\n### Company Information\n\nTask Venture Capital GmbH \nRegistered at District court Bremen HRB 35230 HB, Germany\n\nFor any legal inquiries or if you require further information, please contact us via email at hello@task.vc.\n\nBy using this repository, you acknowledge that you have read this section, agree to comply with its terms, and understand that the licensing of the code does not imply endorsement by Task Venture Capital GmbH of any derivative works.\n"
|
||||||
}
|
}
|
||||||
}
|
}
|
68
package.json
68
package.json
@@ -1,39 +1,39 @@
|
|||||||
{
|
{
|
||||||
"name": "@pushrocks/smartpdf",
|
"name": "@push.rocks/smartpdf",
|
||||||
"version": "3.0.14",
|
"version": "3.3.0",
|
||||||
"private": false,
|
"private": false,
|
||||||
"description": "create pdfs on the fly",
|
"description": "A library for creating PDFs dynamically from HTML or websites with additional features like merging PDFs.",
|
||||||
"main": "dist_ts/index.js",
|
"main": "dist_ts/index.js",
|
||||||
"typings": "dist_ts/index.d.ts",
|
"typings": "dist_ts/index.d.ts",
|
||||||
"type": "module",
|
"type": "module",
|
||||||
"author": "Lossless GmbH",
|
"author": "Lossless GmbH",
|
||||||
"license": "MIT",
|
"license": "MIT",
|
||||||
"scripts": {
|
"scripts": {
|
||||||
"test": "(tstest test/ --web)",
|
"test": "(tstest test/ --verbose --timeout 60)",
|
||||||
"build": "(tsbuild --web --allowimplicitany)",
|
"build": "(tsbuild tsfolders --allowimplicitany)",
|
||||||
"buildDocs": "tsdoc"
|
"buildDocs": "tsdoc"
|
||||||
},
|
},
|
||||||
"devDependencies": {
|
"devDependencies": {
|
||||||
"@gitzone/tsbuild": "^2.1.65",
|
"@git.zone/tsbuild": "^2.6.4",
|
||||||
"@gitzone/tsdoc": "^1.1.12",
|
"@git.zone/tsdoc": "^1.5.0",
|
||||||
"@gitzone/tsrun": "^1.2.35",
|
"@git.zone/tsrun": "^1.3.3",
|
||||||
"@gitzone/tstest": "^1.0.73",
|
"@git.zone/tstest": "^2.3.2",
|
||||||
"@pushrocks/tapbundle": "^5.0.4",
|
"@types/node": "^24.1.0"
|
||||||
"@types/node": "^18.7.18"
|
|
||||||
},
|
},
|
||||||
"dependencies": {
|
"dependencies": {
|
||||||
"@pushrocks/smartdelay": "^2.0.13",
|
"@push.rocks/smartbuffer": "^3.0.5",
|
||||||
"@pushrocks/smartfile": "^10.0.5",
|
"@push.rocks/smartdelay": "^3.0.5",
|
||||||
"@pushrocks/smartnetwork": "^3.0.0",
|
"@push.rocks/smartfile": "^11.2.5",
|
||||||
"@pushrocks/smartpath": "^5.0.5",
|
"@push.rocks/smartnetwork": "^4.1.2",
|
||||||
"@pushrocks/smartpromise": "^3.1.7",
|
"@push.rocks/smartpath": "^6.0.0",
|
||||||
"@pushrocks/smartpuppeteer": "^2.0.2",
|
"@push.rocks/smartpromise": "^4.2.3",
|
||||||
"@pushrocks/smartunique": "^3.0.3",
|
"@push.rocks/smartpuppeteer": "^2.0.5",
|
||||||
"@tsclass/tsclass": "^4.0.21",
|
"@push.rocks/smartunique": "^3.0.9",
|
||||||
"@types/express": "^4.17.14",
|
"@tsclass/tsclass": "^9.2.0",
|
||||||
"express": "^4.18.1",
|
"@types/express": "^5.0.3",
|
||||||
"pdf-merger-js": "^3.4.0",
|
"express": "^5.1.0",
|
||||||
"pdf2json": "^2.0.0"
|
"pdf-lib": "^1.17.1",
|
||||||
|
"pdf2json": "3.2.0"
|
||||||
},
|
},
|
||||||
"files": [
|
"files": [
|
||||||
"ts/**/*",
|
"ts/**/*",
|
||||||
@@ -49,5 +49,25 @@
|
|||||||
],
|
],
|
||||||
"browserslist": [
|
"browserslist": [
|
||||||
"last 1 chrome versions"
|
"last 1 chrome versions"
|
||||||
]
|
],
|
||||||
|
"keywords": [
|
||||||
|
"PDF generation",
|
||||||
|
"HTML to PDF",
|
||||||
|
"website to PDF",
|
||||||
|
"PDF manipulation",
|
||||||
|
"puppeteer",
|
||||||
|
"express",
|
||||||
|
"node.js",
|
||||||
|
"typescript",
|
||||||
|
"automation",
|
||||||
|
"PDF merging",
|
||||||
|
"text extraction",
|
||||||
|
"PDF management"
|
||||||
|
],
|
||||||
|
"homepage": "https://code.foss.global/push.rocks/smartpdf",
|
||||||
|
"repository": {
|
||||||
|
"type": "git",
|
||||||
|
"url": "https://code.foss.global/push.rocks/smartpdf.git"
|
||||||
|
},
|
||||||
|
"packageManager": "pnpm@10.11.0+sha512.6540583f41cc5f628eb3d9773ecee802f4f9ef9923cc45b69890fb47991d4b092964694ec3a4f738a420c918a333062c8b925d312f42e4f0c263eb603551f977"
|
||||||
}
|
}
|
||||||
|
12466
pnpm-lock.yaml
generated
12466
pnpm-lock.yaml
generated
File diff suppressed because it is too large
Load Diff
1
readme.hints.md
Normal file
1
readme.hints.md
Normal file
@@ -0,0 +1 @@
|
|||||||
|
|
350
readme.md
350
readme.md
@@ -1,41 +1,333 @@
|
|||||||
# @pushrocks/smartpdf
|
# @push.rocks/smartpdf
|
||||||
Create PDFs fast and smoothly
|
Create PDFs on the fly from HTML, websites, or existing PDFs with advanced features like text extraction, PDF merging, and PNG conversion.
|
||||||
|
|
||||||
## Availability and Links
|
## Install
|
||||||
* [npmjs.org (npm package)](https://www.npmjs.com/package/@pushrocks/smartpdf)
|
To install `@push.rocks/smartpdf`, use npm or yarn:
|
||||||
* [gitlab.com (source)](https://gitlab.com/pushrocks/smartpdf)
|
|
||||||
* [github.com (source mirror)](https://github.com/pushrocks/smartpdf)
|
|
||||||
* [docs (typedoc)](https://pushrocks.gitlab.io/smartpdf/)
|
|
||||||
|
|
||||||
## Status for master
|
```bash
|
||||||
|
npm install @push.rocks/smartpdf --save
|
||||||
|
```
|
||||||
|
|
||||||
Status Category | Status Badge
|
Or with yarn:
|
||||||
-- | --
|
|
||||||
GitLab Pipelines | [](https://lossless.cloud)
|
```bash
|
||||||
GitLab Pipeline Test Coverage | [](https://lossless.cloud)
|
yarn add @push.rocks/smartpdf
|
||||||
npm | [](https://lossless.cloud)
|
```
|
||||||
Snyk | [](https://lossless.cloud)
|
|
||||||
TypeScript Support | [](https://lossless.cloud)
|
## Requirements
|
||||||
node Support | [](https://nodejs.org/dist/latest-v10.x/docs/api/)
|
This package requires a Chrome or Chromium installation to be available on the system, as it uses Puppeteer for rendering. The package will automatically detect and use the appropriate executable.
|
||||||
Code Style | [](https://lossless.cloud)
|
|
||||||
PackagePhobia (total standalone install weight) | [](https://lossless.cloud)
|
|
||||||
PackagePhobia (package size on registry) | [](https://lossless.cloud)
|
|
||||||
BundlePhobia (total size when bundled) | [](https://lossless.cloud)
|
|
||||||
Platform support | [](https://lossless.cloud) [](https://lossless.cloud)
|
|
||||||
|
|
||||||
## Usage
|
## Usage
|
||||||
|
`@push.rocks/smartpdf` provides a powerful interface for PDF generation and manipulation. All examples use ESM syntax and TypeScript.
|
||||||
|
|
||||||
## Contribution
|
### Getting Started
|
||||||
|
First, import the necessary classes:
|
||||||
|
|
||||||
We are always happy for code contributions. If you are not the code contributing type that is ok. Still, maintaining Open Source repositories takes considerable time and thought. If you like the quality of what we do and our modules are useful to you we would appreciate a little monthly contribution: You can [contribute one time](https://lossless.link/contribute-onetime) or [contribute monthly](https://lossless.link/contribute). :)
|
```typescript
|
||||||
|
import { SmartPdf, IPdf } from '@push.rocks/smartpdf';
|
||||||
|
```
|
||||||
|
|
||||||
## Contribution
|
### Basic Setup with Automatic Port Allocation
|
||||||
|
SmartPdf automatically finds an available port between 20000-30000 for its internal server:
|
||||||
|
|
||||||
We are always happy for code contributions. If you are not the code contributing type that is ok. Still, maintaining Open Source repositories takes considerable time and thought. If you like the quality of what we do and our modules are useful to you we would appreciate a little monthly contribution: You can [contribute one time](https://lossless.link/contribute-onetime) or [contribute monthly](https://lossless.link/contribute). :)
|
```typescript
|
||||||
|
async function setupSmartPdf() {
|
||||||
|
const smartPdf = await SmartPdf.create();
|
||||||
|
await smartPdf.start();
|
||||||
|
|
||||||
|
// Your PDF operations here
|
||||||
|
|
||||||
|
await smartPdf.stop();
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
For further information read the linked docs at the top of this readme.
|
### Advanced Setup with Custom Port Configuration
|
||||||
|
You can specify custom port settings to avoid conflicts or meet specific requirements:
|
||||||
|
|
||||||
> MIT licensed | **©** [Lossless GmbH](https://lossless.gmbh)
|
```typescript
|
||||||
| By using this npm module you agree to our [privacy policy](https://lossless.gmbH/privacy)
|
// Use a specific port
|
||||||
|
const smartPdf = await SmartPdf.create({ port: 3000 });
|
||||||
|
|
||||||
[](https://maintainedby.lossless.com)
|
// Use a custom port range
|
||||||
|
const smartPdf = await SmartPdf.create({
|
||||||
|
portRangeStart: 4000,
|
||||||
|
portRangeEnd: 5000
|
||||||
|
});
|
||||||
|
|
||||||
|
// The server will find an available port in your specified range
|
||||||
|
await smartPdf.start();
|
||||||
|
console.log(`Server running on port: ${smartPdf.serverPort}`);
|
||||||
|
```
|
||||||
|
|
||||||
|
### Creating PDFs from HTML Strings
|
||||||
|
Generate PDFs from HTML content with full CSS support:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
async function createPdfFromHtml() {
|
||||||
|
const smartPdf = await SmartPdf.create();
|
||||||
|
await smartPdf.start();
|
||||||
|
|
||||||
|
const htmlString = `
|
||||||
|
<!DOCTYPE html>
|
||||||
|
<html>
|
||||||
|
<head>
|
||||||
|
<style>
|
||||||
|
body { font-family: Arial, sans-serif; margin: 40px; }
|
||||||
|
h1 { color: #333; }
|
||||||
|
.highlight { background-color: yellow; }
|
||||||
|
</style>
|
||||||
|
</head>
|
||||||
|
<body>
|
||||||
|
<h1>Professional PDF Document</h1>
|
||||||
|
<p>This PDF was generated from <span class="highlight">HTML content</span>.</p>
|
||||||
|
</body>
|
||||||
|
</html>
|
||||||
|
`;
|
||||||
|
|
||||||
|
const pdf: IPdf = await smartPdf.getA4PdfResultForHtmlString(htmlString);
|
||||||
|
|
||||||
|
// pdf.buffer contains the PDF data
|
||||||
|
// pdf.id contains a unique identifier
|
||||||
|
// pdf.name contains the filename
|
||||||
|
// pdf.metadata contains additional information like extracted text
|
||||||
|
|
||||||
|
await smartPdf.stop();
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Generating PDFs from Websites
|
||||||
|
Capture web pages as PDFs with two different approaches:
|
||||||
|
|
||||||
|
#### A4 Format PDF from Website
|
||||||
|
Captures the viewable area formatted for A4 paper:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
async function createA4PdfFromWebsite() {
|
||||||
|
const smartPdf = await SmartPdf.create();
|
||||||
|
await smartPdf.start();
|
||||||
|
|
||||||
|
const pdf: IPdf = await smartPdf.getPdfResultForWebsite('https://example.com');
|
||||||
|
|
||||||
|
// Save to file
|
||||||
|
await fs.writeFile('website-a4.pdf', pdf.buffer);
|
||||||
|
|
||||||
|
await smartPdf.stop();
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Full Webpage as Single PDF
|
||||||
|
Captures the entire webpage in a single PDF, regardless of length:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
async function createFullPdfFromWebsite() {
|
||||||
|
const smartPdf = await SmartPdf.create();
|
||||||
|
await smartPdf.start();
|
||||||
|
|
||||||
|
const pdf: IPdf = await smartPdf.getFullWebsiteAsSinglePdf('https://example.com');
|
||||||
|
|
||||||
|
// This captures the entire scrollable area
|
||||||
|
await fs.writeFile('website-full.pdf', pdf.buffer);
|
||||||
|
|
||||||
|
await smartPdf.stop();
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Merging Multiple PDFs
|
||||||
|
Combine multiple PDF files into a single document:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
async function mergePdfs() {
|
||||||
|
const smartPdf = await SmartPdf.create();
|
||||||
|
await smartPdf.start();
|
||||||
|
|
||||||
|
// Create or load your PDFs
|
||||||
|
const pdf1 = await smartPdf.getA4PdfResultForHtmlString('<h1>Document 1</h1>');
|
||||||
|
const pdf2 = await smartPdf.getA4PdfResultForHtmlString('<h1>Document 2</h1>');
|
||||||
|
const pdf3 = await smartPdf.readFileToPdfObject('./existing-document.pdf');
|
||||||
|
|
||||||
|
// Merge PDFs - order matters!
|
||||||
|
const mergedPdf: Uint8Array = await smartPdf.mergePdfs([
|
||||||
|
pdf1.buffer,
|
||||||
|
pdf2.buffer,
|
||||||
|
pdf3.buffer
|
||||||
|
]);
|
||||||
|
|
||||||
|
// Save the merged PDF
|
||||||
|
await fs.writeFile('merged-document.pdf', mergedPdf);
|
||||||
|
|
||||||
|
await smartPdf.stop();
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Reading PDFs and Extracting Text
|
||||||
|
Extract text content from existing PDFs:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
async function extractTextFromPdf() {
|
||||||
|
const smartPdf = await SmartPdf.create();
|
||||||
|
|
||||||
|
// Read PDF from disk
|
||||||
|
const pdf: IPdf = await smartPdf.readFileToPdfObject('/path/to/document.pdf');
|
||||||
|
|
||||||
|
// Extract all text
|
||||||
|
const extractedText = await smartPdf.extractTextFromPdfBuffer(pdf.buffer);
|
||||||
|
console.log('Extracted text:', extractedText);
|
||||||
|
|
||||||
|
// The pdf object also contains metadata with text extraction
|
||||||
|
console.log('Metadata:', pdf.metadata);
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Converting PDF to PNG Images
|
||||||
|
Convert each page of a PDF into PNG images:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
async function convertPdfToPng() {
|
||||||
|
const smartPdf = await SmartPdf.create();
|
||||||
|
await smartPdf.start();
|
||||||
|
|
||||||
|
// Load a PDF
|
||||||
|
const pdf = await smartPdf.readFileToPdfObject('./document.pdf');
|
||||||
|
|
||||||
|
// Convert to PNG images (one per page)
|
||||||
|
const pngImages: Uint8Array[] = await smartPdf.convertPDFToPngBytes(pdf.buffer);
|
||||||
|
|
||||||
|
// Save each page as a PNG
|
||||||
|
pngImages.forEach((pngBuffer, index) => {
|
||||||
|
fs.writeFileSync(`page-${index + 1}.png`, pngBuffer);
|
||||||
|
});
|
||||||
|
|
||||||
|
await smartPdf.stop();
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Using External Browser Instance
|
||||||
|
For advanced use cases, you can provide your own Puppeteer browser instance:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
import puppeteer from 'puppeteer';
|
||||||
|
|
||||||
|
async function useExternalBrowser() {
|
||||||
|
// Create your own browser instance with custom options
|
||||||
|
const browser = await puppeteer.launch({
|
||||||
|
headless: true,
|
||||||
|
args: ['--no-sandbox', '--disable-setuid-sandbox']
|
||||||
|
});
|
||||||
|
|
||||||
|
const smartPdf = await SmartPdf.create();
|
||||||
|
await smartPdf.start(browser);
|
||||||
|
|
||||||
|
// Use SmartPdf normally
|
||||||
|
const pdf = await smartPdf.getA4PdfResultForHtmlString('<h1>Hello</h1>');
|
||||||
|
|
||||||
|
// SmartPdf will not close the browser when stopping
|
||||||
|
await smartPdf.stop();
|
||||||
|
|
||||||
|
// You control the browser lifecycle
|
||||||
|
await browser.close();
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Running Multiple Instances
|
||||||
|
Thanks to automatic port allocation, you can run multiple SmartPdf instances simultaneously:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
async function runMultipleInstances() {
|
||||||
|
// Each instance automatically finds its own free port
|
||||||
|
const instance1 = await SmartPdf.create();
|
||||||
|
const instance2 = await SmartPdf.create();
|
||||||
|
const instance3 = await SmartPdf.create();
|
||||||
|
|
||||||
|
// Start all instances
|
||||||
|
await Promise.all([
|
||||||
|
instance1.start(),
|
||||||
|
instance2.start(),
|
||||||
|
instance3.start()
|
||||||
|
]);
|
||||||
|
|
||||||
|
console.log(`Instance 1 running on port: ${instance1.serverPort}`);
|
||||||
|
console.log(`Instance 2 running on port: ${instance2.serverPort}`);
|
||||||
|
console.log(`Instance 3 running on port: ${instance3.serverPort}`);
|
||||||
|
|
||||||
|
// Use instances independently
|
||||||
|
const pdfs = await Promise.all([
|
||||||
|
instance1.getA4PdfResultForHtmlString('<h1>PDF 1</h1>'),
|
||||||
|
instance2.getA4PdfResultForHtmlString('<h1>PDF 2</h1>'),
|
||||||
|
instance3.getA4PdfResultForHtmlString('<h1>PDF 3</h1>')
|
||||||
|
]);
|
||||||
|
|
||||||
|
// Clean up all instances
|
||||||
|
await Promise.all([
|
||||||
|
instance1.stop(),
|
||||||
|
instance2.stop(),
|
||||||
|
instance3.stop()
|
||||||
|
]);
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Error Handling
|
||||||
|
Always wrap SmartPdf operations in try-catch blocks and ensure proper cleanup:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
async function safePdfGeneration() {
|
||||||
|
let smartPdf: SmartPdf;
|
||||||
|
|
||||||
|
try {
|
||||||
|
smartPdf = await SmartPdf.create();
|
||||||
|
await smartPdf.start();
|
||||||
|
|
||||||
|
const pdf = await smartPdf.getA4PdfResultForHtmlString('<h1>Hello</h1>');
|
||||||
|
// Process PDF...
|
||||||
|
|
||||||
|
} catch (error) {
|
||||||
|
console.error('PDF generation failed:', error);
|
||||||
|
// Handle error appropriately
|
||||||
|
} finally {
|
||||||
|
// Always cleanup
|
||||||
|
if (smartPdf) {
|
||||||
|
await smartPdf.stop();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### IPdf Interface
|
||||||
|
The `IPdf` interface represents a PDF with its metadata:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
interface IPdf {
|
||||||
|
name: string; // Filename of the PDF
|
||||||
|
buffer: Buffer; // PDF content as buffer
|
||||||
|
id: string | null; // Unique identifier
|
||||||
|
metadata?: {
|
||||||
|
textExtraction?: string; // Extracted text content
|
||||||
|
};
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
## Best Practices
|
||||||
|
|
||||||
|
1. **Always start and stop**: Initialize with `start()` and clean up with `stop()` to properly manage resources.
|
||||||
|
2. **Port management**: Use the automatic port allocation feature to avoid conflicts when running multiple instances.
|
||||||
|
3. **Error handling**: Always implement proper error handling as PDF generation can fail due to various reasons.
|
||||||
|
4. **Resource cleanup**: Ensure `stop()` is called even if an error occurs to prevent memory leaks.
|
||||||
|
5. **HTML optimization**: When creating PDFs from HTML, ensure your HTML is well-formed and CSS is embedded or inlined.
|
||||||
|
|
||||||
|
## License and Legal Information
|
||||||
|
|
||||||
|
This repository contains open-source code that is licensed under the MIT License. A copy of the MIT License can be found in the [license](license) file within this repository.
|
||||||
|
|
||||||
|
**Please note:** The MIT License does not grant permission to use the trade names, trademarks, service marks, or product names of the project, except as required for reasonable and customary use in describing the origin of the work and reproducing the content of the NOTICE file.
|
||||||
|
|
||||||
|
### Trademarks
|
||||||
|
|
||||||
|
This project is owned and maintained by Task Venture Capital GmbH. The names and logos associated with Task Venture Capital GmbH and any related products or services are trademarks of Task Venture Capital GmbH and are not included within the scope of the MIT license granted herein. Use of these trademarks must comply with Task Venture Capital GmbH's Trademark Guidelines, and any usage must be approved in writing by Task Venture Capital GmbH.
|
||||||
|
|
||||||
|
### Company Information
|
||||||
|
|
||||||
|
Task Venture Capital GmbH
|
||||||
|
Registered at District court Bremen HRB 35230 HB, Germany
|
||||||
|
|
||||||
|
For any legal inquiries or if you require further information, please contact us via email at hello@task.vc.
|
||||||
|
|
||||||
|
By using this repository, you acknowledge that you have read this section, agree to comply with its terms, and understand that the licensing of the code does not imply endorsement by Task Venture Capital GmbH of any derivative works.
|
97
test/test.port.ts
Normal file
97
test/test.port.ts
Normal file
@@ -0,0 +1,97 @@
|
|||||||
|
import { expect, tap } from '@git.zone/tstest/tapbundle';
|
||||||
|
import * as smartpdf from '../ts/index.js';
|
||||||
|
|
||||||
|
tap.test('should create multiple SmartPdf instances with automatic port allocation', async () => {
|
||||||
|
const instance1 = new smartpdf.SmartPdf();
|
||||||
|
const instance2 = new smartpdf.SmartPdf();
|
||||||
|
const instance3 = new smartpdf.SmartPdf();
|
||||||
|
|
||||||
|
// Start all instances
|
||||||
|
await instance1.start();
|
||||||
|
await instance2.start();
|
||||||
|
await instance3.start();
|
||||||
|
|
||||||
|
// Verify every instance was assigned a port within the default range (20000-30000)
|
||||||
|
expect(instance1.serverPort).toBeGreaterThanOrEqual(20000);
|
||||||
|
expect(instance1.serverPort).toBeLessThanOrEqual(30000);
|
||||||
|
expect(instance2.serverPort).toBeGreaterThanOrEqual(20000);
|
||||||
|
expect(instance2.serverPort).toBeLessThanOrEqual(30000);
|
||||||
|
expect(instance3.serverPort).toBeGreaterThanOrEqual(20000);
|
||||||
|
expect(instance3.serverPort).toBeLessThanOrEqual(30000);
|
||||||
|
|
||||||
|
// Ensure all ports are different
|
||||||
|
expect(instance1.serverPort).not.toEqual(instance2.serverPort);
|
||||||
|
expect(instance1.serverPort).not.toEqual(instance3.serverPort);
|
||||||
|
expect(instance2.serverPort).not.toEqual(instance3.serverPort);
|
||||||
|
|
||||||
|
console.log(`Instance 1 port: ${instance1.serverPort}`);
|
||||||
|
console.log(`Instance 2 port: ${instance2.serverPort}`);
|
||||||
|
console.log(`Instance 3 port: ${instance3.serverPort}`);
|
||||||
|
|
||||||
|
// Test that all instances work correctly
|
||||||
|
const pdf1 = await instance1.getA4PdfResultForHtmlString('<h1>Instance 1</h1>');
|
||||||
|
const pdf2 = await instance2.getA4PdfResultForHtmlString('<h1>Instance 2</h1>');
|
||||||
|
const pdf3 = await instance3.getA4PdfResultForHtmlString('<h1>Instance 3</h1>');
|
||||||
|
|
||||||
|
expect(pdf1.buffer).toBeInstanceOf(Buffer);
|
||||||
|
expect(pdf2.buffer).toBeInstanceOf(Buffer);
|
||||||
|
expect(pdf3.buffer).toBeInstanceOf(Buffer);
|
||||||
|
|
||||||
|
// Clean up
|
||||||
|
await instance1.stop();
|
||||||
|
await instance2.stop();
|
||||||
|
await instance3.stop();
|
||||||
|
});
|
||||||
|
|
||||||
|
tap.test('should create SmartPdf instance with custom port range', async () => {
|
||||||
|
const customInstance = new smartpdf.SmartPdf({
|
||||||
|
portRangeStart: 25000,
|
||||||
|
portRangeEnd: 26000
|
||||||
|
});
|
||||||
|
|
||||||
|
await customInstance.start();
|
||||||
|
|
||||||
|
expect(customInstance.serverPort).toBeGreaterThanOrEqual(25000);
|
||||||
|
expect(customInstance.serverPort).toBeLessThanOrEqual(26000);
|
||||||
|
|
||||||
|
console.log(`Custom range instance port: ${customInstance.serverPort}`);
|
||||||
|
|
||||||
|
await customInstance.stop();
|
||||||
|
});
|
||||||
|
|
||||||
|
tap.test('should create SmartPdf instance with specific port', async () => {
|
||||||
|
const specificPortInstance = new smartpdf.SmartPdf({
|
||||||
|
port: 28888
|
||||||
|
});
|
||||||
|
|
||||||
|
await specificPortInstance.start();
|
||||||
|
|
||||||
|
expect(specificPortInstance.serverPort).toEqual(28888);
|
||||||
|
|
||||||
|
console.log(`Specific port instance: ${specificPortInstance.serverPort}`);
|
||||||
|
|
||||||
|
await specificPortInstance.stop();
|
||||||
|
});
|
||||||
|
|
||||||
|
tap.test('should throw error when specific port is already in use', async () => {
|
||||||
|
const instance1 = new smartpdf.SmartPdf({ port: 29999 });
|
||||||
|
await instance1.start();
|
||||||
|
|
||||||
|
const instance2 = new smartpdf.SmartPdf({ port: 29999 });
|
||||||
|
|
||||||
|
let errorThrown = false;
|
||||||
|
try {
|
||||||
|
await instance2.start();
|
||||||
|
} catch (error) {
|
||||||
|
errorThrown = true;
|
||||||
|
expect(error.message).toInclude('already in use');
|
||||||
|
}
|
||||||
|
|
||||||
|
expect(errorThrown).toBeTrue();
|
||||||
|
|
||||||
|
await instance1.stop();
|
||||||
|
});
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
export default tap.start();
|
91
test/test.ts
91
test/test.ts
@@ -1,60 +1,85 @@
|
|||||||
import { expect, tap } from '@pushrocks/tapbundle';
|
import { expect, tap } from '@git.zone/tstest/tapbundle';
|
||||||
import * as smartpdf from '../ts/index.js';
|
import * as smartpdf from '../ts/index.js';
|
||||||
|
import * as fs from 'fs';
|
||||||
|
import * as path from 'path';
|
||||||
|
|
||||||
let testSmartPdf: smartpdf.SmartPdf;
|
let testSmartPdf: smartpdf.SmartPdf;
|
||||||
|
|
||||||
tap.test('should create a valid instance of smartpdf', async () => {
|
/**
|
||||||
|
* Ensures that a directory exists.
|
||||||
|
* @param dirPath - The directory path to ensure.
|
||||||
|
*/
|
||||||
|
function ensureDir(dirPath: string): void {
|
||||||
|
if (!fs.existsSync(dirPath)) {
|
||||||
|
fs.mkdirSync(dirPath, { recursive: true });
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
tap.test('should create a valid instance of SmartPdf', async () => {
|
||||||
testSmartPdf = new smartpdf.SmartPdf();
|
testSmartPdf = new smartpdf.SmartPdf();
|
||||||
expect(testSmartPdf).toBeInstanceOf(smartpdf.SmartPdf);
|
expect(testSmartPdf).toBeInstanceOf(smartpdf.SmartPdf);
|
||||||
});
|
});
|
||||||
|
|
||||||
tap.test('should start the instance', async () => {
|
tap.test('should start the SmartPdf instance', async () => {
|
||||||
await testSmartPdf.start();
|
await testSmartPdf.start();
|
||||||
});
|
});
|
||||||
|
|
||||||
tap.test('should create a pdf from html string', async () => {
|
tap.test('should create PDFs from HTML string', async () => {
|
||||||
await testSmartPdf.getA4PdfResultForHtmlString('hi');
|
const pdf1 = await testSmartPdf.getA4PdfResultForHtmlString('hi');
|
||||||
|
const pdf2 = await testSmartPdf.getA4PdfResultForHtmlString('hello');
|
||||||
|
expect(pdf1.buffer).toBeInstanceOf(Buffer);
|
||||||
|
expect(pdf2.buffer).toBeInstanceOf(Buffer);
|
||||||
});
|
});
|
||||||
|
|
||||||
tap.test('should create a pdf from html string', async () => {
|
tap.test('should create PDFs from websites', async () => {
|
||||||
await testSmartPdf.getA4PdfResultForHtmlString('hi');
|
const pdfA4 = await testSmartPdf.getPdfResultForWebsite('https://www.wikipedia.org');
|
||||||
|
const pdfSingle = await testSmartPdf.getFullWebsiteAsSinglePdf('https://www.wikipedia.org');
|
||||||
|
expect(pdfA4.buffer).toBeInstanceOf(Buffer);
|
||||||
|
expect(pdfSingle.buffer).toBeInstanceOf(Buffer);
|
||||||
});
|
});
|
||||||
|
|
||||||
tap.test('should create a pdf from website as A4', async () => {
|
tap.test('should create valid PDF results and write them to disk', async () => {
|
||||||
await testSmartPdf.getPdfResultForWebsite('https://www.wikipedia.org');
|
const writePdfToDisk = async (urlArg: string, fileName: string) => {
|
||||||
});
|
|
||||||
|
|
||||||
tap.test('should create a pdf from website as single page PDF', async () => {
|
|
||||||
await testSmartPdf.getFullWebsiteAsSinglePdf('https://www.wikipedia.org');
|
|
||||||
});
|
|
||||||
|
|
||||||
tap.test('should create a valid PDFResult', async () => {
|
|
||||||
const writePDfToDisk = async (urlArg: string, fileName: string) => {
|
|
||||||
const pdfResult = await testSmartPdf.getFullWebsiteAsSinglePdf(urlArg);
|
const pdfResult = await testSmartPdf.getFullWebsiteAsSinglePdf(urlArg);
|
||||||
expect(pdfResult.buffer).toBeInstanceOf(Buffer);
|
expect(pdfResult.buffer).toBeInstanceOf(Buffer);
|
||||||
const fs = await import('fs');
|
ensureDir('.nogit');
|
||||||
|
fs.writeFileSync(path.join('.nogit', fileName), pdfResult.buffer as Buffer);
|
||||||
if (!fs.existsSync('.nogit/')) {
|
|
||||||
fs.mkdirSync('.nogit/');
|
|
||||||
}
|
|
||||||
fs.writeFileSync(`.nogit/${fileName}`, pdfResult.buffer as Buffer);
|
|
||||||
};
|
};
|
||||||
await writePDfToDisk('https://maintainedby.lossless.com/', '1.pdf');
|
await writePdfToDisk('https://lossless.com/', '1.pdf');
|
||||||
await writePDfToDisk('https://rendertron.lossless.one/render/https://layer.io', '2.pdf');
|
await writePdfToDisk('https://layer.io', '2.pdf');
|
||||||
});
|
});
|
||||||
|
|
||||||
tap.test('should combine pdfs', async () => {
|
tap.test('should merge PDFs into a combined PDF', async () => {
|
||||||
const fs = await import('fs');
|
|
||||||
const pdf1 = await testSmartPdf.readFileToPdfObject('.nogit/1.pdf');
|
const pdf1 = await testSmartPdf.readFileToPdfObject('.nogit/1.pdf');
|
||||||
const pdf2 = await testSmartPdf.readFileToPdfObject('.nogit/2.pdf');
|
const pdf2 = await testSmartPdf.readFileToPdfObject('.nogit/2.pdf');
|
||||||
fs.writeFileSync(
|
const mergedBuffer = await testSmartPdf.mergePdfs([pdf1.buffer, pdf2.buffer]);
|
||||||
`.nogit/combined.pdf`,
|
ensureDir('.nogit');
|
||||||
(await testSmartPdf.mergePdfs([pdf1, pdf2])).buffer as Buffer
|
fs.writeFileSync(path.join('.nogit', 'combined.pdf'), mergedBuffer);
|
||||||
);
|
|
||||||
});
|
});
|
||||||
|
|
||||||
tap.test('should be able to close properly', async () => {
|
tap.test('should create PNG images from combined PDF using Puppeteer conversion', async () => {
|
||||||
|
const pdfObject = await testSmartPdf.readFileToPdfObject('.nogit/combined.pdf');
|
||||||
|
const images = await testSmartPdf.convertPDFToPngBytes(pdfObject.buffer);
|
||||||
|
expect(images.length).toBeGreaterThan(0);
|
||||||
|
console.log('Puppeteer-based conversion image sizes:', images.map(img => img.length));
|
||||||
|
});
|
||||||
|
|
||||||
|
tap.test('should store PNG results from both conversion functions in .nogit/testresults', async () => {
|
||||||
|
const testResultsDir = path.join('.nogit', 'testresults');
|
||||||
|
ensureDir(testResultsDir);
|
||||||
|
|
||||||
|
const pdfObject = await testSmartPdf.readFileToPdfObject('.nogit/combined.pdf');
|
||||||
|
|
||||||
|
// Convert using Puppeteer-based function and store images
|
||||||
|
const imagesPuppeteer = await testSmartPdf.convertPDFToPngBytes(pdfObject.buffer);
|
||||||
|
imagesPuppeteer.forEach((img, index) => {
|
||||||
|
const filePath = path.join(testResultsDir, `puppeteer_method_page_${index + 1}.png`);
|
||||||
|
fs.writeFileSync(filePath, Buffer.from(img));
|
||||||
|
});
|
||||||
|
});
|
||||||
|
|
||||||
|
tap.test('should close the SmartPdf instance properly', async () => {
|
||||||
await testSmartPdf.stop();
|
await testSmartPdf.stop();
|
||||||
});
|
});
|
||||||
|
|
||||||
tap.start();
|
tap.start();
|
@@ -1,8 +1,8 @@
|
|||||||
/**
|
/**
|
||||||
* autocreated commitinfo by @pushrocks/commitinfo
|
* autocreated commitinfo by @push.rocks/commitinfo
|
||||||
*/
|
*/
|
||||||
export const commitinfo = {
|
export const commitinfo = {
|
||||||
name: '@pushrocks/smartpdf',
|
name: '@push.rocks/smartpdf',
|
||||||
version: '3.0.14',
|
version: '3.2.2',
|
||||||
description: 'create pdfs on the fly'
|
description: 'A library for creating PDFs dynamically from HTML or websites with additional features like merging PDFs.'
|
||||||
}
|
}
|
||||||
|
@@ -7,3 +7,9 @@ declare global {
|
|||||||
|
|
||||||
// normal
|
// normal
|
||||||
export * from './smartpdf.classes.smartpdf.js';
|
export * from './smartpdf.classes.smartpdf.js';
|
||||||
|
|
||||||
|
// additional types
|
||||||
|
import type * as tsclassTypes from '@tsclass/tsclass';
|
||||||
|
type IPdf = tsclassTypes.business.IPdf;
|
||||||
|
|
||||||
|
export type { IPdf };
|
||||||
|
@@ -2,14 +2,21 @@ import * as plugins from './smartpdf.plugins.js';
|
|||||||
import * as paths from './smartpdf.paths.js';
|
import * as paths from './smartpdf.paths.js';
|
||||||
import { Server } from 'http';
|
import { Server } from 'http';
|
||||||
import { PdfCandidate } from './smartpdf.classes.pdfcandidate.js';
|
import { PdfCandidate } from './smartpdf.classes.pdfcandidate.js';
|
||||||
import { IPdf } from '@tsclass/tsclass/dist_ts/business/pdf.js';
|
import { type IPdf } from '@tsclass/tsclass/dist_ts/business/pdf.js';
|
||||||
|
import { execFile } from 'child_process';
|
||||||
|
|
||||||
declare const document: any;
|
declare const document: any;
|
||||||
|
|
||||||
|
export interface ISmartPdfOptions {
|
||||||
|
port?: number;
|
||||||
|
portRangeStart?: number;
|
||||||
|
portRangeEnd?: number;
|
||||||
|
}
|
||||||
|
|
||||||
export class SmartPdf {
|
export class SmartPdf {
|
||||||
// STATIC
|
// STATIC
|
||||||
public static async create() {
|
public static async create(optionsArg?: ISmartPdfOptions) {
|
||||||
const smartpdfInstance = new SmartPdf();
|
const smartpdfInstance = new SmartPdf(optionsArg);
|
||||||
return smartpdfInstance;
|
return smartpdfInstance;
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -20,9 +27,15 @@ export class SmartPdf {
|
|||||||
externalBrowserBool: boolean = false;
|
externalBrowserBool: boolean = false;
|
||||||
private _readyDeferred: plugins.smartpromise.Deferred<void>;
|
private _readyDeferred: plugins.smartpromise.Deferred<void>;
|
||||||
private _candidates: { [key: string]: PdfCandidate } = {};
|
private _candidates: { [key: string]: PdfCandidate } = {};
|
||||||
|
private _options: ISmartPdfOptions;
|
||||||
|
|
||||||
constructor() {
|
constructor(optionsArg?: ISmartPdfOptions) {
|
||||||
this._readyDeferred = new plugins.smartpromise.Deferred();
|
this._readyDeferred = new plugins.smartpromise.Deferred();
|
||||||
|
this._options = {
|
||||||
|
portRangeStart: 20000,
|
||||||
|
portRangeEnd: 30000,
|
||||||
|
...optionsArg
|
||||||
|
};
|
||||||
}
|
}
|
||||||
|
|
||||||
async start(headlessBrowserArg?: plugins.smartpuppeteer.puppeteer.Browser) {
|
async start(headlessBrowserArg?: plugins.smartpuppeteer.puppeteer.Browser) {
|
||||||
@@ -34,21 +47,56 @@ export class SmartPdf {
|
|||||||
this.externalBrowserBool = true;
|
this.externalBrowserBool = true;
|
||||||
} else {
|
} else {
|
||||||
this.headlessBrowser = await plugins.smartpuppeteer.getEnvAwareBrowserInstance({
|
this.headlessBrowser = await plugins.smartpuppeteer.getEnvAwareBrowserInstance({
|
||||||
forceNoSandbox: true,
|
forceNoSandbox: false,
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
|
||||||
// setup server
|
// Find an available port BEFORE creating server
|
||||||
|
const smartnetworkInstance = new plugins.smartnetwork.SmartNetwork();
|
||||||
|
|
||||||
|
if (this._options.port) {
|
||||||
|
// If a specific port is requested, check if it's available
|
||||||
|
const isPortAvailable = await smartnetworkInstance.isLocalPortUnused(this._options.port);
|
||||||
|
if (isPortAvailable) {
|
||||||
|
this.serverPort = this._options.port;
|
||||||
|
} else {
|
||||||
|
// Clean up browser if we created one
|
||||||
|
if (!this.externalBrowserBool && this.headlessBrowser) {
|
||||||
|
await this.headlessBrowser.close();
|
||||||
|
}
|
||||||
|
throw new Error(`Requested port ${this._options.port} is already in use`);
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
// Find a free port in the specified range
|
||||||
|
this.serverPort = await smartnetworkInstance.findFreePort(
|
||||||
|
this._options.portRangeStart,
|
||||||
|
this._options.portRangeEnd
|
||||||
|
);
|
||||||
|
if (!this.serverPort) {
|
||||||
|
// Clean up browser if we created one
|
||||||
|
if (!this.externalBrowserBool && this.headlessBrowser) {
|
||||||
|
await this.headlessBrowser.close();
|
||||||
|
}
|
||||||
|
throw new Error(`No free ports available in range ${this._options.portRangeStart}-${this._options.portRangeEnd}`);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Now setup server after we know we have a valid port
|
||||||
const app = plugins.express();
|
const app = plugins.express();
|
||||||
app.get('/:pdfId', (req, res) => {
|
app.get('/:pdfId', (req, res) => {
|
||||||
res.setHeader('PDF-ID', this._candidates[req.params.pdfId].pdfId);
|
const wantedCandidate = this._candidates[req.params.pdfId];
|
||||||
res.send(this._candidates[req.params.pdfId].htmlString);
|
if (!wantedCandidate) {
|
||||||
|
console.log(`${req.url} not attached to a candidate`);
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
res.setHeader('pdf-id', wantedCandidate.pdfId);
|
||||||
|
res.send(wantedCandidate.htmlString);
|
||||||
});
|
});
|
||||||
this.htmlServerInstance = plugins.http.createServer(app);
|
this.htmlServerInstance = plugins.http.createServer(app);
|
||||||
const smartnetworkInstance = new plugins.smartnetwork.SmartNetwork();
|
|
||||||
const portAvailable = smartnetworkInstance.isLocalPortUnused(3210);
|
this.htmlServerInstance.listen(this.serverPort, 'localhost');
|
||||||
this.htmlServerInstance.listen(3210, 'localhost');
|
|
||||||
this.htmlServerInstance.on('listening', () => {
|
this.htmlServerInstance.on('listening', () => {
|
||||||
|
console.log(`SmartPdf server listening on port ${this.serverPort}`);
|
||||||
this._readyDeferred.resolve();
|
this._readyDeferred.resolve();
|
||||||
done.resolve();
|
done.resolve();
|
||||||
});
|
});
|
||||||
@@ -70,7 +118,7 @@ export class SmartPdf {
|
|||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* returns a pdf for a given html string;
|
* Returns a PDF for a given HTML string.
|
||||||
*/
|
*/
|
||||||
async getA4PdfResultForHtmlString(htmlStringArg: string): Promise<plugins.tsclass.business.IPdf> {
|
async getA4PdfResultForHtmlString(htmlStringArg: string): Promise<plugins.tsclass.business.IPdf> {
|
||||||
await this._readyDeferred.promise;
|
await this._readyDeferred.promise;
|
||||||
@@ -81,10 +129,9 @@ export class SmartPdf {
|
|||||||
width: 794,
|
width: 794,
|
||||||
height: 1122,
|
height: 1122,
|
||||||
});
|
});
|
||||||
const response = await page.goto(`http://localhost:3210/${pdfCandidate.pdfId}`, {
|
const response = await page.goto(`http://localhost:${this.serverPort}/${pdfCandidate.pdfId}`, {
|
||||||
waitUntil: 'networkidle2',
|
waitUntil: 'networkidle2',
|
||||||
});
|
});
|
||||||
// await plugins.smartdelay.delayFor(1000);
|
|
||||||
const headers = response.headers();
|
const headers = response.headers();
|
||||||
if (headers['pdf-id'] !== pdfCandidate.pdfId) {
|
if (headers['pdf-id'] !== pdfCandidate.pdfId) {
|
||||||
console.log('Error! Headers do not match. For security reasons no pdf is being emitted!');
|
console.log('Error! Headers do not match. For security reasons no pdf is being emitted!');
|
||||||
@@ -99,6 +146,8 @@ export class SmartPdf {
|
|||||||
printBackground: true,
|
printBackground: true,
|
||||||
displayHeaderFooter: false,
|
displayHeaderFooter: false,
|
||||||
});
|
});
|
||||||
|
// Convert Uint8Array to Node Buffer
|
||||||
|
const nodePdfBuffer = Buffer.from(pdfBuffer);
|
||||||
await page.close();
|
await page.close();
|
||||||
delete this._candidates[pdfCandidate.pdfId];
|
delete this._candidates[pdfCandidate.pdfId];
|
||||||
pdfCandidate.doneDeferred.resolve();
|
pdfCandidate.doneDeferred.resolve();
|
||||||
@@ -107,9 +156,9 @@ export class SmartPdf {
|
|||||||
id: pdfCandidate.pdfId,
|
id: pdfCandidate.pdfId,
|
||||||
name: `${pdfCandidate.pdfId}.js`,
|
name: `${pdfCandidate.pdfId}.js`,
|
||||||
metadata: {
|
metadata: {
|
||||||
textExtraction: await this.extractTextFromPdfBuffer(pdfBuffer),
|
textExtraction: await this.extractTextFromPdfBuffer(nodePdfBuffer),
|
||||||
},
|
},
|
||||||
buffer: pdfBuffer,
|
buffer: nodePdfBuffer,
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -134,14 +183,16 @@ export class SmartPdf {
|
|||||||
printBackground: true,
|
printBackground: true,
|
||||||
displayHeaderFooter: false,
|
displayHeaderFooter: false,
|
||||||
});
|
});
|
||||||
|
// Convert Uint8Array to Node Buffer
|
||||||
|
const nodePdfBuffer = Buffer.from(pdfBuffer);
|
||||||
await page.close();
|
await page.close();
|
||||||
return {
|
return {
|
||||||
id: pdfId,
|
id: pdfId,
|
||||||
name: `${pdfId}.js`,
|
name: `${pdfId}.js`,
|
||||||
metadata: {
|
metadata: {
|
||||||
textExtraction: await this.extractTextFromPdfBuffer(pdfBuffer),
|
textExtraction: await this.extractTextFromPdfBuffer(nodePdfBuffer),
|
||||||
},
|
},
|
||||||
buffer: pdfBuffer,
|
buffer: nodePdfBuffer,
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -151,15 +202,23 @@ export class SmartPdf {
|
|||||||
width: 1920,
|
width: 1920,
|
||||||
height: 1200,
|
height: 1200,
|
||||||
});
|
});
|
||||||
page.emulateMediaType('screen');
|
await page.emulateMediaType('screen');
|
||||||
const response = await page.goto(websiteUrl, { waitUntil: 'networkidle2' });
|
const response = await page.goto(websiteUrl, { waitUntil: 'networkidle2' });
|
||||||
const pdfId = plugins.smartunique.shortId();
|
const pdfId = plugins.smartunique.shortId();
|
||||||
|
// Use both document.body and document.documentElement to ensure we have a valid height and width.
|
||||||
const { documentHeight, documentWidth } = await page.evaluate(() => {
|
const { documentHeight, documentWidth } = await page.evaluate(() => {
|
||||||
return {
|
return {
|
||||||
documentHeight: document.body.scrollHeight,
|
documentHeight: Math.max(
|
||||||
documentWidth: document.body.clientWidth,
|
document.body.scrollHeight,
|
||||||
|
document.documentElement.scrollHeight
|
||||||
|
) || 1200,
|
||||||
|
documentWidth: Math.max(
|
||||||
|
document.body.clientWidth,
|
||||||
|
document.documentElement.clientWidth
|
||||||
|
) || 1920,
|
||||||
};
|
};
|
||||||
});
|
});
|
||||||
|
// Update viewport height to the full document height.
|
||||||
await page.setViewport({
|
await page.setViewport({
|
||||||
width: 1920,
|
width: 1920,
|
||||||
height: documentHeight,
|
height: documentHeight,
|
||||||
@@ -172,35 +231,35 @@ export class SmartPdf {
|
|||||||
scale: 1,
|
scale: 1,
|
||||||
pageRanges: '1',
|
pageRanges: '1',
|
||||||
});
|
});
|
||||||
|
// Convert Uint8Array to Node Buffer
|
||||||
|
const nodePdfBuffer = Buffer.from(pdfBuffer);
|
||||||
await page.close();
|
await page.close();
|
||||||
return {
|
return {
|
||||||
id: pdfId,
|
id: pdfId,
|
||||||
name: `${pdfId}.js`,
|
name: `${pdfId}.js`,
|
||||||
metadata: {
|
metadata: {
|
||||||
textExtraction: await this.extractTextFromPdfBuffer(pdfBuffer),
|
textExtraction: await this.extractTextFromPdfBuffer(nodePdfBuffer),
|
||||||
},
|
},
|
||||||
buffer: pdfBuffer,
|
buffer: nodePdfBuffer,
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
||||||
public async mergePdfs(pdfArrayArg: plugins.tsclass.business.IPdf[]): Promise<IPdf> {
|
public async mergePdfs(inputPdfBuffers: Uint8Array[]): Promise<Uint8Array> {
|
||||||
const merger = new plugins.pdfMerger();
|
const mergedPdf = await plugins.pdfLib.PDFDocument.create();
|
||||||
for (const pdf of pdfArrayArg) {
|
for (const pdfBytes of inputPdfBuffers) {
|
||||||
merger.add(Buffer.from(pdf.buffer));
|
const pdfDoc = await plugins.pdfLib.PDFDocument.load(pdfBytes);
|
||||||
|
const pages = await mergedPdf.copyPages(pdfDoc, pdfDoc.getPageIndices());
|
||||||
|
pages.forEach((page) => mergedPdf.addPage(page));
|
||||||
}
|
}
|
||||||
const resultBuffer = await merger.saveAsBuffer();
|
|
||||||
return {
|
const mergedPdfBytes = await mergedPdf.save();
|
||||||
name: 'mergedPdf',
|
return mergedPdfBytes;
|
||||||
buffer: resultBuffer,
|
|
||||||
id: null,
|
|
||||||
metadata: null,
|
|
||||||
};
|
|
||||||
}
|
}
|
||||||
|
|
||||||
public async readFileToPdfObject(pathArg: string): Promise<plugins.tsclass.business.IPdf> {
|
public async readFileToPdfObject(pathArg: string): Promise<plugins.tsclass.business.IPdf> {
|
||||||
const path = plugins.smartpath.transform.makeAbsolute(pathArg);
|
const absolutePath = plugins.smartpath.transform.makeAbsolute(pathArg);
|
||||||
const parsedPath = plugins.path.parse(path);
|
const parsedPath = plugins.path.parse(absolutePath);
|
||||||
const buffer = await plugins.smartfile.fs.toBuffer(path);
|
const buffer = await plugins.smartfile.fs.toBuffer(absolutePath);
|
||||||
return {
|
return {
|
||||||
name: parsedPath.base,
|
name: parsedPath.base,
|
||||||
buffer,
|
buffer,
|
||||||
@@ -226,4 +285,110 @@ export class SmartPdf {
|
|||||||
pdfParser.parseBuffer(pdfBufferArg);
|
pdfParser.parseBuffer(pdfBufferArg);
|
||||||
return deferred.promise;
|
return deferred.promise;
|
||||||
}
|
}
|
||||||
}
|
|
||||||
|
/**
|
||||||
|
* Checks for the presence of required dependencies: GraphicsMagick and Ghostscript.
|
||||||
|
*/
|
||||||
|
private async checkDependencies(): Promise<void> {
|
||||||
|
await Promise.all([
|
||||||
|
this.checkCommandExists('gm', ['version']),
|
||||||
|
this.checkCommandExists('gs', ['--version']),
|
||||||
|
]);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Checks if a given command exists by trying to execute it.
|
||||||
|
*/
|
||||||
|
private checkCommandExists(command: string, args: string[]): Promise<void> {
|
||||||
|
return new Promise((resolve, reject) => {
|
||||||
|
execFile(command, args, (error, stdout, stderr) => {
|
||||||
|
if (error) {
|
||||||
|
reject(new Error(`Dependency check failed: ${command} is not installed or not in the PATH. ${error.message}`));
|
||||||
|
} else {
|
||||||
|
resolve();
|
||||||
|
}
|
||||||
|
});
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
 * Converts a PDF to PNG bytes, one PNG per page, using the headless browser and PDF.js.
 *
 * The PDF is embedded as base64 into a temporary HTML page that loads PDF.js from the
 * cdnjs CDN, renders every PDF page onto its own canvas at scale 1.0, and sets
 * `window.renderComplete` when done. Each canvas element is then screenshotted.
 *
 * @param pdfBytes Raw bytes of the PDF document to render.
 * @param options Currently not applied: the rendered canvas size is determined by the
 *                PDF page dimensions, so width, height and quality are ignored.
 * @returns One PNG image (as a Uint8Array) per canvas found on the page, in DOM order.
 * @throws If loading the page content, waiting for rendering (30 s timeout) or taking a
 *         screenshot fails. The browser page is closed in every case.
 */
public async convertPDFToPngBytes(
  pdfBytes: Uint8Array,
  options: { width?: number; height?: number; quality?: number } = {}
): Promise<Uint8Array[]> {
  // Note: options.width, options.height, and options.quality are not applied here,
  // as the rendered canvas size is determined by the PDF page dimensions.

  // Prepare PDF data as a base64 string.
  const base64Pdf: string = Buffer.from(pdfBytes).toString('base64');

  // HTML template that loads PDF.js and renders the PDF.
  const htmlTemplate: string = `
    <!DOCTYPE html>
    <html>
      <head>
        <meta charset="utf-8">
        <title>PDF to PNG Converter</title>
        <style>
          body { margin: 0; }
          canvas { display: block; margin: 10px auto; }
        </style>
        <script src="https://cdnjs.cloudflare.com/ajax/libs/pdf.js/2.16.105/pdf.min.js"></script>
      </head>
      <body>
        <script>
          (async function() {
            pdfjsLib.GlobalWorkerOptions.workerSrc = 'https://cdnjs.cloudflare.com/ajax/libs/pdf.js/2.16.105/pdf.worker.min.js';
            const pdfData = "__PDF_DATA__";
            const raw = atob(pdfData);
            const pdfArray = new Uint8Array([...raw].map(c => c.charCodeAt(0)));
            const loadingTask = pdfjsLib.getDocument({data: pdfArray});
            const pdf = await loadingTask.promise;
            const numPages = pdf.numPages;
            for (let pageNum = 1; pageNum <= numPages; pageNum++) {
              const page = await pdf.getPage(pageNum);
              const viewport = page.getViewport({ scale: 1.0 });
              const canvas = document.createElement('canvas');
              const context = canvas.getContext('2d');
              canvas.width = viewport.width;
              canvas.height = viewport.height;
              await page.render({ canvasContext: context, viewport: viewport }).promise;
              document.body.appendChild(canvas);
            }
            window.renderComplete = true;
          })();
        </script>
      </body>
    </html>
  `;

  // Replace the placeholder with the actual base64 PDF data.
  const htmlContent: string = htmlTemplate.replace("__PDF_DATA__", base64Pdf);

  // Create a new page using the headless browser.
  const page = await this.headlessBrowser.newPage();

  // From here on the page must be closed even when a step throws; otherwise every
  // failed conversion would leave an open page behind in the shared browser.
  try {
    // Set the page content.
    await page.setContent(htmlContent, { waitUntil: 'networkidle0' });

    // Wait until the PDF.js rendering is complete.
    await page.waitForFunction(() => (window as any).renderComplete === true, { timeout: 30000 });

    // Query all canvas elements (each representing a rendered PDF page).
    const canvasElements = await page.$$('canvas');
    const pngBuffers: Uint8Array[] = [];

    for (const canvasElement of canvasElements) {
      // Screenshot the canvas element. The screenshot will be a PNG buffer.
      const screenshotBuffer = (await canvasElement.screenshot({ encoding: 'binary' })) as Buffer;
      pngBuffers.push(new Uint8Array(screenshotBuffer));
    }

    return pngBuffers;
  } finally {
    await page.close();
  }
}
|
||||||
|
}
|
@@ -5,15 +5,17 @@ import * as path from 'path';
|
|||||||
export { http, path };
|
export { http, path };
|
||||||
|
|
||||||
// @pushrocks
|
// @pushrocks
|
||||||
import * as smartfile from '@pushrocks/smartfile';
|
import * as smartbuffer from '@push.rocks/smartbuffer';
|
||||||
import * as smartdelay from '@pushrocks/smartdelay';
|
import * as smartfile from '@push.rocks/smartfile';
|
||||||
import * as smartpromise from '@pushrocks/smartpromise';
|
import * as smartdelay from '@push.rocks/smartdelay';
|
||||||
import * as smartpath from '@pushrocks/smartpath';
|
import * as smartpromise from '@push.rocks/smartpromise';
|
||||||
import * as smartpuppeteer from '@pushrocks/smartpuppeteer';
|
import * as smartpath from '@push.rocks/smartpath';
|
||||||
import * as smartnetwork from '@pushrocks/smartnetwork';
|
import * as smartpuppeteer from '@push.rocks/smartpuppeteer';
|
||||||
import * as smartunique from '@pushrocks/smartunique';
|
import * as smartnetwork from '@push.rocks/smartnetwork';
|
||||||
|
import * as smartunique from '@push.rocks/smartunique';
|
||||||
|
|
||||||
export {
|
export {
|
||||||
|
smartbuffer,
|
||||||
smartfile,
|
smartfile,
|
||||||
smartdelay,
|
smartdelay,
|
||||||
smartpromise,
|
smartpromise,
|
||||||
@@ -29,9 +31,8 @@ import * as tsclass from '@tsclass/tsclass';
|
|||||||
export { tsclass };
|
export { tsclass };
|
||||||
|
|
||||||
// thirdparty
|
// thirdparty
|
||||||
import pdfMerger from 'pdf-merger-js';
|
|
||||||
// @ts-ignore
|
|
||||||
import pdf2json from 'pdf2json';
|
|
||||||
import express from 'express';
|
import express from 'express';
|
||||||
|
import pdf2json from 'pdf2json';
|
||||||
|
import pdfLib from 'pdf-lib';
|
||||||
|
|
||||||
export { pdfMerger, pdf2json, express };
|
export { express, pdf2json, pdfLib, };
|
||||||
|
@@ -1,9 +1,14 @@
|
|||||||
{
|
{
|
||||||
"compilerOptions": {
|
"compilerOptions": {
|
||||||
"experimentalDecorators": true,
|
"experimentalDecorators": true,
|
||||||
|
"useDefineForClassFields": false,
|
||||||
"target": "ES2022",
|
"target": "ES2022",
|
||||||
"module": "ES2022",
|
"module": "NodeNext",
|
||||||
"moduleResolution": "nodenext",
|
"moduleResolution": "NodeNext",
|
||||||
"allowSyntheticDefaultImports": true
|
"esModuleInterop": true,
|
||||||
}
|
"verbatimModuleSyntax": true
|
||||||
|
},
|
||||||
|
"exclude": [
|
||||||
|
"dist_*/**/*.d.ts"
|
||||||
|
]
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user