9 Commits
v0.0.9 ... main

Author SHA1 Message Date
Adrian Zürcher
4a9397457d add new functions for zip and byte slices 2026-01-07 17:04:26 +01:00
Adrian Zürcher
e6e833533e add progress to function 2026-01-06 11:12:15 +01:00
Adrian Zürcher
1822fc3628 add missing model 2026-01-06 10:15:08 +01:00
Adrian Zürcher
d80764b943 update function convert html 2026-01-06 10:03:20 +01:00
Adrian Zürcher
bd07add64e add function convert html 2026-01-06 09:54:47 +01:00
Adrian Zürcher
7fec8e1101 fix orphan instances 2025-12-29 17:15:52 +01:00
Adrian Zürcher
5b20d4406c fix canelation 2025-12-29 16:48:07 +01:00
Adrian Zürcher
40f683a917 fix hid terminal on windows 2025-12-29 14:59:24 +01:00
Adrian Zürcher
ff460fffa1 add new flags 2025-12-29 12:13:12 +01:00
7 changed files with 375 additions and 42 deletions

1
.gitignore vendored
View File

@@ -1,3 +1,4 @@
*.pdf *.pdf
assets assets
dst dst
*.zip

View File

@@ -1,6 +1,8 @@
package converter package converter
import ( import (
"archive/zip"
"bytes"
"context" "context"
"errors" "errors"
"fmt" "fmt"
@@ -18,8 +20,10 @@ import (
// html to pdf converter structure for // html to pdf converter structure for
type Converter struct { type Converter struct {
chromePath string chromePath string
ctx context.Context allocCtx context.Context
cancel context.CancelFunc allocCancel context.CancelFunc // Cancels the whole Chrome process manager
browserCtx context.Context // The specific browser instance
browserCancel context.CancelFunc // Closes the browser
progress func(progress int) progress func(progress int)
} }
@@ -27,10 +31,6 @@ type Converter struct {
func NewConverter(chromePath string) (*Converter, error) { func NewConverter(chromePath string) (*Converter, error) {
var err error var err error
if runtime.GOOS == "windows" {
hideConsole()
}
c := &Converter{chromePath: chromePath} c := &Converter{chromePath: chromePath}
chromePath, err = c.getChromePath() chromePath, err = c.getChromePath()
if err != nil { if err != nil {
@@ -42,14 +42,21 @@ func NewConverter(chromePath string) (*Converter, error) {
chromedp.NoSandbox, chromedp.NoSandbox,
chromedp.Headless, chromedp.Headless,
chromedp.DisableGPU, chromedp.DisableGPU,
chromedp.Flag("disable-software-rasterizer", true),
chromedp.Flag("disable-dev-shm-usage", true),
chromedp.Flag("no-first-run", true),
) )
var allocCtx context.Context opts = append(opts, platformOptions())
allocCtx, c.cancel = chromedp.NewExecAllocator(context.Background(), opts...)
c.ctx, c.cancel = chromedp.NewContext(allocCtx) c.allocCtx, c.allocCancel = chromedp.NewExecAllocator(context.Background(), opts...)
c.browserCtx, c.browserCancel = chromedp.NewContext(c.allocCtx)
// 5. "Warm up" the browser to ensure the executable actually runs
// This catches "file not found" or permission errors immediately
err = chromedp.Run(c.browserCtx)
if err != nil {
c.Close() // Cleanup if start fails
return nil, fmt.Errorf("failed to start chrome: %w", err)
}
return c, nil return c, nil
} }
@@ -58,7 +65,7 @@ func (c *Converter) SetProgressCallback(cb func(progress int)) {
} }
// Convert converts all given input files // Convert converts all given input files
func (c *Converter) Convert(files ...models.File) error { func (c *Converter) ConvertToPdf(files ...models.File) error {
for i, f := range files { for i, f := range files {
if c.progress != nil { if c.progress != nil {
c.progress(i + 1) c.progress(i + 1)
@@ -86,10 +93,11 @@ func (c *Converter) Convert(files ...models.File) error {
htmlURL.WriteString(filepath.ToSlash(absPath)) htmlURL.WriteString(filepath.ToSlash(absPath))
c.ctx, c.cancel = context.WithTimeout(c.ctx, 60*time.Second) taskCtx, taskCancel := chromedp.NewContext(c.browserCtx)
timeoutCtx, timeoutCancel := context.WithTimeout(taskCtx, 60*time.Second)
var pdfData []byte var pdfData []byte
err = chromedp.Run(c.ctx, err = chromedp.Run(timeoutCtx,
chromedp.Navigate(htmlURL.String()), chromedp.Navigate(htmlURL.String()),
chromedp.WaitReady("body", chromedp.ByQuery), chromedp.WaitReady("body", chromedp.ByQuery),
chromedp.ActionFunc(func(ctx context.Context) error { chromedp.ActionFunc(func(ctx context.Context) error {
@@ -106,21 +114,207 @@ func (c *Converter) Convert(files ...models.File) error {
}), }),
) )
timeoutCancel()
taskCancel()
if err != nil { if err != nil {
c.cancel()
return err return err
} }
// Save PDF to file // Save PDF to file
if err := os.WriteFile(f.Output, pdfData, 0644); err != nil { if err := os.WriteFile(f.Output, pdfData, 0644); err != nil {
c.cancel()
return err return err
} }
} }
c.cancel()
return nil return nil
} }
// ConvertHtmlsToPdf renders each in-memory HTML document to a PDF and writes
// it to the document's Output path.
//
// Documents are processed in order. For every document the progress callback
// (if set) is invoked with its 1-based position before validation. The call
// stops at the first failure and returns that error; PDFs already written for
// earlier documents stay on disk.
func (c *Converter) ConvertHtmlsToPdf(htmls ...models.Html) error {
	for idx := range htmls {
		doc := htmls[idx]

		if c.progress != nil {
			c.progress(idx + 1)
		}

		// filepath.Ext("") is "", so an empty Output is rejected by the
		// extension check as well.
		switch {
		case len(doc.Html) == 0:
			return fmt.Errorf("no .html input provided")
		case filepath.Ext(doc.Output) != ".pdf":
			return fmt.Errorf("no .pdf output file path provided: %s", doc.Output)
		}

		var rendered []byte

		// Replaces the content of the blank page with the caller's HTML.
		loadDocument := chromedp.ActionFunc(func(ctx context.Context) error {
			tree, err := page.GetFrameTree().Do(ctx)
			if err != nil {
				return err
			}
			return page.SetDocumentContent(tree.Frame.ID, string(doc.Html)).Do(ctx)
		})

		// Prints the page (8.27 x 11.69, i.e. A4 in inches) including backgrounds.
		printDocument := chromedp.ActionFunc(func(ctx context.Context) error {
			data, _, err := page.PrintToPDF().
				WithPrintBackground(true).
				WithPaperWidth(8.27).
				WithPaperHeight(11.69).
				Do(ctx)
			if err != nil {
				return err
			}
			rendered = data
			return nil
		})

		// Each document gets its own chromedp context derived from the shared
		// browser context, bounded by a 60 second timeout.
		tabCtx, closeTab := chromedp.NewContext(c.browserCtx)
		runCtx, stopTimer := context.WithTimeout(tabCtx, 60*time.Second)

		runErr := chromedp.Run(runCtx,
			chromedp.Navigate("about:blank"),
			loadDocument,
			chromedp.WaitReady("body", chromedp.ByQuery),
			printDocument,
		)

		stopTimer()
		closeTab()

		if runErr != nil {
			return runErr
		}

		if writeErr := os.WriteFile(doc.Output, rendered, 0644); writeErr != nil {
			return writeErr
		}
	}

	return nil
}
// ConvertHtmlsToBytes renders each in-memory HTML document to a PDF and
// returns the PDFs as byte slices, in input order.
//
// Nothing is written to disk, but every document must still carry an Output
// value ending in ".pdf"; otherwise an error is returned. The progress
// callback (if set) receives the 1-based position of each document before it
// is validated. On the first failure the call returns a nil slice and the
// error.
func (c *Converter) ConvertHtmlsToBytes(htmls ...models.Html) ([][]byte, error) {
	var pdfs [][]byte

	for pos, doc := range htmls {
		if c.progress != nil {
			c.progress(pos + 1)
		}

		if len(doc.Html) == 0 {
			return nil, fmt.Errorf("no .html input provided")
		}
		// An empty Output has the extension "" and is rejected here too.
		if filepath.Ext(doc.Output) != ".pdf" {
			return nil, fmt.Errorf("no .pdf output file path provided: %s", doc.Output)
		}

		// One chromedp context per document, derived from the shared browser
		// context and limited to 60 seconds.
		tabCtx, closeTab := chromedp.NewContext(c.browserCtx)
		runCtx, stopTimer := context.WithTimeout(tabCtx, 60*time.Second)

		var rendered []byte
		injectHTML := func(ctx context.Context) error {
			tree, err := page.GetFrameTree().Do(ctx)
			if err != nil {
				return err
			}
			return page.SetDocumentContent(tree.Frame.ID, string(doc.Html)).Do(ctx)
		}
		printPDF := func(ctx context.Context) error {
			request := page.PrintToPDF().
				WithPrintBackground(true).
				WithPaperWidth(8.27).
				WithPaperHeight(11.69)
			data, _, err := request.Do(ctx)
			if err != nil {
				return err
			}
			rendered = data
			return nil
		}

		runErr := chromedp.Run(runCtx,
			// Start from a blank page, then replace its content with the HTML.
			chromedp.Navigate("about:blank"),
			chromedp.ActionFunc(injectHTML),
			chromedp.WaitReady("body", chromedp.ByQuery),
			chromedp.ActionFunc(printPDF),
		)

		stopTimer()
		closeTab()

		if runErr != nil {
			return nil, runErr
		}

		pdfs = append(pdfs, rendered)
	}

	return pdfs, nil
}
// ConvertHtmlsToZip renders each in-memory HTML document to a PDF and returns
// a zip archive, as bytes, containing one entry per document.
//
// The entry name is the document's Output value (which must end in ".pdf"),
// converted to forward slashes because zip entry names may not contain
// backslashes. The progress callback (if set) receives the 1-based position
// of each document before it is validated.
//
// The call stops at the first failure and returns a nil slice and the error.
// Errors from writing an entry or finalizing the archive are reported instead
// of being dropped, so a non-nil result is always a completely written
// archive.
func (c *Converter) ConvertHtmlsToZip(htmls ...models.Html) ([]byte, error) {
	zipBuf := new(bytes.Buffer)
	zipWriter := zip.NewWriter(zipBuf)

	for i, h := range htmls {
		if c.progress != nil {
			c.progress(i + 1)
		}

		if len(h.Html) == 0 {
			return nil, fmt.Errorf("no .html input provided")
		}
		if h.Output == "" || filepath.Ext(h.Output) != ".pdf" {
			return nil, fmt.Errorf("no .pdf output file path provided: %s", h.Output)
		}

		// One chromedp context per document, derived from the shared browser
		// context and limited to 60 seconds.
		taskCtx, taskCancel := chromedp.NewContext(c.browserCtx)
		timeoutCtx, timeoutCancel := context.WithTimeout(taskCtx, 60*time.Second)

		var pdfData []byte
		err := chromedp.Run(timeoutCtx,
			// Start with a blank page
			chromedp.Navigate("about:blank"),

			// Inject HTML directly
			chromedp.ActionFunc(func(ctx context.Context) error {
				frameTree, err := page.GetFrameTree().Do(ctx)
				if err != nil {
					return err
				}
				return page.SetDocumentContent(frameTree.Frame.ID, string(h.Html)).Do(ctx)
			}),

			chromedp.WaitReady("body", chromedp.ByQuery),

			// Print with backgrounds on 8.27 x 11.69 paper (A4 in inches)
			chromedp.ActionFunc(func(ctx context.Context) error {
				buf, _, err := page.PrintToPDF().
					WithPrintBackground(true).
					WithPaperWidth(8.27).
					WithPaperHeight(11.69).
					Do(ctx)
				if err != nil {
					return err
				}
				pdfData = buf
				return nil
			}),
		)

		timeoutCancel()
		taskCancel()

		if err != nil {
			return nil, err
		}

		// Zip entry names must use forward slashes, also on Windows.
		name := filepath.ToSlash(h.Output)
		f, err := zipWriter.Create(name)
		if err != nil {
			return nil, fmt.Errorf("creating zip entry %q: %w", name, err)
		}
		if _, err := f.Write(pdfData); err != nil {
			return nil, fmt.Errorf("writing zip entry %q: %w", name, err)
		}
	}

	// Close writes the central directory; without it the archive is unreadable,
	// so its error must not be ignored.
	if err := zipWriter.Close(); err != nil {
		return nil, fmt.Errorf("finalizing zip archive: %w", err)
	}

	return zipBuf.Bytes(), nil
}
// Close releases the Chrome resources held by the converter by calling the
// stored cancel functions. It tolerates a converter whose cancel functions
// were never set.
func (c *Converter) Close() {
	// Same order as before: the browser context first, then the allocator.
	shutdown := []context.CancelFunc{c.browserCancel, c.allocCancel}
	for _, cancel := range shutdown {
		if cancel == nil {
			continue
		}
		cancel()
	}
}
// getChromePath checks for system Chrome, else falls back to bundled headless shell // getChromePath checks for system Chrome, else falls back to bundled headless shell
func (c *Converter) getChromePath() (string, error) { func (c *Converter) getChromePath() (string, error) {

View File

@@ -2,8 +2,9 @@
package converter package converter
// hideConsole does nothing on non-Windows systems import "github.com/chromedp/chromedp"
func hideConsole() {
// macOS and Linux don't have the same "console window" concept func platformOptions() chromedp.ExecAllocatorOption {
// that needs manual hiding at runtime like Windows. // Returns a no-op option for Mac/Linux
return chromedp.NoSandbox
} }

View File

@@ -3,21 +3,18 @@
package converter package converter
import ( import (
"os/exec"
"syscall" "syscall"
"github.com/chromedp/chromedp"
) )
var ( func platformOptions() chromedp.ExecAllocatorOption {
kernel32 = syscall.NewLazyDLL("kernel32.dll") return chromedp.ModifyCmdFunc(func(cmd *exec.Cmd) {
user32 = syscall.NewLazyDLL("user32.dll") if cmd.SysProcAttr == nil {
getConsoleWindow = kernel32.NewProc("GetConsoleWindow") cmd.SysProcAttr = &syscall.SysProcAttr{}
showWindow = user32.NewProc("ShowWindow")
)
const SW_HIDE = 0
func hideConsole() {
hwnd, _, _ := getConsoleWindow.Call()
if hwnd != 0 {
showWindow.Call(hwnd, SW_HIDE)
} }
cmd.SysProcAttr.HideWindow = true
cmd.SysProcAttr.CreationFlags = 0x08000000 // CREATE_NO_WINDOW
})
} }

View File

@@ -15,7 +15,9 @@ func Convert(chromePath, inputFile, outputFile string) error {
if err != nil { if err != nil {
return err return err
} }
return c.Convert(input) defer c.Close()
return c.ConvertToPdf(input)
} }
// NewConverterInstance start new chrome headless shell instance // NewConverterInstance start new chrome headless shell instance

View File

@@ -1,6 +1,7 @@
package html2pdf package html2pdf
import ( import (
"bytes"
"fmt" "fmt"
"os" "os"
"path/filepath" "path/filepath"
@@ -42,17 +43,145 @@ func TestConvertFiles(t *testing.T) {
}) })
} }
c, err := converter.NewConverter("./assets") c, err := converter.NewConverter("assets/chrome-headless-shell/win64")
if err != nil { if err != nil {
t.Fatal(err) t.Fatal(err)
} }
defer c.Close()
c.SetProgressCallback(func(progress int) { c.SetProgressCallback(func(progress int) {
fmt.Println(progress) fmt.Println(progress)
}) })
if err := c.Convert(input...); err != nil { if err := c.ConvertToPdf(input...); err != nil {
t.Fatal(err) t.Fatal(err)
} }
t.Log("test successfull") t.Log("test successfull")
} }
// TestConvertHtml is an integration test: it converts one in-memory HTML
// document with ConvertHtmlsToPdf and checks that a non-empty file starting
// with the PDF magic bytes was written to a temporary directory.
func TestConvertHtml(t *testing.T) {
	t.Log("start test ConvertHtml")

	// The test launches a real browser, so it is skipped in short mode.
	if testing.Short() {
		t.Skip("skipping ConvertHtml integration test in short mode")
	}

	document := []byte(`
<!DOCTYPE html>
<html>
<head>
<meta charset="utf-8">
<title>Test PDF</title>
<style>
body { font-family: Arial, sans-serif; }
h1 { color: #333; }
</style>
</head>
<body>
<h1>Hello PDF</h1>
<p>This is a test.</p>
</body>
</html>
`)

	target := filepath.Join(t.TempDir(), "test.pdf")

	conv, err := converter.NewConverter("assets/chrome-headless-shell/win64")
	if err != nil {
		t.Fatal(err)
	}
	defer conv.Close()

	if err := conv.ConvertHtmlsToPdf(models.Html{Html: document, Output: target}); err != nil {
		t.Fatalf("ConvertHtml failed: %v", err)
	}

	// The file must exist, be non-empty and start with the PDF header.
	pdf, err := os.ReadFile(target)
	switch {
	case err != nil:
		t.Fatalf("PDF not created: %v", err)
	case len(pdf) == 0:
		t.Fatal("PDF file is empty")
	case !bytes.HasPrefix(pdf, []byte("%PDF-")):
		t.Fatalf("output is not a valid PDF (missing %%PDF- header)")
	}

	t.Log("ConvertHtml test successful")
}
// TestConvertHtmlsToPDFZip is an integration test: it converts one in-memory
// HTML document with ConvertHtmlsToZip and checks that the returned bytes are
// a non-empty zip archive. The archive is also written to a temporary
// directory, so the test leaves no test.zip behind in the working tree.
func TestConvertHtmlsToPDFZip(t *testing.T) {
	t.Log("start test ConvertHtmlsToZip")

	// The test launches a real browser, so it is skipped in short mode.
	if testing.Short() {
		t.Skip("skipping ConvertHtmlsToZip integration test in short mode")
	}

	html := []byte(`
<!DOCTYPE html>
<html>
<head>
<meta charset="utf-8">
<title>Test PDF</title>
<style>
body { font-family: Arial, sans-serif; }
h1 { color: #333; }
</style>
</head>
<body>
<h1>Hello PDF</h1>
<p>This is a test.</p>
</body>
</html>
`)

	c, err := converter.NewConverter("assets/chrome-headless-shell/win64")
	if err != nil {
		t.Fatal(err)
	}
	defer c.Close()

	// Output is only used as the entry name inside the archive.
	b, err := c.ConvertHtmlsToZip(models.Html{Html: html, Output: "test.pdf"})
	if err != nil {
		t.Fatalf("ConvertHtmlsToZip failed: %v", err)
	}

	// Assert non-empty
	if len(b) == 0 {
		t.Fatal("zip archive is empty")
	}

	// Assert zip local file header signature ("PK\x03\x04"), which starts
	// every archive that contains at least one entry.
	if !bytes.HasPrefix(b, []byte("PK\x03\x04")) {
		t.Fatal("output is not a valid zip archive (missing PK header)")
	}

	// Writing to a temp dir keeps the write path covered without polluting
	// the repository.
	zipPath := filepath.Join(t.TempDir(), "test.zip")
	if err := os.WriteFile(zipPath, b, 0644); err != nil {
		t.Fatalf("write to file: %v", err)
	}

	t.Log("ConvertHtmlsToZip test successful")
}

9
models/html.go Normal file
View File

@@ -0,0 +1,9 @@
package models
// Htmls is a list of Html inputs.
type Htmls []Html
// Html is the input model for converting an in-memory HTML document.
type Html struct {
// Html holds the raw HTML markup to render; the converter rejects it when empty.
Html []byte
// Output is the target name of the resulting PDF and must end in ".pdf".
// It is used as the file path when writing to disk and as the entry name
// when the PDF is added to a zip archive.
Output string
}