unarr/internal/engine/verify.go
Deivid Soto a5f3f0914a fix(engine): cross-backend integrity guard with retry-then-damaged
A truncated debrid download (in-memory byte counter hit 100% while the
NFS write-back silently dropped most of the bytes) was marked completed.
The 1.1.6 fsync fix closed the debrid-specific hole; this generalizes the
guarantee so "completed" never means a corrupt file on ANY backend.

- IntegrityError + bounded retry: on a corrupt/short result the manager
  re-downloads the same source up to 3x (clean start), then surfaces the
  task as damaged ("corrupt download:" prefix) instead of completing it.
- verify (size mismatch / empty), debrid (incomplete / post-write / flush),
  torrent (BytesMissing), usenet (par2 unrepairable / repair-failed) all
  classify integrity failures so they route through the retry/damaged path.
- scanner: a file ffprobe can't read is emitted as a damaged library_item
  (reason "unreadable") instead of being silently dropped from the sync.
- tests: manager retry-then-success + retry-exhausted-then-damaged,
  verifying->resolving transition, damaged sync item.
2026-06-17 12:58:43 +02:00

64 lines
1.7 KiB
Go

package engine
import (
"fmt"
"os"
"path/filepath"
)
// verify confirms that the download described by result exists on disk and
// is plausibly complete.
//
// A plain error is returned when result is nil or carries no path, when the
// path cannot be stat'ed, or when a directory cannot be measured. The error
// produced by integrityErr is returned when the payload is zero bytes
// ("empty") or falls more than 2% short of result.Size ("size_mismatch").
// The size comparison is skipped when result.Size is not positive, and a
// payload larger than expected is accepted.
func verify(result *Result) error {
	if result == nil || result.FilePath == "" {
		return fmt.Errorf("no file path in result")
	}
	target := result.FilePath

	info, statErr := os.Stat(target)
	if statErr != nil {
		return fmt.Errorf("file not found: %w", statErr)
	}

	// Multi-file torrents land as a directory, so measure the whole tree;
	// anything else is measured as a single file.
	onDisk := info.Size()
	if info.IsDir() {
		sum, walkErr := dirSize(target)
		if walkErr != nil {
			return fmt.Errorf("could not calculate dir size: %w", walkErr)
		}
		onDisk = sum
	}

	// Zero bytes is an integrity problem rather than a transport one: report
	// it as such so the caller can re-download instead of completing an empty
	// result.
	if onDisk == 0 {
		return integrityErr("empty", "download is empty: %s", target)
	}

	expected := result.Size
	if expected <= 0 {
		// Expected size unknown: nothing further to compare against.
		return nil
	}

	// Allow a 2% shortfall for container/muxing overhead. Anything smaller
	// than that floor is treated as a truncated or corrupt download.
	slack := int64(float64(expected) * 0.02)
	if floor := expected - slack; onDisk < floor {
		return integrityErr("size_mismatch", "size mismatch: expected %d, got %d", expected, onDisk)
	}
	return nil
}
// dirSize walks the tree rooted at path and adds up the size of every entry
// that is not a directory. Directories themselves contribute nothing.
//
// The first error reported during the walk aborts it and is returned
// together with whatever total had been accumulated up to that point.
func dirSize(path string) (int64, error) {
	var sum int64

	// visit is invoked once per entry; it forwards walk errors untouched and
	// only counts non-directory entries.
	visit := func(_ string, info os.FileInfo, walkErr error) error {
		switch {
		case walkErr != nil:
			return walkErr
		case info.IsDir():
			return nil
		}
		sum += info.Size()
		return nil
	}

	if err := filepath.Walk(path, visit); err != nil {
		return sum, err
	}
	return sum, nil
}