Files
webarchive/entity/page.go
2023-03-26 16:11:00 +03:00

100 lines
1.7 KiB
Go

package entity
import (
"context"
"fmt"
"sync"
"time"
"github.com/google/uuid"
)
type Processor interface {
Process(ctx context.Context, format Format, url string) Result
}
type Format uint8
const (
FormatHeaders Format = iota
FormatSingleFile
FormatPDF
)
type Status uint8
const (
StatusNew Status = iota
StatusProcessing
StatusDone
StatusFailed
StatusWithErrors
)
func NewPage(url string, description string, formats ...Format) *Page {
return &Page{
ID: uuid.New(),
URL: url,
Description: description,
Formats: formats,
Created: time.Now(),
Version: 1,
}
}
type Page struct {
ID uuid.UUID
URL string
Description string
Created time.Time
Formats []Format
Results Results
Version uint16
Status Status
}
func (p *Page) SetProcessing() {
p.Status = StatusProcessing
}
func (p *Page) Process(ctx context.Context, wg *sync.WaitGroup, processor Processor) {
defer wg.Done()
innerWG := sync.WaitGroup{}
innerWG.Add(len(p.Formats))
for _, format := range p.Formats {
go func(format Format) {
defer innerWG.Done()
defer func() {
if err := recover(); err != nil {
p.Results.Add(Result{Format: format, Err: fmt.Errorf("recovered from panic: %v", err)})
}
}()
result := processor.Process(ctx, format, p.URL)
p.Results.Add(result)
}(format)
}
var hasResultWithOutErrors bool
for _, result := range p.Results.Results() {
if result.Err != nil {
p.Status = StatusWithErrors
} else {
hasResultWithOutErrors = true
}
}
if !hasResultWithOutErrors {
p.Status = StatusFailed
}
if p.Status == StatusProcessing {
p.Status = StatusDone
}
innerWG.Wait()
}