2022-01-08 17:17:01 +01:00
|
|
|
/*
|
|
|
|
GoToSocial
|
|
|
|
Copyright (C) 2021-2022 GoToSocial Authors admin@gotosocial.org
|
|
|
|
|
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU Affero General Public License as published by
|
|
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU Affero General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU Affero General Public License
|
|
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
2022-01-02 15:00:53 +01:00
|
|
|
package media
|
|
|
|
|
2022-01-03 17:37:38 +01:00
|
|
|
import (
|
2022-01-04 17:37:54 +01:00
|
|
|
"context"
|
2022-01-03 17:37:38 +01:00
|
|
|
"fmt"
|
2022-01-11 17:49:14 +01:00
|
|
|
"strings"
|
2022-01-03 17:37:38 +01:00
|
|
|
"sync"
|
2022-01-08 17:17:01 +01:00
|
|
|
"time"
|
2022-01-03 17:37:38 +01:00
|
|
|
|
2022-01-04 17:37:54 +01:00
|
|
|
"codeberg.org/gruf/go-store/kv"
|
|
|
|
"github.com/superseriousbusiness/gotosocial/internal/db"
|
2022-01-03 17:37:38 +01:00
|
|
|
"github.com/superseriousbusiness/gotosocial/internal/gtsmodel"
|
2022-01-11 17:49:14 +01:00
|
|
|
"github.com/superseriousbusiness/gotosocial/internal/id"
|
|
|
|
"github.com/superseriousbusiness/gotosocial/internal/uris"
|
2022-01-03 17:37:38 +01:00
|
|
|
)
|
2022-01-02 15:00:53 +01:00
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
// ProcessingMedia represents a piece of media that is currently being processed. It exposes
|
2022-01-10 18:36:09 +01:00
|
|
|
// various functions for retrieving data from the process.
|
2022-01-11 17:49:14 +01:00
|
|
|
type ProcessingMedia struct {
|
2022-01-04 17:37:54 +01:00
|
|
|
mu sync.Mutex
|
|
|
|
|
|
|
|
/*
|
|
|
|
below fields should be set on newly created media;
|
|
|
|
attachment will be updated incrementally as media goes through processing
|
|
|
|
*/
|
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
attachment *gtsmodel.MediaAttachment
|
|
|
|
data DataFunc
|
2022-01-09 18:41:22 +01:00
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
rawData []byte // will be set once the fetchRawData function has been called
|
2022-01-04 17:37:54 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
below fields represent the processing state of the media thumbnail
|
|
|
|
*/
|
|
|
|
|
2022-01-08 13:45:42 +01:00
|
|
|
thumbstate processState
|
|
|
|
thumb *ImageMeta
|
2022-01-04 17:37:54 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
below fields represent the processing state of the full-sized media
|
|
|
|
*/
|
|
|
|
|
2022-01-08 13:45:42 +01:00
|
|
|
fullSizeState processState
|
|
|
|
fullSize *ImageMeta
|
2022-01-04 17:37:54 +01:00
|
|
|
|
|
|
|
/*
|
|
|
|
below pointers to database and storage are maintained so that
|
|
|
|
the media can store and update itself during processing steps
|
|
|
|
*/
|
|
|
|
|
|
|
|
database db.DB
|
|
|
|
storage *kv.KVStore
|
|
|
|
|
|
|
|
err error // error created during processing, if any
|
2022-01-15 17:36:15 +01:00
|
|
|
|
|
|
|
// track whether this media has already been put in the databse
|
|
|
|
insertedInDB bool
|
2022-01-03 17:37:38 +01:00
|
|
|
}
|
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
// AttachmentID returns the ID of the underlying media attachment without blocking processing.
|
|
|
|
func (p *ProcessingMedia) AttachmentID() string {
|
|
|
|
return p.attachment.ID
|
|
|
|
}
|
|
|
|
|
|
|
|
// LoadAttachment blocks until the thumbnail and fullsize content
|
|
|
|
// has been processed, and then returns the completed attachment.
|
|
|
|
func (p *ProcessingMedia) LoadAttachment(ctx context.Context) (*gtsmodel.MediaAttachment, error) {
|
|
|
|
if err := p.fetchRawData(ctx); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if _, err := p.loadThumb(ctx); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if _, err := p.loadFullSize(ctx); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2022-01-15 17:36:15 +01:00
|
|
|
// store the result in the database before returning it
|
|
|
|
p.mu.Lock()
|
|
|
|
defer p.mu.Unlock()
|
|
|
|
if !p.insertedInDB {
|
|
|
|
if err := p.database.Put(ctx, p.attachment); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
p.insertedInDB = true
|
|
|
|
}
|
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
return p.attachment, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Finished returns true if processing has finished for both the thumbnail
|
|
|
|
// and full fized version of this piece of media.
|
|
|
|
func (p *ProcessingMedia) Finished() bool {
|
|
|
|
return p.thumbstate == complete && p.fullSizeState == complete
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *ProcessingMedia) loadThumb(ctx context.Context) (*ImageMeta, error) {
|
2022-01-10 18:36:09 +01:00
|
|
|
p.mu.Lock()
|
|
|
|
defer p.mu.Unlock()
|
2022-01-04 17:37:54 +01:00
|
|
|
|
2022-01-10 18:36:09 +01:00
|
|
|
switch p.thumbstate {
|
2022-01-04 17:37:54 +01:00
|
|
|
case received:
|
|
|
|
// we haven't processed a thumbnail for this media yet so do it now
|
2022-01-09 18:41:22 +01:00
|
|
|
|
|
|
|
// check if we need to create a blurhash or if there's already one set
|
|
|
|
var createBlurhash bool
|
2022-01-10 18:36:09 +01:00
|
|
|
if p.attachment.Blurhash == "" {
|
2022-01-09 18:41:22 +01:00
|
|
|
// no blurhash created yet
|
|
|
|
createBlurhash = true
|
|
|
|
}
|
|
|
|
|
2022-01-10 18:36:09 +01:00
|
|
|
thumb, err := deriveThumbnail(p.rawData, p.attachment.File.ContentType, createBlurhash)
|
2022-01-04 17:37:54 +01:00
|
|
|
if err != nil {
|
2022-01-10 18:36:09 +01:00
|
|
|
p.err = fmt.Errorf("error deriving thumbnail: %s", err)
|
|
|
|
p.thumbstate = errored
|
|
|
|
return nil, p.err
|
2022-01-04 17:37:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// put the thumbnail in storage
|
2022-01-10 18:36:09 +01:00
|
|
|
if err := p.storage.Put(p.attachment.Thumbnail.Path, thumb.image); err != nil {
|
|
|
|
p.err = fmt.Errorf("error storing thumbnail: %s", err)
|
|
|
|
p.thumbstate = errored
|
|
|
|
return nil, p.err
|
2022-01-04 17:37:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// set appropriate fields on the attachment based on the thumbnail we derived
|
2022-01-09 18:41:22 +01:00
|
|
|
if createBlurhash {
|
2022-01-10 18:36:09 +01:00
|
|
|
p.attachment.Blurhash = thumb.blurhash
|
2022-01-09 18:41:22 +01:00
|
|
|
}
|
|
|
|
|
2022-01-10 18:36:09 +01:00
|
|
|
p.attachment.FileMeta.Small = gtsmodel.Small{
|
2022-01-04 17:37:54 +01:00
|
|
|
Width: thumb.width,
|
|
|
|
Height: thumb.height,
|
|
|
|
Size: thumb.size,
|
|
|
|
Aspect: thumb.aspect,
|
|
|
|
}
|
2022-01-15 14:33:58 +01:00
|
|
|
p.attachment.Thumbnail.FileSize = len(thumb.image)
|
2022-01-04 17:37:54 +01:00
|
|
|
|
|
|
|
// set the thumbnail of this media
|
2022-01-10 18:36:09 +01:00
|
|
|
p.thumb = thumb
|
2022-01-04 17:37:54 +01:00
|
|
|
|
|
|
|
// we're done processing the thumbnail!
|
2022-01-10 18:36:09 +01:00
|
|
|
p.thumbstate = complete
|
2022-01-04 17:37:54 +01:00
|
|
|
fallthrough
|
|
|
|
case complete:
|
2022-01-10 18:36:09 +01:00
|
|
|
return p.thumb, nil
|
2022-01-04 17:37:54 +01:00
|
|
|
case errored:
|
2022-01-10 18:36:09 +01:00
|
|
|
return nil, p.err
|
2022-01-04 17:37:54 +01:00
|
|
|
}
|
|
|
|
|
2022-01-10 18:36:09 +01:00
|
|
|
return nil, fmt.Errorf("thumbnail processing status %d unknown", p.thumbstate)
|
2022-01-04 17:37:54 +01:00
|
|
|
}
|
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
func (p *ProcessingMedia) loadFullSize(ctx context.Context) (*ImageMeta, error) {
|
2022-01-10 18:36:09 +01:00
|
|
|
p.mu.Lock()
|
|
|
|
defer p.mu.Unlock()
|
2022-01-08 13:45:42 +01:00
|
|
|
|
2022-01-10 18:36:09 +01:00
|
|
|
switch p.fullSizeState {
|
2022-01-08 13:45:42 +01:00
|
|
|
case received:
|
|
|
|
var clean []byte
|
|
|
|
var err error
|
|
|
|
var decoded *ImageMeta
|
|
|
|
|
2022-01-10 18:36:09 +01:00
|
|
|
ct := p.attachment.File.ContentType
|
2022-01-08 13:45:42 +01:00
|
|
|
switch ct {
|
|
|
|
case mimeImageJpeg, mimeImagePng:
|
|
|
|
// first 'clean' image by purging exif data from it
|
|
|
|
var exifErr error
|
2022-01-10 18:36:09 +01:00
|
|
|
if clean, exifErr = purgeExif(p.rawData); exifErr != nil {
|
2022-01-08 13:45:42 +01:00
|
|
|
err = exifErr
|
|
|
|
break
|
|
|
|
}
|
|
|
|
decoded, err = decodeImage(clean, ct)
|
|
|
|
case mimeImageGif:
|
|
|
|
// gifs are already clean - no exif data to remove
|
2022-01-10 18:36:09 +01:00
|
|
|
clean = p.rawData
|
2022-01-08 13:45:42 +01:00
|
|
|
decoded, err = decodeGif(clean)
|
|
|
|
default:
|
|
|
|
err = fmt.Errorf("content type %s not a processible image type", ct)
|
2022-01-04 17:37:54 +01:00
|
|
|
}
|
|
|
|
|
2022-01-08 13:45:42 +01:00
|
|
|
if err != nil {
|
2022-01-10 18:36:09 +01:00
|
|
|
p.err = err
|
|
|
|
p.fullSizeState = errored
|
2022-01-08 13:45:42 +01:00
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2022-01-08 17:17:01 +01:00
|
|
|
// put the full size in storage
|
2022-01-10 18:36:09 +01:00
|
|
|
if err := p.storage.Put(p.attachment.File.Path, decoded.image); err != nil {
|
|
|
|
p.err = fmt.Errorf("error storing full size image: %s", err)
|
|
|
|
p.fullSizeState = errored
|
|
|
|
return nil, p.err
|
2022-01-08 17:17:01 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// set appropriate fields on the attachment based on the image we derived
|
2022-01-10 18:36:09 +01:00
|
|
|
p.attachment.FileMeta.Original = gtsmodel.Original{
|
2022-01-08 17:17:01 +01:00
|
|
|
Width: decoded.width,
|
|
|
|
Height: decoded.height,
|
|
|
|
Size: decoded.size,
|
|
|
|
Aspect: decoded.aspect,
|
|
|
|
}
|
2022-01-15 14:33:58 +01:00
|
|
|
p.attachment.File.FileSize = len(decoded.image)
|
2022-01-10 18:36:09 +01:00
|
|
|
p.attachment.File.UpdatedAt = time.Now()
|
|
|
|
p.attachment.Processing = gtsmodel.ProcessingStatusProcessed
|
2022-01-08 17:17:01 +01:00
|
|
|
|
2022-01-08 13:45:42 +01:00
|
|
|
// set the fullsize of this media
|
2022-01-10 18:36:09 +01:00
|
|
|
p.fullSize = decoded
|
2022-01-08 13:45:42 +01:00
|
|
|
|
|
|
|
// we're done processing the full-size image
|
2022-01-10 18:36:09 +01:00
|
|
|
p.fullSizeState = complete
|
2022-01-08 13:45:42 +01:00
|
|
|
fallthrough
|
|
|
|
case complete:
|
2022-01-10 18:36:09 +01:00
|
|
|
return p.fullSize, nil
|
2022-01-08 13:45:42 +01:00
|
|
|
case errored:
|
2022-01-10 18:36:09 +01:00
|
|
|
return nil, p.err
|
2022-01-03 17:37:38 +01:00
|
|
|
}
|
2022-01-04 17:37:54 +01:00
|
|
|
|
2022-01-10 18:36:09 +01:00
|
|
|
return nil, fmt.Errorf("full size processing status %d unknown", p.fullSizeState)
|
2022-01-03 17:37:38 +01:00
|
|
|
}
|
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
// fetchRawData calls the data function attached to p if it hasn't been called yet,
|
|
|
|
// and updates the underlying attachment fields as necessary.
|
|
|
|
// It should only be called from within a function that already has a lock on p!
|
|
|
|
func (p *ProcessingMedia) fetchRawData(ctx context.Context) error {
|
|
|
|
// check if we've already done this and bail early if we have
|
|
|
|
if p.rawData != nil {
|
|
|
|
return nil
|
|
|
|
}
|
2022-01-08 17:17:01 +01:00
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
// execute the data function and pin the raw bytes for further processing
|
|
|
|
b, err := p.data(ctx)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("fetchRawData: error executing data function: %s", err)
|
2022-01-08 13:45:42 +01:00
|
|
|
}
|
2022-01-11 17:49:14 +01:00
|
|
|
p.rawData = b
|
2022-01-08 13:45:42 +01:00
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
// now we have the data we can work out the content type
|
|
|
|
contentType, err := parseContentType(p.rawData)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("fetchRawData: error parsing content type: %s", err)
|
2022-01-08 13:45:42 +01:00
|
|
|
}
|
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
split := strings.Split(contentType, "/")
|
|
|
|
if len(split) != 2 {
|
|
|
|
return fmt.Errorf("fetchRawData: content type %s was not valid", contentType)
|
|
|
|
}
|
2022-01-08 17:17:01 +01:00
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
mainType := split[0] // something like 'image'
|
|
|
|
extension := split[1] // something like 'jpeg'
|
|
|
|
|
|
|
|
// set some additional fields on the attachment now that
|
|
|
|
// we know more about what the underlying media actually is
|
|
|
|
p.attachment.URL = uris.GenerateURIForAttachment(p.attachment.AccountID, string(TypeAttachment), string(SizeOriginal), p.attachment.ID, extension)
|
|
|
|
p.attachment.File.Path = fmt.Sprintf("%s/%s/%s/%s.%s", p.attachment.AccountID, TypeAttachment, SizeOriginal, p.attachment.ID, extension)
|
|
|
|
p.attachment.File.ContentType = contentType
|
|
|
|
|
|
|
|
switch mainType {
|
|
|
|
case mimeImage:
|
|
|
|
if extension == mimeGif {
|
|
|
|
p.attachment.Type = gtsmodel.FileTypeGif
|
|
|
|
} else {
|
|
|
|
p.attachment.Type = gtsmodel.FileTypeImage
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
return fmt.Errorf("fetchRawData: cannot process mime type %s (yet)", mainType)
|
|
|
|
}
|
2022-01-08 17:17:01 +01:00
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
return nil
|
2022-01-10 18:36:09 +01:00
|
|
|
}
|
|
|
|
|
2022-01-11 17:49:14 +01:00
|
|
|
func (m *manager) preProcessMedia(ctx context.Context, data DataFunc, accountID string, ai *AdditionalMediaInfo) (*ProcessingMedia, error) {
|
|
|
|
id, err := id.NewRandomULID()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
file := gtsmodel.File{
|
|
|
|
Path: "", // we don't know yet because it depends on the uncalled DataFunc
|
|
|
|
ContentType: "", // we don't know yet because it depends on the uncalled DataFunc
|
|
|
|
UpdatedAt: time.Now(),
|
|
|
|
}
|
|
|
|
|
|
|
|
thumbnail := gtsmodel.Thumbnail{
|
|
|
|
URL: uris.GenerateURIForAttachment(accountID, string(TypeAttachment), string(SizeSmall), id, mimeJpeg), // all thumbnails are encoded as jpeg,
|
|
|
|
Path: fmt.Sprintf("%s/%s/%s/%s.%s", accountID, TypeAttachment, SizeSmall, id, mimeJpeg), // all thumbnails are encoded as jpeg,
|
|
|
|
ContentType: mimeJpeg,
|
|
|
|
UpdatedAt: time.Now(),
|
|
|
|
}
|
|
|
|
|
|
|
|
// populate initial fields on the media attachment -- some of these will be overwritten as we proceed
|
|
|
|
attachment := >smodel.MediaAttachment{
|
|
|
|
ID: id,
|
|
|
|
CreatedAt: time.Now(),
|
|
|
|
UpdatedAt: time.Now(),
|
|
|
|
StatusID: "",
|
|
|
|
URL: "", // we don't know yet because it depends on the uncalled DataFunc
|
|
|
|
RemoteURL: "",
|
|
|
|
Type: gtsmodel.FileTypeUnknown, // we don't know yet because it depends on the uncalled DataFunc
|
|
|
|
FileMeta: gtsmodel.FileMeta{},
|
|
|
|
AccountID: accountID,
|
|
|
|
Description: "",
|
|
|
|
ScheduledStatusID: "",
|
|
|
|
Blurhash: "",
|
|
|
|
Processing: gtsmodel.ProcessingStatusReceived,
|
|
|
|
File: file,
|
|
|
|
Thumbnail: thumbnail,
|
|
|
|
Avatar: false,
|
|
|
|
Header: false,
|
|
|
|
}
|
|
|
|
|
|
|
|
// check if we have additional info to add to the attachment,
|
|
|
|
// and overwrite some of the attachment fields if so
|
|
|
|
if ai != nil {
|
|
|
|
if ai.CreatedAt != nil {
|
|
|
|
attachment.CreatedAt = *ai.CreatedAt
|
|
|
|
}
|
|
|
|
|
|
|
|
if ai.StatusID != nil {
|
|
|
|
attachment.StatusID = *ai.StatusID
|
|
|
|
}
|
|
|
|
|
|
|
|
if ai.RemoteURL != nil {
|
|
|
|
attachment.RemoteURL = *ai.RemoteURL
|
|
|
|
}
|
|
|
|
|
|
|
|
if ai.Description != nil {
|
|
|
|
attachment.Description = *ai.Description
|
|
|
|
}
|
|
|
|
|
|
|
|
if ai.ScheduledStatusID != nil {
|
|
|
|
attachment.ScheduledStatusID = *ai.ScheduledStatusID
|
|
|
|
}
|
|
|
|
|
|
|
|
if ai.Blurhash != nil {
|
|
|
|
attachment.Blurhash = *ai.Blurhash
|
|
|
|
}
|
|
|
|
|
|
|
|
if ai.Avatar != nil {
|
|
|
|
attachment.Avatar = *ai.Avatar
|
|
|
|
}
|
|
|
|
|
|
|
|
if ai.Header != nil {
|
|
|
|
attachment.Header = *ai.Header
|
|
|
|
}
|
|
|
|
|
|
|
|
if ai.FocusX != nil {
|
|
|
|
attachment.FileMeta.Focus.X = *ai.FocusX
|
|
|
|
}
|
|
|
|
|
|
|
|
if ai.FocusY != nil {
|
|
|
|
attachment.FileMeta.Focus.Y = *ai.FocusY
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
processingMedia := &ProcessingMedia{
|
|
|
|
attachment: attachment,
|
|
|
|
data: data,
|
|
|
|
thumbstate: received,
|
|
|
|
fullSizeState: received,
|
|
|
|
database: m.db,
|
|
|
|
storage: m.storage,
|
|
|
|
}
|
|
|
|
|
|
|
|
return processingMedia, nil
|
|
|
|
}
|