mirror of
https://github.com/superseriousbusiness/gotosocial.git
synced 2024-12-27 09:36:31 +00:00
368c97f0f8
* take into account rotation when generating thumbnail, simplify ffprobe output to show only fields we need * only show rotation side data * remove unnecessary comment * fix code comments * remove debug logging
568 lines
14 KiB
Go
568 lines
14 KiB
Go
// GoToSocial
|
|
// Copyright (C) GoToSocial Authors admin@gotosocial.org
|
|
// SPDX-License-Identifier: AGPL-3.0-or-later
|
|
//
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
//
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Affero General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
package media
|
|
|
|
import (
|
|
"context"
|
|
"encoding/json"
|
|
"errors"
|
|
"os"
|
|
"path"
|
|
"strconv"
|
|
"strings"
|
|
|
|
"codeberg.org/gruf/go-byteutil"
|
|
|
|
"codeberg.org/gruf/go-ffmpreg/wasm"
|
|
_ffmpeg "github.com/superseriousbusiness/gotosocial/internal/media/ffmpeg"
|
|
|
|
"github.com/superseriousbusiness/gotosocial/internal/gtserror"
|
|
"github.com/superseriousbusiness/gotosocial/internal/gtsmodel"
|
|
"github.com/tetratelabs/wazero"
|
|
)
|
|
|
|
// ffmpegClearMetadata generates a copy (in-place) of input media with all metadata cleared.
|
|
func ffmpegClearMetadata(ctx context.Context, filepath string) error {
|
|
var outpath string
|
|
|
|
// Get directory from filepath.
|
|
dirpath := path.Dir(filepath)
|
|
|
|
// Generate cleaned output path MAINTAINING extension.
|
|
if i := strings.IndexByte(filepath, '.'); i != -1 {
|
|
outpath = filepath[:i] + "_cleaned" + filepath[i:]
|
|
} else {
|
|
return gtserror.New("input file missing extension")
|
|
}
|
|
|
|
// Clear metadata with ffmpeg.
|
|
if err := ffmpeg(ctx, dirpath,
|
|
|
|
// Only log errors.
|
|
"-loglevel", "error",
|
|
|
|
// Input file path.
|
|
"-i", filepath,
|
|
|
|
// Drop all metadata.
|
|
"-map_metadata", "-1",
|
|
|
|
// Copy input codecs,
|
|
// i.e. no transcode.
|
|
"-codec", "copy",
|
|
|
|
// Overwrite.
|
|
"-y",
|
|
|
|
// Output.
|
|
outpath,
|
|
); err != nil {
|
|
return err
|
|
}
|
|
|
|
// Move the new output file path to original location.
|
|
if err := os.Rename(outpath, filepath); err != nil {
|
|
return gtserror.Newf("error renaming %s -> %s: %w", outpath, filepath, err)
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// ffmpegGenerateThumb generates a thumbnail webp from input media of any type, useful for any media.
|
|
func ffmpegGenerateThumb(ctx context.Context, filepath string, width, height int) (string, error) {
|
|
var outpath string
|
|
|
|
// Generate thumb output path REPLACING extension.
|
|
if i := strings.IndexByte(filepath, '.'); i != -1 {
|
|
outpath = filepath[:i] + "_thumb.webp"
|
|
} else {
|
|
return "", gtserror.New("input file missing extension")
|
|
}
|
|
|
|
// Get directory from filepath.
|
|
dirpath := path.Dir(filepath)
|
|
|
|
// Thumbnail size scaling argument.
|
|
scale := strconv.Itoa(width) + ":" +
|
|
strconv.Itoa(height)
|
|
|
|
// Generate thumb with ffmpeg.
|
|
if err := ffmpeg(ctx, dirpath,
|
|
|
|
// Only log errors.
|
|
"-loglevel", "error",
|
|
|
|
// Input file.
|
|
"-i", filepath,
|
|
|
|
// Encode using libwebp.
|
|
// (NOT as libwebp_anim).
|
|
"-codec:v", "libwebp",
|
|
|
|
// Select thumb from first 10 frames
|
|
// (thumb filter: https://ffmpeg.org/ffmpeg-filters.html#thumbnail)
|
|
"-filter:v", "thumbnail=n=10,"+
|
|
|
|
// scale to dimensions
|
|
// (scale filter: https://ffmpeg.org/ffmpeg-filters.html#scale)
|
|
"scale="+scale+","+
|
|
|
|
// YUVA 4:2:0 pixel format
|
|
// (format filter: https://ffmpeg.org/ffmpeg-filters.html#format)
|
|
"format=pix_fmts=yuva420p",
|
|
|
|
// Only one frame
|
|
"-frames:v", "1",
|
|
|
|
// ~40% webp quality
|
|
// (codec options: https://ffmpeg.org/ffmpeg-codecs.html#toc-Codec-Options)
|
|
// (libwebp codec: https://ffmpeg.org/ffmpeg-codecs.html#Options-36)
|
|
"-qscale:v", "40",
|
|
|
|
// Overwrite.
|
|
"-y",
|
|
|
|
// Output.
|
|
outpath,
|
|
); err != nil {
|
|
return "", err
|
|
}
|
|
|
|
return outpath, nil
|
|
}
|
|
|
|
// ffmpegGenerateStatic generates a static png from input image of any type, useful for emoji.
|
|
func ffmpegGenerateStatic(ctx context.Context, filepath string) (string, error) {
|
|
var outpath string
|
|
|
|
// Generate thumb output path REPLACING extension.
|
|
if i := strings.IndexByte(filepath, '.'); i != -1 {
|
|
outpath = filepath[:i] + "_static.png"
|
|
} else {
|
|
return "", gtserror.New("input file missing extension")
|
|
}
|
|
|
|
// Get directory from filepath.
|
|
dirpath := path.Dir(filepath)
|
|
|
|
// Generate static with ffmpeg.
|
|
if err := ffmpeg(ctx, dirpath,
|
|
|
|
// Only log errors.
|
|
"-loglevel", "error",
|
|
|
|
// Input file.
|
|
"-i", filepath,
|
|
|
|
// Only first frame.
|
|
"-frames:v", "1",
|
|
|
|
// Encode using png.
|
|
// (NOT as apng).
|
|
"-codec:v", "png",
|
|
|
|
// Overwrite.
|
|
"-y",
|
|
|
|
// Output.
|
|
outpath,
|
|
); err != nil {
|
|
return "", err
|
|
}
|
|
|
|
return outpath, nil
|
|
}
|
|
|
|
// ffmpeg calls `ffmpeg [args...]` (WASM) with directory path mounted in runtime.
|
|
func ffmpeg(ctx context.Context, dirpath string, args ...string) error {
|
|
var stderr byteutil.Buffer
|
|
rc, err := _ffmpeg.Ffmpeg(ctx, wasm.Args{
|
|
Stderr: &stderr,
|
|
Args: args,
|
|
Config: func(modcfg wazero.ModuleConfig) wazero.ModuleConfig {
|
|
fscfg := wazero.NewFSConfig() // needs /dev/urandom
|
|
fscfg = fscfg.WithReadOnlyDirMount("/dev", "/dev")
|
|
fscfg = fscfg.WithDirMount(dirpath, dirpath)
|
|
modcfg = modcfg.WithFSConfig(fscfg)
|
|
return modcfg
|
|
},
|
|
})
|
|
if err != nil {
|
|
return gtserror.Newf("error running: %w", err)
|
|
} else if rc != 0 {
|
|
return gtserror.Newf("non-zero return code %d (%s)", rc, stderr.B)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// ffprobe calls `ffprobe` (WASM) on filepath, returning parsed JSON output.
|
|
func ffprobe(ctx context.Context, filepath string) (*result, error) {
|
|
var stdout byteutil.Buffer
|
|
|
|
// Get directory from filepath.
|
|
dirpath := path.Dir(filepath)
|
|
|
|
// Run ffprobe on our given file at path.
|
|
_, err := _ffmpeg.Ffprobe(ctx, wasm.Args{
|
|
Stdout: &stdout,
|
|
|
|
Args: []string{
|
|
// Don't show any excess logging
|
|
// information, all goes in JSON.
|
|
"-loglevel", "quiet",
|
|
|
|
// Print in compact JSON format.
|
|
"-print_format", "json=compact=1",
|
|
|
|
// Show error in our
|
|
// chosen format type.
|
|
"-show_error",
|
|
|
|
// Show specifically container format, total duration and bitrate.
|
|
"-show_entries", "format=format_name,duration,bit_rate" + ":" +
|
|
|
|
// Show specifically stream codec names, types, frame rate, duration and dimens.
|
|
"stream=codec_name,codec_type,r_frame_rate,duration_ts,width,height" + ":" +
|
|
|
|
// Show any rotation
|
|
// side data stored.
|
|
"side_data=rotation",
|
|
|
|
// Input file.
|
|
"-i", filepath,
|
|
},
|
|
|
|
Config: func(modcfg wazero.ModuleConfig) wazero.ModuleConfig {
|
|
fscfg := wazero.NewFSConfig()
|
|
fscfg = fscfg.WithReadOnlyDirMount(dirpath, dirpath)
|
|
modcfg = modcfg.WithFSConfig(fscfg)
|
|
return modcfg
|
|
},
|
|
})
|
|
if err != nil {
|
|
return nil, gtserror.Newf("error running: %w", err)
|
|
}
|
|
|
|
var result ffprobeResult
|
|
|
|
// Unmarshal the ffprobe output as our result type.
|
|
if err := json.Unmarshal(stdout.B, &result); err != nil {
|
|
return nil, gtserror.Newf("error unmarshaling json: %w", err)
|
|
}
|
|
|
|
// Convert raw result data.
|
|
res, err := result.Process()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return res, nil
|
|
}
|
|
|
|
// result contains parsed ffprobe result
|
|
// data in a more useful data format.
|
|
type result struct {
|
|
format string
|
|
audio []audioStream
|
|
video []videoStream
|
|
duration float64
|
|
bitrate uint64
|
|
rotation int
|
|
}
|
|
|
|
type stream struct {
|
|
codec string
|
|
}
|
|
|
|
type audioStream struct {
|
|
stream
|
|
}
|
|
|
|
type videoStream struct {
|
|
stream
|
|
width int
|
|
height int
|
|
framerate float32
|
|
}
|
|
|
|
// GetFileType determines file type and extension to use for media data. This
|
|
// function helps to abstract away the horrible complexities that are possible
|
|
// media container (i.e. the file) types and and possible sub-types within that.
|
|
//
|
|
// Note the checks for (len(res.video) > 0) may catch some audio files with embedded
|
|
// album art as video, but i blame that on the hellscape that is media filetypes.
|
|
//
|
|
// TODO: we can update this code to also return a mimetype and avoid later parsing!
|
|
func (res *result) GetFileType() (gtsmodel.FileType, string) {
|
|
switch res.format {
|
|
case "mpeg":
|
|
return gtsmodel.FileTypeVideo, "mpeg"
|
|
case "mjpeg":
|
|
return gtsmodel.FileTypeVideo, "mjpeg"
|
|
case "mov,mp4,m4a,3gp,3g2,mj2":
|
|
switch {
|
|
case len(res.video) > 0:
|
|
return gtsmodel.FileTypeVideo, "mp4"
|
|
case len(res.audio) > 0 &&
|
|
res.audio[0].codec == "aac":
|
|
// m4a only supports [aac] audio.
|
|
return gtsmodel.FileTypeAudio, "m4a"
|
|
}
|
|
case "apng":
|
|
return gtsmodel.FileTypeImage, "apng"
|
|
case "png_pipe":
|
|
return gtsmodel.FileTypeImage, "png"
|
|
case "image2", "image2pipe", "jpeg_pipe":
|
|
return gtsmodel.FileTypeImage, "jpeg"
|
|
case "webp", "webp_pipe":
|
|
return gtsmodel.FileTypeImage, "webp"
|
|
case "gif":
|
|
return gtsmodel.FileTypeImage, "gif"
|
|
case "mp3":
|
|
if len(res.audio) > 0 {
|
|
switch res.audio[0].codec {
|
|
case "mp2":
|
|
return gtsmodel.FileTypeAudio, "mp2"
|
|
case "mp3":
|
|
return gtsmodel.FileTypeAudio, "mp3"
|
|
}
|
|
}
|
|
case "asf":
|
|
switch {
|
|
case len(res.video) > 0:
|
|
return gtsmodel.FileTypeVideo, "wmv"
|
|
case len(res.audio) > 0:
|
|
return gtsmodel.FileTypeAudio, "wma"
|
|
}
|
|
case "ogg":
|
|
switch {
|
|
case len(res.video) > 0:
|
|
return gtsmodel.FileTypeVideo, "ogv"
|
|
case len(res.audio) > 0:
|
|
return gtsmodel.FileTypeAudio, "ogg"
|
|
}
|
|
case "matroska,webm":
|
|
switch {
|
|
case len(res.video) > 0:
|
|
switch res.video[0].codec {
|
|
case "vp8", "vp9", "av1":
|
|
default:
|
|
return gtsmodel.FileTypeVideo, "mkv"
|
|
}
|
|
if len(res.audio) > 0 {
|
|
switch res.audio[0].codec {
|
|
case "vorbis", "opus", "libopus":
|
|
// webm only supports [VP8/VP9/AV1]+[vorbis/opus]
|
|
return gtsmodel.FileTypeVideo, "webm"
|
|
}
|
|
}
|
|
case len(res.audio) > 0:
|
|
return gtsmodel.FileTypeAudio, "mka"
|
|
}
|
|
case "avi":
|
|
return gtsmodel.FileTypeVideo, "avi"
|
|
case "flac":
|
|
return gtsmodel.FileTypeAudio, "flac"
|
|
}
|
|
return gtsmodel.FileTypeUnknown, res.format
|
|
}
|
|
|
|
// ImageMeta extracts image metadata contained within ffprobe'd media result streams.
|
|
func (res *result) ImageMeta() (width int, height int, framerate float32) {
|
|
for _, stream := range res.video {
|
|
if stream.width > width {
|
|
width = stream.width
|
|
}
|
|
if stream.height > height {
|
|
height = stream.height
|
|
}
|
|
if fr := float32(stream.framerate); fr > 0 {
|
|
if framerate == 0 || fr < framerate {
|
|
framerate = fr
|
|
}
|
|
}
|
|
}
|
|
return
|
|
}
|
|
|
|
// Process converts raw ffprobe result data into our more usable result{} type.
|
|
func (res *ffprobeResult) Process() (*result, error) {
|
|
if res.Error != nil {
|
|
return nil, res.Error
|
|
}
|
|
|
|
if res.Format == nil {
|
|
return nil, errors.New("missing format data")
|
|
}
|
|
|
|
var r result
|
|
var err error
|
|
|
|
// Copy over container format.
|
|
r.format = res.Format.FormatName
|
|
|
|
// Parsed media bitrate (if it was set).
|
|
if str := res.Format.BitRate; str != "" {
|
|
r.bitrate, err = strconv.ParseUint(str, 10, 64)
|
|
if err != nil {
|
|
return nil, gtserror.Newf("invalid bitrate %s: %w", str, err)
|
|
}
|
|
}
|
|
|
|
// Parse media duration (if it was set).
|
|
if str := res.Format.Duration; str != "" {
|
|
r.duration, err = strconv.ParseFloat(str, 32)
|
|
if err != nil {
|
|
return nil, gtserror.Newf("invalid duration %s: %w", str, err)
|
|
}
|
|
}
|
|
|
|
// Preallocate streams to max possible lengths.
|
|
r.audio = make([]audioStream, 0, len(res.Streams))
|
|
r.video = make([]videoStream, 0, len(res.Streams))
|
|
|
|
// Convert streams to separate types.
|
|
for _, s := range res.Streams {
|
|
switch s.CodecType {
|
|
case "audio":
|
|
// Append audio stream data to result.
|
|
r.audio = append(r.audio, audioStream{
|
|
stream: stream{codec: s.CodecName},
|
|
})
|
|
case "video":
|
|
var framerate float32
|
|
|
|
// Parse stream framerate, bearing in
|
|
// mind that some static container formats
|
|
// (e.g. jpeg) still return a framerate, so
|
|
// we also check for a non-1 timebase (dts).
|
|
if str := s.RFrameRate; str != "" &&
|
|
s.DurationTS > 1 {
|
|
var num, den uint32
|
|
den = 1
|
|
|
|
// Check for inequality (numerator / denominator).
|
|
if p := strings.SplitN(str, "/", 2); len(p) == 2 {
|
|
n, _ := strconv.ParseUint(p[0], 10, 32)
|
|
d, _ := strconv.ParseUint(p[1], 10, 32)
|
|
num, den = uint32(n), uint32(d)
|
|
} else {
|
|
n, _ := strconv.ParseUint(p[0], 10, 32)
|
|
num = uint32(n)
|
|
}
|
|
|
|
// Set final divised framerate.
|
|
framerate = float32(num / den)
|
|
}
|
|
|
|
// Append video stream data to result.
|
|
r.video = append(r.video, videoStream{
|
|
stream: stream{codec: s.CodecName},
|
|
width: s.Width,
|
|
height: s.Height,
|
|
framerate: framerate,
|
|
})
|
|
}
|
|
}
|
|
|
|
// Check extra packet / frame information
|
|
// for provided orientation (not always set).
|
|
for _, pf := range res.PacketsAndFrames {
|
|
for _, d := range pf.SideDataList {
|
|
|
|
// Ensure frame side
|
|
// data IS rotation data.
|
|
if d.Rotation == 0 {
|
|
continue
|
|
}
|
|
|
|
// Ensure rotation not
|
|
// already been specified.
|
|
if r.rotation != 0 {
|
|
return nil, errors.New("multiple sets of rotation data")
|
|
}
|
|
|
|
// Drop any decimal
|
|
// rotation value.
|
|
rot := int(d.Rotation)
|
|
|
|
// Round rotation to multiple of 90.
|
|
// More granularity is not needed.
|
|
if q := rot % 90; q > 45 {
|
|
rot += (90 - q)
|
|
} else {
|
|
rot -= q
|
|
}
|
|
|
|
// Drop any value above 360
|
|
// or below -360, these are
|
|
// just repeat full turns.
|
|
r.rotation = (rot % 360)
|
|
}
|
|
}
|
|
|
|
return &r, nil
|
|
}
|
|
|
|
// ffprobeResult contains parsed JSON data from
|
|
// result of calling `ffprobe` on a media file.
|
|
type ffprobeResult struct {
|
|
PacketsAndFrames []ffprobePacketOrFrame `json:"packets_and_frames"`
|
|
Streams []ffprobeStream `json:"streams"`
|
|
Format *ffprobeFormat `json:"format"`
|
|
Error *ffprobeError `json:"error"`
|
|
}
|
|
|
|
type ffprobePacketOrFrame struct {
|
|
Type string `json:"type"`
|
|
SideDataList []ffprobeSideData `json:"side_data_list"`
|
|
}
|
|
|
|
type ffprobeSideData struct {
|
|
Rotation float64 `json:"rotation"`
|
|
}
|
|
|
|
type ffprobeStream struct {
|
|
CodecName string `json:"codec_name"`
|
|
CodecType string `json:"codec_type"`
|
|
RFrameRate string `json:"r_frame_rate"`
|
|
DurationTS uint `json:"duration_ts"`
|
|
Width int `json:"width"`
|
|
Height int `json:"height"`
|
|
}
|
|
|
|
type ffprobeFormat struct {
|
|
FormatName string `json:"format_name"`
|
|
Duration string `json:"duration"`
|
|
BitRate string `json:"bit_rate"`
|
|
}
|
|
|
|
type ffprobeError struct {
|
|
Code int `json:"code"`
|
|
String string `json:"string"`
|
|
}
|
|
|
|
func isUnsupportedTypeErr(err error) bool {
|
|
ffprobeErr, ok := err.(*ffprobeError)
|
|
return ok && ffprobeErr.Code == -1094995529
|
|
}
|
|
|
|
func (err *ffprobeError) Error() string {
|
|
return err.String + " (" + strconv.Itoa(err.Code) + ")"
|
|
}
|