依 R5 五輪決策把 visionA-local 從「Wails 內嵌 Next.js」重構為「Wails
本機伺服器控制台 + 瀏覽器 Web UI」模式(類比 Docker Desktop / Ollama)。
程式碼變動
- M8-1 砍 yt-dlp 全套(後端 resolver / URL handler / 前端 URL tab /
Makefile vendor / installer / bootstrap / CI workflow,-555 行)
- M8-2 砍 Mock 模式全套(driver/mock、mock_camera、Settings runtimeMode、
VISIONA_MOCK 環境變數,-528 行)
- M8-3 ffmpeg 從 GPL 切換到 LGPL 混合方案:Windows/Linux 用 BtbN 現成
LGPL binary,macOS 自 build minimal decoder-only 進 git
(vendor/ffmpeg/macos/ffmpeg 5.7MB + ffprobe 5.6MB,比 GPL 版省 85% 空間)
- M8-4 Wails Server Controller:state machine、log ring buffer 2000 行、
preferences.json atomic write、boot-id、Gin SkipPaths、shutdown 7+1 秒、
notify_*.go 三平台 OS 通知、watchServer 改 Error state 不 os.Exit
- M8-4b 啟動階段管線 R5-E:6 階段進度 event、20s soft / 60s hard timeout、
stage 5/6 skip 規則、sentinel file、RestartStartupSequence 5 步驟
- M8-5 Wails 控制台 vanilla HTML/JS/CSS(9 檔 ~2012 行)取代 M7-B splash:
state 視覺、log panel、startup progress panel、Stage 6 manual CTA
pulse、shutdown modal、Settings、Dark Mode、i18n 中英雙語
- M8-6 上傳影片副檔名擴充(mp4/avi/mov/mpeg/mpg)
- M8-7 Web UI Server Offline Overlay(role=alertdialog + focus trap +
wsEverConnected 容錯 + Page Visibility)
- M8-8 CORS middleware(127.0.0.1/localhost only + suffix attack 防護)+
ws/origin.go 獨立 WebSocket CheckOrigin 避 package cycle
- MAJ-4 server:shutdown-imminent WebSocket broadcast 機制
(/ws/system endpoint + notifyShutdownImminent helper)
- M8-9 Boot-ID + 瀏覽器 tab 自動重連(sessionStorage loop guard)
品質
- ~105+ 新 unit test + race detector (-count=2) 全綠
- 10 個 milestone 全部通過 Reviewer 審查
- 三方 v2 + v2.1 文件(PRD / Design Spec / TDD)+ 交叉互審紀錄
收錄在 .autoflow/
交付前待處理(M8-10)
- 重跑 make payload-macos 把舊 GPL 77MB binary 換成新 LGPL
- 三平台 end-to-end build 驗證
Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
235 lines
5.6 KiB
Go
235 lines
5.6 KiB
Go
package camera
|
|
|
|
import (
|
|
"bufio"
|
|
"fmt"
|
|
"io"
|
|
"os"
|
|
"os/exec"
|
|
"strconv"
|
|
"strings"
|
|
"sync"
|
|
"sync/atomic"
|
|
)
|
|
|
|
// VideoInfo holds metadata extracted by ffprobe before pipeline starts.
|
|
type VideoInfo struct {
|
|
DurationSec float64 // total duration in seconds
|
|
TotalFrames int // estimated total frames at target FPS
|
|
}
|
|
|
|
// ProbeVideoInfo runs ffprobe to extract duration from a video file or URL.
|
|
// Returns zero values (no error) when duration is indeterminate (e.g. live streams).
|
|
func ProbeVideoInfo(input string, fps float64) VideoInfo {
|
|
cmd := exec.Command("ffprobe",
|
|
"-v", "error",
|
|
"-select_streams", "v:0",
|
|
"-show_entries", "format=duration",
|
|
"-of", "csv=p=0",
|
|
input,
|
|
)
|
|
out, err := cmd.Output()
|
|
if err != nil {
|
|
return VideoInfo{}
|
|
}
|
|
durStr := strings.TrimSpace(string(out))
|
|
if durStr == "" || durStr == "N/A" {
|
|
return VideoInfo{}
|
|
}
|
|
dur, err := strconv.ParseFloat(durStr, 64)
|
|
if err != nil {
|
|
return VideoInfo{}
|
|
}
|
|
if fps <= 0 {
|
|
fps = 15
|
|
}
|
|
return VideoInfo{
|
|
DurationSec: dur,
|
|
TotalFrames: int(dur * fps),
|
|
}
|
|
}
|
|
|
|
// VideoSource reads a video file or URL frame-by-frame using ffmpeg, outputting
|
|
// JPEG frames via stdout. Reuses the same JPEG SOI/EOI marker parsing
|
|
// pattern as FFmpegCamera.
|
|
type VideoSource struct {
|
|
cmd *exec.Cmd
|
|
stdout io.ReadCloser
|
|
frameCh chan []byte // decoded frames queue
|
|
mu sync.Mutex
|
|
done chan struct{}
|
|
finished bool
|
|
err error
|
|
filePath string // local file path
|
|
totalFrames int64 // 0 means unknown
|
|
frameCount int64 // atomic counter incremented in readLoop
|
|
}
|
|
|
|
// NewVideoSource starts an ffmpeg process that decodes a video file
|
|
// and outputs MJPEG frames to stdout at the specified FPS.
|
|
func NewVideoSource(filePath string, fps float64) (*VideoSource, error) {
|
|
return newVideoSource(filePath, fps, 0)
|
|
}
|
|
|
|
// NewVideoSourceWithSeek starts ffmpeg from a specific position (in seconds).
|
|
func NewVideoSourceWithSeek(filePath string, fps float64, seekSeconds float64) (*VideoSource, error) {
|
|
return newVideoSource(filePath, fps, seekSeconds)
|
|
}
|
|
|
|
func newVideoSource(filePath string, fps float64, seekSeconds float64) (*VideoSource, error) {
|
|
if fps <= 0 {
|
|
fps = 15
|
|
}
|
|
|
|
args := []string{}
|
|
if seekSeconds > 0 {
|
|
args = append(args, "-ss", fmt.Sprintf("%.3f", seekSeconds))
|
|
}
|
|
args = append(args,
|
|
"-i", filePath,
|
|
"-vf", fmt.Sprintf("fps=%g", fps),
|
|
"-f", "image2pipe",
|
|
"-vcodec", "mjpeg",
|
|
"-q:v", "5",
|
|
"-an",
|
|
"-",
|
|
)
|
|
|
|
cmd := exec.Command("ffmpeg", args...)
|
|
stdout, err := cmd.StdoutPipe()
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed to get stdout pipe: %w", err)
|
|
}
|
|
cmd.Stderr = nil
|
|
|
|
if err := cmd.Start(); err != nil {
|
|
return nil, fmt.Errorf("failed to start ffmpeg: %w", err)
|
|
}
|
|
|
|
vs := &VideoSource{
|
|
cmd: cmd,
|
|
stdout: stdout,
|
|
frameCh: make(chan []byte, 30), // buffer up to 30 frames
|
|
done: make(chan struct{}),
|
|
filePath: filePath,
|
|
}
|
|
|
|
go vs.readLoop()
|
|
return vs, nil
|
|
}
|
|
|
|
// readLoop scans ffmpeg stdout for JPEG SOI/EOI markers to extract frames.
|
|
func (v *VideoSource) readLoop() {
|
|
defer close(v.done)
|
|
defer close(v.frameCh)
|
|
|
|
reader := bufio.NewReaderSize(v.stdout, 1024*1024)
|
|
buf := make([]byte, 0, 512*1024)
|
|
inFrame := false
|
|
|
|
for {
|
|
b, err := reader.ReadByte()
|
|
if err != nil {
|
|
v.mu.Lock()
|
|
v.finished = true
|
|
if err != io.EOF {
|
|
v.err = fmt.Errorf("ffmpeg stream ended: %w", err)
|
|
}
|
|
v.mu.Unlock()
|
|
return
|
|
}
|
|
|
|
if !inFrame {
|
|
if b == 0xFF {
|
|
next, err := reader.ReadByte()
|
|
if err != nil {
|
|
v.mu.Lock()
|
|
v.finished = true
|
|
v.mu.Unlock()
|
|
return
|
|
}
|
|
if next == 0xD8 {
|
|
buf = buf[:0]
|
|
buf = append(buf, 0xFF, 0xD8)
|
|
inFrame = true
|
|
}
|
|
}
|
|
continue
|
|
}
|
|
|
|
buf = append(buf, b)
|
|
|
|
if b == 0xD9 && len(buf) >= 2 && buf[len(buf)-2] == 0xFF {
|
|
frame := make([]byte, len(buf))
|
|
copy(frame, buf)
|
|
|
|
v.frameCh <- frame // blocks if buffer full, applies backpressure
|
|
atomic.AddInt64(&v.frameCount, 1)
|
|
inFrame = false
|
|
}
|
|
}
|
|
}
|
|
|
|
// ReadFrame returns the next decoded frame, blocking until one is available.
|
|
// Returns an error when all frames have been consumed and ffmpeg has finished.
|
|
func (v *VideoSource) ReadFrame() ([]byte, error) {
|
|
frame, ok := <-v.frameCh
|
|
if !ok {
|
|
return nil, fmt.Errorf("video playback complete")
|
|
}
|
|
return frame, nil
|
|
}
|
|
|
|
// SetTotalFrames sets the expected total frame count (from ffprobe).
|
|
func (v *VideoSource) SetTotalFrames(n int) {
|
|
atomic.StoreInt64(&v.totalFrames, int64(n))
|
|
}
|
|
|
|
// TotalFrames returns the expected total frame count, or 0 if unknown.
|
|
func (v *VideoSource) TotalFrames() int {
|
|
return int(atomic.LoadInt64(&v.totalFrames))
|
|
}
|
|
|
|
// FrameCount returns the number of frames decoded so far.
|
|
func (v *VideoSource) FrameCount() int {
|
|
return int(atomic.LoadInt64(&v.frameCount))
|
|
}
|
|
|
|
// IsFinished returns true when the video file has been fully decoded
|
|
// AND all buffered frames have been consumed.
|
|
func (v *VideoSource) IsFinished() bool {
|
|
v.mu.Lock()
|
|
finished := v.finished
|
|
v.mu.Unlock()
|
|
return finished && len(v.frameCh) == 0
|
|
}
|
|
|
|
// CloseWithoutRemove stops the ffmpeg process but does NOT delete the temp file.
|
|
// Used when seeking: we need to restart ffmpeg from a different position but keep the file.
|
|
func (v *VideoSource) CloseWithoutRemove() error {
|
|
if v.cmd != nil && v.cmd.Process != nil {
|
|
_ = v.cmd.Process.Kill()
|
|
_ = v.cmd.Wait()
|
|
}
|
|
for range v.frameCh {
|
|
}
|
|
<-v.done
|
|
return nil
|
|
}
|
|
|
|
func (v *VideoSource) Close() error {
|
|
if v.cmd != nil && v.cmd.Process != nil {
|
|
_ = v.cmd.Process.Kill()
|
|
_ = v.cmd.Wait()
|
|
}
|
|
// Drain any remaining frames so readLoop can exit
|
|
for range v.frameCh {
|
|
}
|
|
<-v.done
|
|
// Remove temp file if present
|
|
if v.filePath != "" {
|
|
_ = os.Remove(v.filePath)
|
|
}
|
|
return nil
|
|
}
|