{"skill":{"slug":"local-video-understanding","displayName":"Local Video Understanding","summary":"Local video comprehension skill. Use ffmpeg to extract audio and frames, FunASR for speech recognition, and qwen3-vl for image understanding.","tags":{"latest":"1.0.2"},"stats":{"comments":0,"downloads":111,"installsAllTime":0,"installsCurrent":0,"stars":1,"versions":2},"createdAt":1775923371788,"updatedAt":1775923910883},"latestVersion":{"version":"1.0.2","createdAt":1775923695935,"changelog":"Fix README structure to match actual files","license":"MIT-0"},"metadata":null,"owner":{"handle":"tomuiv","userId":"s171935xz6xsqmpn3z12w1jnk184m1a9","displayName":"TOMUIV","image":"https://avatars.githubusercontent.com/u/232025981?v=4"},"moderation":null}