使用FFmpeg进行视频抽取音频,之后进行语音识别转为文字

简介: 使用FFmpeg进行视频抽取音频,之后进行语音识别转为文字


1、首先需要下载FFmpeg;

2、Gradle依赖

正在上传…
取消
def void forceVersion(details, group, version) {

if (details.requested.group == group) {
    details.useVersion version
}

}

def void forceVersion(details, group, name, version) {

if (details.requested.group == group && details.requested.name == name) {
    details.useVersion version
}

}

allprojects { p ->

group = 'com.my.spider'
version = '1.0.0'

apply plugin: 'java'
apply plugin: 'maven'
apply plugin: 'maven-publish'

[compileJava, compileTestJava]*.options*.encoding = 'UTF-8'

jar.doFirst {
    manifest {
        def manifestFile = "${projectDir}/META-INF/MANIFEST.MF"
        if (new File(manifestFile).exists())
            from (manifestFile)
        
        attributes 'Implementation-Title':p.name
        if (p.version.endsWith('-SNAPSHOT')) {
            attributes 'Implementation-Version': p.version + '-' + p.ext.Timestamp
        } else {
            attributes 'Implementation-Version': p.version
        }
        attributes 'Implementation-BuildDateTime':new Date()
    }
}

javadoc {
    options {
        encoding 'UTF-8'
        charSet 'UTF-8'
        author false
        version true
        links 'http://docs.oracle.com/javase/8/docs/api/index.html'
        memberLevel = org.gradle.external.javadoc.JavadocMemberLevel.PRIVATE
    }
}

if (System.env.uploadArchives) {
    build.dependsOn publish
}

buildscript {
    repositories {
        mavenCentral()
    }
    dependencies {classpath 'org.springframework.boot:spring-boot-gradle-plugin:1.5.14.RELEASE' }
}

afterEvaluate {Project  project -> 
    if (project.pluginManager.hasPlugin('java')) {
        configurations.all {
            resolutionStrategy.eachDependency {DependencyResolveDetails details -> 
                forceVersion details, 'org.springframework.boot', '1.4.1.RELEASE'
                forceVersion details, 'org.slf4j', '1.7.21'
                forceVersion details, 'org.springframework', '4.3.3.RELEASE'
            }

            exclude module:'slf4j-log4j12'
            exclude module:'log4j'
        }

        dependencies {testCompile 'junit:junit:4.12' }
    }
}

repositories {
    mavenCentral()
}

// 时间戳:年月日时分
p.ext.Timestamp = new Date().format('yyyyMMddHHmm')
// Build Number
p.ext.BuildNumber = System.env.BUILD_NUMBER
if (p.ext.BuildNumber == null || "" == p.ext.BuildNumber) {
    p.ext.BuildNumber = 'x'
}    

}

task zipSources(type: Zip) {

description '压缩源代码'
project.ext.zipSourcesFile = project.name + '-' + project.version + '-' +  project.ext.Timestamp + '.' + project.ext.BuildNumber + '-sources.zip' 
archiveName = project.ext.zipSourcesFile
includeEmptyDirs = false

from project.projectDir

exclude '**/.*'
exclude 'build/*'
allprojects.each { p ->
    exclude '**/' + p.name + '/bin/*'
    exclude '**/' + p.name + '/build/*'
    exclude '**/' + p.name + '/data/*'
    exclude '**/' + p.name + '/work/*'
    exclude '**/' + p.name + '/logs/*'    
}

}

def CopySpec appCopySpec(Project prj, dstname = null) {

if (!dstname) { dstname = prj.name }
return copySpec{
    // Fat jar
    from (prj.buildDir.toString() + '/libs/' + prj.name + '-' + project.version + '.jar') {
        into dstname
    }        

    // Configs
    from (prj.projectDir.toString() + '/config/examples') {
        into dstname + '/config'
    }

    // Windows start script
    from (prj.projectDir.toString() + '/' + prj.name + '.bat') {
        into dstname
    }
    
    // Unix conf script
    from (prj.projectDir.toString() + '/' + prj.name + '.conf') {
        into dstname
        rename prj.name, prj.name + '-' + project.version
    }
}    

}

task zipSetup(type: Zip, dependsOn: subprojects.build) {

description '制作安装包' 
project.ext.zipSetupFile = project.name + '-' + project.version + '-' +  project.ext.Timestamp + '.' + project.ext.BuildNumber + '-setup.zip' 
archiveName = project.name + '-' + project.version + '-' +  project.ext.Timestamp + '.' + project.ext.BuildNumber + '-setup.zip'

with appCopySpec(project(':spider-demo'))

}

import java.security.MessageDigest

def generateMD5(final file) {

MessageDigest digest = MessageDigest.getInstance("MD5")
file.withInputStream(){is->
    byte[] buffer = new byte[8192]
    int read = 0
    while( (read = is.read(buffer)) > 0) {
        digest.update(buffer, 0, read);
    }
}
byte[] md5sum = digest.digest()
BigInteger bigInt = new BigInteger(1, md5sum)
return bigInt.toString(16)

}

task md5(dependsOn: [zipSetup, zipSources]) << {

String md5_setup = generateMD5(file("${projectDir}/build/distributions/" + project.ext.zipSetupFile));
String md5_sources = generateMD5(file("${projectDir}/build/distributions/" + project.ext.zipSourcesFile));
println project.ext.zipSetupFile + '=' + md5_setup
println project.ext.zipSourcesFile + '=' + md5_sources

def newFile = new File("${projectDir}/build/distributions/" 
                + project.name + '-' + project.version + '-' +  project.ext.Timestamp + '.' + project.ext.BuildNumber + '-md5.txt')
PrintWriter printWriter = newFile.newPrintWriter()
printWriter.println project.ext.zipSetupFile + '=' + md5_setup
printWriter.println project.ext.zipSourcesFile + '=' + md5_sources
printWriter.flush()
printWriter.close()

}

build.dependsOn subprojects.build, zipSetup, zipSources, md5
bulid.gradle
工程组件gradle依赖: 语音识别使用 百度api;需引入 compile 'com.baidu.aip:java-sdk:3.2.1'

apply plugin: 'spring-boot'
apply plugin: 'application'

distributions {

main {
    contents {
        from ("${projectDir}/config/examples") {
            into "config"
        }
    }
}

}

distTar.enabled = false

springBoot {

executable = true
mainClass = 'com.my.ai.Application'

}

dependencies {

compile 'org.springframework.boot:spring-boot-starter-web:1.4.0.RELEASE'
compile 'dom4j:dom4j:1.6.1'
compile 'commons-httpclient:commons-httpclient:3.1'
compileOnly 'com.h2database:h2:1.4.191'
compile 'javax.cache:cache-api:1.0.0'
compile 'org.jboss.resteasy:resteasy-jaxrs:3.0.14.Final'
compile 'org.jboss.resteasy:resteasy-client:3.0.14.Final'
// Axis
compile 'axis:axis:1.4'

compile 'org.jsoup:jsoup:1.10.1'

compile 'com.alibaba:fastjson:1.2.21'

compile 'com.baidu.aip:java-sdk:3.2.1'

}
3、视频抽取音频服务“

正在上传…
取消
package com.my.ai.service;

import java.io.BufferedReader;
import java.io.File;
import java.io.InputStreamReader;
import java.util.List;

import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.stereotype.Service;

//视频抽取音频
@Service
public class ExtractAudioService {

public static Logger logger  = LoggerFactory.getLogger(ExtractAudioService.class);

public static void main(String[] args) {
    new ExtractAudioService().getAudioFromVideo("E:\\QLDownload\\氧化还原反应中电子转移的方向和数目的表示方法\\氧化还原反应中电子转移的方向和数目的表示方法.mp4",
            "D:\\ffmpeg4.2\\bin\\ffmpeg.exe");
}


public String getAudioFromVideo(String videoPath,String ffmpegPath) {
    File video = new File(videoPath);
    if(video.exists() && video.isFile()){
        String format = "wav";
        String outPath = videoPath.substring(0,videoPath.lastIndexOf(".")) + ".wav";
        processCmd(videoPath, ffmpegPath, format, outPath);
        return outPath;
    }
    return null;
}

//D:\ffmpeg4.2\bin\ffmpeg.exe -i 氧化还原反应中电子转移的方向和数目的表示方法.mp4 -f wav -vn -y 3.wav
public String processCmd(String inputPath,String ffmpegPath,String format,String outPath) {
    List<String> commend = new java.util.ArrayList<String>();
    commend.add(ffmpegPath);
    commend.add("-i");
    commend.add(inputPath);
    commend.add("-y");
    commend.add("-vn");
    commend.add("-f");
    commend.add(format);
    commend.add(outPath);
    try {

        ProcessBuilder builder = new ProcessBuilder();
        builder.command(commend);
        builder.redirectErrorStream(true);
        Process p = builder.start();

        // 1. start
        BufferedReader buf = null; // 保存ffmpeg的输出结果流
        String line = null;
        // read the standard output

        buf = new BufferedReader(new InputStreamReader(p.getInputStream()));

        StringBuffer sb = new StringBuffer();
        while ((line = buf.readLine()) != null) {
            System.out.println(line);
            sb.append(line);
            continue;
        }
        p.waitFor();// 这里线程阻塞,将等待外部转换进程运行成功运行结束后,才往下执行
        // 1. end
        return sb.toString();
    } catch (Exception e) {

// System.out.println(e);

        return null;
    }
}

}
ExtractAudioService
4、音频切段:

package com.my.ai.service;

import java.io.BufferedReader;
import java.io.File;
import java.io.InputStreamReader;
import java.util.ArrayList;
import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.stereotype.Service;

@Service
public class CutService {

public static Logger logger = LoggerFactory.getLogger(CutService.class);

public List<String> cutFile(String media_path, String ffmpeg_path) {

    List<String> audios = new ArrayList<>();
    int mediaTime = getMediaTime(media_path, ffmpeg_path); 
    int num = mediaTime / 59;
    int lastNum = mediaTime % 59;
    System.out.println(mediaTime +"|" + num + "|"+ lastNum);
    int length = 59;
    File file = new File(media_path);
    String filename = file.getName();
    for (int i = 0; i < num; i++) {
        String outputPath = file.getParent() + File.separator + i + "-"+filename;
        processCmd(media_path, ffmpeg_path, String.valueOf(length * i) , 
                String.valueOf(length), outputPath);
        audios.add(outputPath);
    }
    if(lastNum > 0) {
        String outputPath = file.getParent() + File.separator + num + "-"+filename;
        processCmd(media_path, ffmpeg_path, String.valueOf(length * num) , 
                String.valueOf(lastNum), outputPath);
        audios.add(outputPath);
    }
    return audios;
}

/**
 * 获取视频总时间
 * 
 * @param viedo_path  视频路径
 * @param ffmpeg_path ffmpeg路径
 * @return
 */
public int getMediaTime(String video_path, String ffmpeg_path) {
    List<String> commands = new java.util.ArrayList<String>();
    commands.add(ffmpeg_path);
    commands.add("-i");
    commands.add(video_path);
    try {
        ProcessBuilder builder = new ProcessBuilder();
        builder.command(commands);
        final Process p = builder.start();

        // 从输入流中读取视频信息
        BufferedReader br = new BufferedReader(new InputStreamReader(p.getErrorStream()));
        StringBuffer sb = new StringBuffer();
        String line = "";
        while ((line = br.readLine()) != null) {
            sb.append(line);
        }
        System.out.println(sb.toString());
        br.close();

        // 从视频信息中解析时长
        String regexDuration = "Duration: (.*?), bitrate: (\\d*) kb\\/s";
        Pattern pattern = Pattern.compile(regexDuration);
        Matcher m = pattern.matcher(sb.toString());
        if (m.find()) {
            int time = getTimelen(m.group(1));
            System.out
                    .println(video_path + ",视频时长:" + time + ",比特率:" + m.group(2) + "kb/s");
            return time;
        }
    } catch (Exception e) {
        e.printStackTrace();
    }
    return 0;
}

// 格式:"00:00:10.68"
public int getTimelen(String timelen) {
    int min = 0;
    String strs[] = timelen.split(":");
    if (strs[0].compareTo("0") > 0) {
        min += Integer.valueOf(strs[0]) * 60 * 60;// 秒
    }
    if (strs[1].compareTo("0") > 0) {
        min += Integer.valueOf(strs[1]) * 60;
    }
    if (strs[2].compareTo("0") > 0) {
        min += Math.round(Float.valueOf(strs[2]));
    }  
    return min;
}

//D:\ffmpeg4.2\bin\ffmpeg.exe -i 123.pcm -ss 0 -t 59 1-123.wav
public String processCmd(String inputPath,String ffmpegPath,
        String startTime,String length,String outputPath) {
    List<String> commend = new java.util.ArrayList<String>();
    commend.add(ffmpegPath);
    commend.add("-i");
    commend.add(inputPath);
    commend.add("-ss");
    commend.add(startTime);
    commend.add("-t");
    commend.add(length);
    commend.add(outputPath);
    try {

        ProcessBuilder builder = new ProcessBuilder();
        builder.command(commend);
        builder.redirectErrorStream(true);
        Process p = builder.start();

        // 1. start
        BufferedReader buf = null; // 保存ffmpeg的输出结果流
        String line = null;
        // read the standard output

        buf = new BufferedReader(new InputStreamReader(p.getInputStream()));

        StringBuffer sb = new StringBuffer();
        while ((line = buf.readLine()) != null) {
            System.out.println(line);
            sb.append(line);
            continue;
        }
        p.waitFor();// 这里线程阻塞,将等待外部转换进程运行成功运行结束后,才往下执行
        // 1. end
        return sb.toString();
    } catch (Exception e) {
        System.out.println(e);    
        return null;
    }
}

//ffmpeg -y  -i 16k.wav  -acodec pcm_s16le -f s16le -ac 1 -ar 16000 16k.pcm 
public static String processWavToPcm(String inputPath,String ffmpegPath,String outputPath) {
    List<String> commend = new java.util.ArrayList<String>();
    commend.add(ffmpegPath);
    commend.add("-i");
    commend.add(inputPath);
    commend.add("-acodec");
    commend.add("pcm_s16le");
    commend.add("-f");
    commend.add("s16le");
    commend.add("-ac");
    commend.add("1");
    commend.add("-ar");
    commend.add("16000");
    commend.add(outputPath);
    try {

        ProcessBuilder builder = new ProcessBuilder();
        builder.command(commend);
        builder.redirectErrorStream(true);
        Process p = builder.start();

        // 1. start
        BufferedReader buf = null; // 保存ffmpeg的输出结果流
        String line = null;
        // read the standard output

        buf = new BufferedReader(new InputStreamReader(p.getInputStream()));

        StringBuffer sb = new StringBuffer();
        while ((line = buf.readLine()) != null) {
            System.out.println(line);
            sb.append(line);
            continue;
        }
        p.waitFor();// 这里线程阻塞,将等待外部转换进程运行成功运行结束后,才往下执行
        // 1. end
        return outputPath;
                //sb.toString();
    } catch (Exception e) {
        System.out.println(e);    
        return null;
    }
}




public static void main(String[] args) {
    List<String> audios = new CutService().cutFile(
            "E:\\QLDownload\\氧化还原反应中电子转移的方向和数目的表示方法\\氧化还原反应中电子转移的方向和数目的表示方法.wav",
            "D:\\ffmpeg4.2\\bin\\ffmpeg.exe");
    System.out.println(audios.size());
    
    for (String wavPath : audios) {
        String out = wavPath.substring(0,wavPath.lastIndexOf(".")) + ".pcm";
        processWavToPcm(wavPath, "D:\\ffmpeg4.2\\bin\\ffmpeg.exe", out);
    }
    
}

}
5、音频格式转换,便于进行语音识别,代码如上:

6、调用sdk,获取识别结果:

package com.my.ai.service;

import org.json.JSONObject;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.stereotype.Service;

import com.baidu.aip.speech.AipSpeech;

@Service
public class TokenService {

public static Logger logger = LoggerFactory.getLogger(TokenService.class);

 //设置APPID/AK/SK
public static final String APP_ID = "***";
public static final String API_KEY = "***";
public static final String SECRET_KEY = "***";
static AipSpeech client = null;
static {
    if(client == null) {
         client = new AipSpeech(APP_ID, API_KEY, SECRET_KEY);
    }
}

public static void main(String[] args) {
    getResult("E:\\QLDownload\\数目的表示方法.pcm");
}

public static String getResult(String file) {
     
      // 可选:设置网络连接参数
      client.setConnectionTimeoutInMillis(2000);
      client.setSocketTimeoutInMillis(60000);
      // 可选:设置代理服务器地址, http和socket二选一,或者均不设置
      //client.setHttpProxy("proxy_host", proxy_port);  // 设置http代理
      //client.setSocketProxy("proxy_host", proxy_port);  // 设置socket代理
      JSONObject res = client.asr(file, "pcm", 16000, null);
      //System.out.println(res.toString(2));
      System.out.println(res.get("result").toString());
      return res.get("result").toString();
}


}
  

7、结果写入文件:

package com.my.ai.service;

import java.io.BufferedOutputStream;
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileOutputStream;
import java.io.FileWriter;
import java.io.IOException;
import java.io.OutputStreamWriter;
import java.io.RandomAccessFile;

import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.stereotype.Service;

@Service
public class FileService {

public static Logger logger = LoggerFactory.getLogger(FileService.class);


//最慢
public static void writeFile1(String file,String content) throws IOException {
    FileOutputStream out = null;
    out = new FileOutputStream(new File(file));
    long begin = System.currentTimeMillis();
    out.write(content.getBytes());
    out.close();
    long end = System.currentTimeMillis();
    System.out.println("FileOutputStream执行耗时:" + (end - begin) + " 毫秒");
}
//中
public static void writeFile2(String file,String content) throws IOException{
    FileWriter fw = null;
    fw = new FileWriter(file);
    long begin3 = System.currentTimeMillis();
    fw.write(content);
    fw.close();
    long end3 = System.currentTimeMillis();
    System.out.println("FileWriter执行耗时:" + (end3 - begin3) + " 毫秒");
}
//最快
public static void writeFile3(String file,String content) throws IOException{
    FileOutputStream outSTr = null;
    BufferedOutputStream buff = null;
    outSTr = new FileOutputStream(new File(file));
    buff = new BufferedOutputStream(outSTr);
    long begin0 = System.currentTimeMillis();
    buff.write(content.getBytes());
    buff.flush();
    buff.close();
    long end0 = System.currentTimeMillis();
    System.out.println("BufferedOutputStream执行耗时:" + (end0 - begin0) + " 毫秒");
}

public static void main(String[] args) {
    for (int i = 0; i < 7; i++) {
        String result = TokenService.getResult("E:\\QLDownload\\氧化还原反应中电子转移的方向和数目的表示方法\\" + i +"-氧化还原反应中电子转移的方向和数目的表示方法.pcm");
        appendFile2("E:\\QLDownload\\氧化还原反应中电子转移的方向和数目的表示方法\\氧化还原反应中电子转移的方向和数目的表示方法.txt", result+"\r\n");
    }
}

public static void appendFile1(String file, String conent) {
    BufferedWriter out = null;
    try {
        out = new BufferedWriter(new OutputStreamWriter(new FileOutputStream(file, true)));
        out.write(conent);
    } catch (Exception e) {
        e.printStackTrace();
    } finally {
        try {
            if (out != null) {
                out.close();
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
    }
}

/**
 * 追加文件:使用FileWriter
 * 
 * @param fileName
 * @param content
 */
public static void appendFile2(String fileName, String content) {
    FileWriter writer = null;
    try {
        // 打开一个写文件器,构造函数中的第二个参数true表示以追加形式写文件
        writer = new FileWriter(fileName, true);
        writer.write(content);
    } catch (IOException e) {
        e.printStackTrace();
    } finally {
        try {
            if (writer != null) {
                writer.close();
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
    }
}

/**
 *  追加文件:使用RandomAccessFile
 * 
 * @param fileName 文件名
 * @param content  追加的内容
 */
public static void appendFile3(String fileName, String content) {
    RandomAccessFile randomFile = null;
    try {
        // 打开一个随机访问文件流,按读写方式
        randomFile = new RandomAccessFile(fileName, "rw");
        // 文件长度,字节数
        long fileLength = randomFile.length();
        // 将写文件指针移到文件尾。
        randomFile.seek(fileLength);
        randomFile.writeBytes(content);
    } catch (IOException e) {
        e.printStackTrace();
    } finally {
        if (randomFile != null) {
            try {
                randomFile.close();
            } catch (IOException e) {
                e.printStackTrace();
            }
        }
    }
}

}
 

8、测试:

package com.my.ai.test;

import java.util.List;

import com.my.ai.service.CutService;
import com.my.ai.service.ExtractAudioService;
import com.my.ai.service.FileService;
import com.my.ai.service.TokenService;

public class TestService {


public static void main(String[] args) {
    ExtractAudioService audioService = new ExtractAudioService();
    String outPath =  audioService.getAudioFromVideo("G:\\Youku Files\\transcode\\反应_标清.mp4", "D:\\ffmpeg4.2\\bin\\ffmpeg.exe");
    List<String> audios = new CutService().cutFile(outPath,"D:\\ffmpeg4.2\\bin\\ffmpeg.exe");
    for (String wavPath : audios) {
        String out = wavPath.substring(0,wavPath.lastIndexOf(".")) + ".pcm";
        String outPcm = CutService.processWavToPcm(wavPath, "D:\\ffmpeg4.2\\bin\\ffmpeg.exe", out);
        String result = TokenService.getResult(outPcm);
        FileService.appendFile2("G:\\Youku Files\\transcode\\标清.mp4-字幕.txt", result+"\r\n");
    }
}

}
  

相关实践学习
达摩院智能语音交互 - 声纹识别技术
声纹识别是基于每个发音人的发音器官构造不同,识别当前发音人的身份。按照任务具体分为两种: 声纹辨认:从说话人集合中判别出测试语音所属的说话人,为多选一的问题 声纹确认:判断测试语音是否由目标说话人所说,是二选一的问题(是或者不是) 按照应用具体分为两种: 文本相关:要求使用者重复指定的话语,通常包含与训练信息相同的文本(精度较高,适合当前应用模式) 文本无关:对使用者发音内容和语言没有要求,受信道环境影响比较大,精度不高 本课程主要介绍声纹识别的原型技术、系统架构及应用案例等。 讲师介绍: 郑斯奇,达摩院算法专家,毕业于美国哈佛大学,研究方向包括声纹识别、性别、年龄、语种识别等。致力于推动端侧声纹与个性化技术的研究和大规模应用。
相关文章
|
2月前
|
编解码 语音技术 内存技术
FFmpeg开发笔记(五十八)把32位采样的MP3转换为16位的PCM音频
《FFmpeg开发实战:从零基础到短视频上线》一书中的“5.1.2 把音频流保存为PCM文件”章节介绍了将媒体文件中的音频流转换为原始PCM音频的方法。示例代码直接保存解码后的PCM数据,保留了原始音频的采样频率、声道数量和采样位数。但在实际应用中,有时需要特定规格的PCM音频。例如,某些语音识别引擎仅接受16位PCM数据,而标准MP3音频通常采用32位采样,因此需将32位MP3音频转换为16位PCM音频。
78 0
FFmpeg开发笔记(五十八)把32位采样的MP3转换为16位的PCM音频
|
4月前
|
编解码 Linux
CentOS安装ffmpeg并转码视频为mp4
CentOS安装ffmpeg并转码视频为mp4
155 0
|
1月前
|
编解码 监控 网络协议
如何使用FFmpeg实现RTSP推送H.264和H.265(HEVC)编码视频
本文详细介绍了如何使用FFmpeg实现RTSP推送H.264和H.265(HEVC)编码视频。内容涵盖环境搭建、编码配置、服务器端与客户端实现等方面,适合视频监控系统和直播平台等应用场景。通过具体命令和示例代码,帮助读者快速上手并实现目标。
196 6
|
6月前
|
Python
Python使用ffmpeg下载m3u8拼接为视频
Python使用ffmpeg下载m3u8拼接为视频
|
2月前
|
Java 数据安全/隐私保护
Java ffmpeg 实现视频加文字/图片水印功能
【10月更文挑战第22天】在 Java 中使用 FFmpeg 实现视频加文字或图片水印功能,需先安装 FFmpeg 并添加依赖(如 JavaCV)。通过构建 FFmpeg 命令行参数,使用 `drawtext` 滤镜添加文字水印,或使用 `overlay` 滤镜添加图片水印。示例代码展示了如何使用 JavaCV 实现文字水印。
154 1
|
2月前
|
计算机视觉 Python
FFMPEG学习笔记(一): 提取视频的纯音频及无声视频
本文介绍了如何使用FFmpeg工具从视频中提取纯音频和无声视频。提供了具体的命令行操作,例如使用`ffmpeg -i input.mp4 -vn -c:a libmp3lame output.mp3`来提取音频,以及`ffmpeg -i input.mp4 -c:v copy -an output.mp4`来提取无声视频。此外,还包含了一个Python脚本,用于批量处理视频文件,自动提取音频和生成无声视频。
85 1
|
2月前
FFmpeg学习笔记(二):多线程rtsp推流和ffplay拉流操作,并储存为多路avi格式的视频
这篇博客主要介绍了如何使用FFmpeg进行多线程RTSP推流和ffplay拉流操作,以及如何将视频流保存为多路AVI格式的视频文件。
306 0
|
4月前
|
存储 算法 Serverless
【matlab】matlab基于DTW和HMM方法数字语音识别系统(源码+音频文件+GUI界面)【独一无二】
【matlab】matlab基于DTW和HMM方法数字语音识别系统(源码+音频文件+GUI界面)【独一无二】
|
6月前
|
Java Linux
ffmpeg音频格式转换、合成、速率调整
ffmpeg音频格式转换、合成、速率调整
126 2
|
6月前
|
编解码 Linux 计算机视觉
python 调用ffmpeg使用usb摄像头录制视频,输出h264格式,自动获取摄像头的最佳帧率和最大画面尺寸
使用 Python 调用 FFmpeg 进行 USB 摄像头视频录制,需先确保安装 FFmpeg 和 Python 的 `subprocess` 模块。代码示例展示了如何自动获取摄像头的最佳帧率和最大分辨率,然后录制视频。首先通过 FFmpeg 列出摄像头格式获取信息,解析出帧率和分辨率,选择最优值。之后调用 FFmpeg 命令录制视频,设置帧率、分辨率等参数。注意 `/dev/video0` 是 Linux 的摄像头设备路径,Windows 系统需相应调整。代码中未直接实现自动获取最佳参数,通常需要借助其他库如 OpenCV。
下一篇
DataWorks