【问题标题】:Split .srt file into equal chunks将 .srt 文件分成相等的块
【发布时间】:2018-07-03 12:39:24
【问题描述】:

我是新手,我需要将 Srt(字幕文件)拆分成多个块。

例如:如果我有视频的字幕文件(60 分钟)。那么字幕文件应该分成6个字幕文件,每个字幕文件时长10分钟。

即 6 X 10 = 60 分钟

不分分钟需要分成6个块。

使用这些每个字幕时间/持续时间,我必须将视频分成相同的块。

我正在尝试这段代码,请你帮我看看如何计算时间并分成块,

我能够达到我需要多少分钟的时间。但是卡在如何从源文件中读取该块分钟并创建一个新文件。然后如何从源文件的下一个 10 分钟开始下一个块文件。

import org.apache.commons.io.IOUtils;

import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.DataInputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.FileWriter;
import java.io.IOException;
import java.io.InputStreamReader;
import java.nio.charset.StandardCharsets;
import java.nio.file.Files;
import java.nio.file.Paths;
import java.sql.Timestamp;
import java.text.SimpleDateFormat;
import java.util.Date;
import java.util.List;
import java.util.stream.Stream;

/**
 * The class SyncSRTSubtitles reads a subtitles .SRT file and offsets all the
 * timestamps with the same specific value in msec.
 *
 * The format of the .SRT file is like this:
 *
 * 123
 * 00:11:23,456 --> 00:11:25,234
 * subtitle #123 text here
 *
 *
 * @author Sorinel CRISTESCU
 */
public class SyncSRTSubtitles {

    /**
     * Entry point in the program.
     *
     * @param args
     * @throws IOException
     */
    public static void main(String[] args) throws IOException {

        /* INPUT: offset value: negative = less (-) ... positive = more (+). */
        long delta = (22 * 1000L + 000); /* msec */


        /* INPUT: source & destination files */
        String srcFileNm = "/Users/meh/Desktop/avatar.srt";
        String destFileNm = "/Users/meh/Desktop/avatar1.srt";


        /* offset algorithm: START */
        File outFile = new File(destFileNm);
        outFile.createNewFile();
        FileWriter ofstream = new FileWriter(outFile);
        BufferedWriter out = new BufferedWriter(ofstream);

        /* Open the file that is the first command line parameter */
        FileInputStream fstream = new FileInputStream(srcFileNm);
        DataInputStream in = new DataInputStream(fstream);
        BufferedReader br = new BufferedReader(new InputStreamReader(in));
        String strLine;
//        List<String> doc = IOUtils.readLines(in, StandardCharsets.UTF_8);


String strEnd = null;
        long diff = 0;
        String line;
        String startTS1;
        try (Stream<String> lines = Files.lines(Paths.get(srcFileNm))) {
            line = lines.skip(1).findFirst().get();
            String[] atoms = line.split(" --> ");
             startTS1 = atoms[0];

        }
        System.out.println("bolo:" +line);
        System.out.println("startTS1:" +startTS1);

        String startTS = null;
        String endTS = null;
        /* Read File Line By Line */
        while ((strLine = br.readLine()) != null) {
            String[] atoms = strLine.split(" --> ");
            if (atoms.length == 1) {
                //out.write(strLine + "\n");
            }
            else {
                 startTS = atoms[0];


                 endTS = atoms[1];
//                out.write(offsetTime(startTS, delta) + " --> "
//                    + offsetTime(endTS, delta) + "\n");
                strEnd = endTS;

            }


        }
        try {
            SimpleDateFormat dateFormat = new SimpleDateFormat("hh:mm:ss");
            Date parsedendDate = dateFormat.parse(strEnd);
            Date parsedStartDate = dateFormat.parse(startTS1);
            diff = parsedendDate.getTime() - parsedStartDate.getTime();

        } catch(Exception e) { //this generic but you can control another types of exception
            // look the origin of excption
        }
        System.out.println("strEnd");
        System.out.println(strEnd);
        /* Close the input streams */
        in.close();
        out.close();
        System.out.println(diff);
        long diff1 =diff/6;
        System.out.println(diff1);
        long diff2= (diff1*6);
        System.out.println(diff2);
        System.out.println((diff / 3600000) + " hour/s " + (diff % 3600000) / 60000 + " minutes");
        System.out.println((diff1 / 3600000) + " hour/s " + (diff1 % 3600000) / 60000 + " minutes");
        System.out.println((diff2 / 3600000) + " hour/s " + (diff2 % 3600000) / 60000 + " minutes");

        /* offset algorithm: END */
        System.out.println("DONE! Check the rsult oin the file: " + destFileNm);
    }

    /**
     * Computes the timestamp offset.
     *
     * @param ts
     *            String value of the timestamp in format: "hh:MM:ss,mmm"
     * @param delta
     *            long value of the offset in msec (positive or negative).
     * @return String with the new timestamp representation.
     */
    private static String offsetTime(String ts, long delta) {
        long tsMsec = 0;
        String atoms[] = ts.split("\\,");
        if (atoms.length == 2) {
            tsMsec += Integer.parseInt(atoms[1]);
        }
        atoms = atoms[0].split(":");

        tsMsec += Integer.parseInt(atoms[2]) * 1000L; /* seconds */
        tsMsec += Integer.parseInt(atoms[1]) * 60000L; /* minutes */
        tsMsec += Integer.parseInt(atoms[0]) * 3600000L; /* hours */
        tsMsec += delta; /* here we do the offset. */

        long h = tsMsec / 3600000L;
        System.out.println(h);

        String result = get2digit(h, 2) + ":";

        System.out.println(result);


        long r = tsMsec % 3600000L;
        System.out.println(r);

        long m = r / 60000L;
        System.out.println(m);

        result += get2digit(m, 2) + ":";
        System.out.println(result);
        r = r % 60000L;
        System.out.println(r);

        long s = r / 1000L;
        result += get2digit(s, 2) + ",";

        result += get2digit(r % 1000L, 3);
        System.out.println(result);

        return result;
    }

    /**
     * Gets the string representation of the number, adding the prefix '0' to
     * have the required length.
     *
     * @param n
     *            long number to convert to string.
     * @param digits
     *            int number of digits required.
     * @return String with the required length string (3 for digits = 3 -->
     *         "003")
     */
    private static String get2digit(long n, int digits) {
        String result = "" + n;
        while (result.length() < digits) {
            result = "0" + result;
        }
        return result;
    }

}

请建议我如何做到这一点?

【问题讨论】:

  • 您是否总是需要以 10 分钟为单位的块,或者块应该是多少?
  • 我需要被分割成相等的块......如果它是 10 分钟,那么如果我想要 5 个块,那么它应该每个分割 2 分钟......如果我有 120 分钟的文件。如果我需要 6 个块,每个文件 20 分钟...这种输出我需要@XtremeBaumer
  • 您需要一种一致的方式来了解您需要多少块。 65/79/88 分钟需要多少块?
  • 它可能因电影而异。确定将固定为 6 块,无论几分钟。并且所有 6 个都应该写在 6 个 .srt 文件中
  • @XtremeBaumer 需要 6 个块,无论分钟数。它应该写在 6 个不同的 .srt 文件中。我怎样才能做到这一点?请建议

标签: java split srt


【解决方案1】:

我已经找到了一种将文件分成块的方法,

    public static void main(String args[]) throws IOException {
String FilePath = "/Users/meh/Desktop/escapeplan.srt";
        FileInputStream fin = new FileInputStream(FilePath);

        System.out.println("size: " +fin.getChannel().size());
        long abc = 0l;
        abc = (fin.getChannel().size())/3;
        System.out.println("6: " +abc);
System.out.println("abc: " +abc);
       //FilePath = args[1];
        File filename = new File(FilePath);
        long splitFileSize = 0,bytefileSize=0;
        if (filename.exists()) {
            try {
                //bytefileSize = Long.parseLong(args[2]);
                splitFileSize = abc;
                Splitme spObj = new Splitme();
                spObj.split(FilePath, (long) splitFileSize);
                spObj = null;
            } catch (Exception e) {
                e.printStackTrace();
            }
        } else {
            System.out.println("File Not Found....");
        }
}
    public void split(String FilePath, long splitlen) {

            long leninfile = 0, leng = 0;
            int count = 1, data;
            try {
                File filename = new File(FilePath);
                InputStream infile = new BufferedInputStream(new FileInputStream(filename));
                data = infile.read();
                System.out.println("data");
                System.out.println(data);

                while (data != -1) {
                    filename = new File("/Users/meh/Documents/srt" + count + ".srt");
    //RandomAccessFile outfile = new RandomAccessFile(filename, "rw");

                    OutputStream outfile = new BufferedOutputStream(new FileOutputStream(filename));
                    while (data != -1 && leng < splitlen) {
                        outfile.write(data);
                        leng++;
                        data = infile.read();
                    }
                    leninfile += leng;
                    leng = 0;
                    outfile.close();
                    changeTimeStamp(filename, count);

                    count++;


                }
            } catch (Exception e) {
                e.printStackTrace();
            }
}

【讨论】:

    【解决方案2】:

    您需要解析文件两次:

    • 一次读取最后结束时间
    • 第二次处理所有行和 生成输出文件。
    
        import java.io.BufferedWriter;
        import java.io.File;
        import java.io.FileWriter;
        import java.io.IOException;
        import java.util.List;
    
        import org.apache.commons.io.FileUtils;
    
        public class SplitSRTFiles {
    
            /**
             * Splits a SRT file in multiple files each containing an equal time duration.
             * @param args
             * [0] number of wanted chunks
             * [1] source file name
             * @throws IOException
             */
            public static void main(String[] args) throws IOException {
                int nrOfChunks = Integer.parseInt(args[0]);
                File srtFile = new File(args[1]);
                System.out.println("Splitting "+srtFile.getAbsolutePath()+" into "+nrOfChunks+" files.");
    
                List<String> srcLines = FileUtils.readLines(srtFile);
                long fileEndTime = lastEndTime(srcLines);
                long msecsPerChunkFile = fileEndTime / nrOfChunks;
                int destFileCounter = 1;
                String[] fileNameParts = srtFile.getName().split("\\.");
                File outFile = new File(fileNameParts[0] + destFileCounter + "." + fileNameParts[1]);
                System.out.println("Writing to "+outFile.getAbsolutePath());
                outFile.createNewFile();
                FileWriter ofstream = new FileWriter(outFile);
                BufferedWriter out = new BufferedWriter(ofstream);
    
                for (String line : srcLines) {
                    String[] atoms = line.split(" --> ");
                    if (atoms.length > 1) {
                        long startTS = toMSec(atoms[0]);
                        // check if start time of this subtitle is after the current
                        // chunk
                        if (startTS > msecsPerChunkFile * destFileCounter) {
                            // close existing file ...
                            out.close();
                            ofstream.close();
                            // ... and start a new file
                            destFileCounter++;
                            outFile = new File(srtFile.getParent(), fileNameParts[0] + destFileCounter + "." + fileNameParts[1]);
                            System.out.println("Writing to "+outFile.getAbsolutePath());
                            outFile.createNewFile();
                            ofstream = new FileWriter(outFile);
                            out = new BufferedWriter(ofstream);
                        }
                    }
                    out.write(line + "/n");
                }
                out.close();
                ofstream.close();
                System.out.println("Done.");
            }
    
            /**
             * Calculates the time in msec of the end time of the last subtitle of the
             * file
             * 
             * @param lines
             *            read from file
             * @return end time in milliseconds of the last subtitle
             */
            public static long lastEndTime(List lines) throws IOException {
                String endTS = null;
                for (String line : lines) {
                    String[] atoms = line.split(" --> ");
                    if (atoms.length > 1) {
                        endTS = atoms[1];
                    }
                }
                return endTS == null ? 0L : toMSec(endTS);
            }
    
            public static long toMSec(String time) {
                long tsMsec = 0;
                String atoms[] = time.split("\\,");
                if (atoms.length == 2) {
                    tsMsec += Integer.parseInt(atoms[1]);
                }
                atoms = atoms[0].split(":");
    
                tsMsec += Integer.parseInt(atoms[2]) * 1000L; /* seconds */
                tsMsec += Integer.parseInt(atoms[1]) * 60000L; /* minutes */
                tsMsec += Integer.parseInt(atoms[0]) * 3600000L; /* hours */
                return tsMsec;
            }
        }
    

    【讨论】:

    • 谢谢。但是我在“for(String line: )”不兼容的类型上遇到错误。预期的对象,但找到了字符串。
    猜你喜欢
    • 1970-01-01
    • 1970-01-01
    • 2021-10-22
    • 1970-01-01
    • 1970-01-01
    • 1970-01-01
    • 1970-01-01
    • 1970-01-01
    • 2014-10-21
    相关资源
    最近更新 更多