TeamNewPipe · TobiGr · Oct 30, 2025 · Aug 26, 2025 · Aug 27, 2025 · Sep 18, 2025
diff --git a/app/src/main/java/org/schabi/newpipe/streams/SrtFromTtmlWriter.java b/app/src/main/java/org/schabi/newpipe/streams/SrtFromTtmlWriter.java
@@ -54,6 +54,36 @@ private void writeString(final String text) throws IOException {
         out.write(text.getBytes(charset));
     }
 
+    // CHECKSTYLE:OFF checkstyle:JavadocStyle
+    // checkstyle does not understand that span tags are inside a code block
+    /**
+     * <p>Recursive method to extract text from all nodes.</p>
+     * <p>
+     *   This method processes {@link TextNode}s and {@code <br>} tags,
+     *   recursively extracting text from nested tags
+     *   (e.g. extracting text from nested {@code <span>} tags).
+     *   Newlines are added for {@code <br>} tags.
+     * </p>
+     * @param node the current node to process
+     * @param text the {@link StringBuilder} to append the extracted text to
+     */
+    private void extractText(final Node node, final StringBuilder text) {
+        if (node instanceof TextNode textNode) {
+            text.append(textNode.text());
+        } else if (node instanceof Element element) {
+            // Only <br> contributes output of its own; other elements add nothing here.
+            if (element.tagName().equalsIgnoreCase("br")) {
+                // A <br> becomes one line break in the extracted text
+                text.append(NEW_LINE);
+            }
+        }
+        // Recurse into every child so text nested in other tags is also collected
+        for (final Node child : node.childNodes()) {
+            extractText(child, text);
+        }
+    }
+    // CHECKSTYLE:ON
+
     public void build(final SharpStream ttml) throws IOException {
         /*
          * TTML parser with BASIC support
@@ -74,21 +104,15 @@ public void build(final SharpStream ttml) throws IOException {
         final Elements paragraphList = doc.select("body > div > p");
 
         // check if has frames
-        if (paragraphList.size() < 1) {
+        if (paragraphList.isEmpty()) {
             return;
         }
 
         for (final Element paragraph : paragraphList) {
             text.setLength(0);
 
-            for (final Node children : paragraph.childNodes()) {
-                if (children instanceof TextNode) {
-                    text.append(((TextNode) children).text());
-                } else if (children instanceof Element
-                        && ((Element) children).tagName().equalsIgnoreCase("br")) {
-                    text.append(NEW_LINE);
-                }
-            }
+            // Recursively extract text from all child nodes
+            extractText(paragraph, text);
 
             if (ignoreEmptyFrames && text.length() < 1) {
                 continue;