fix: preserve input order for equal-timestamp lyrics in normalize and to_plain

2026-04-08 12:28:28 +02:00
parent f8db549d8e
commit 9b42cab76b
4 changed files with 46 additions and 4 deletions
@@ -4,7 +4,7 @@ build-backend = "hatchling.build"

 [project]
 name = "lrx-cli"
-version = "0.6.3"
+version = "0.6.4"
 description = "Fetch line-synced lyrics for your music player."
 readme = "README.md"
 requires-python = ">=3.13"
@@ -378,7 +378,12 @@ class LRCData:
                shifted = max(0, time_ms + offset_ms)
                lyric_entries.append((shifted, lyric_text))

-        lyric_entries.sort(key=lambda item: item[0])
+        # Sort by timestamp; original index as tiebreaker so equal-time entries
+        # retain the order they appeared in the input.
+        lyric_entries = [
+            e
+            for _, e in sorted(enumerate(lyric_entries), key=lambda x: (x[1][0], x[0]))
+        ]

        out_lyrics: list[LyricLine] = [
            LyricLine(line_times_ms=[time_ms], words=[LrcWordSegment(text=text)])
@@ -413,7 +418,12 @@ class LRCData:
        for line in self._lines:
            tagged_lines.extend(line.timed_plain_entries())

-        sorted_lines = [lyric for _, lyric in sorted(tagged_lines, key=lambda x: x[0])]
+        sorted_lines = [
+            lyric
+            for _, (_, lyric) in sorted(
+                enumerate(tagged_lines), key=lambda x: (x[1][0], x[0])
+            )
+        ]

        if deduplicate:
            # Remove consecutive duplicates
@@ -185,6 +185,23 @@ def test_normalize_expands_multi_time_tags_and_sorts_lyrics() -> None:
    assert normalized == "\n".join(["[00:01.00]x", "[00:02.00]x", "[00:03.00]c"])


+def test_normalize_preserves_input_order_for_equal_timestamps() -> None:
+    text = "\n".join(
+        [
+            "[00:00.00]first",
+            "[00:00.00]second",
+            "[00:00.00]third",
+            "[00:01.00]later",
+        ]
+    )
+
+    normalized = LRCData(text).to_normalized_text()
+
+    assert normalized == "\n".join(
+        ["[00:00.00]first", "[00:00.00]second", "[00:00.00]third", "[00:01.00]later"]
+    )
+
+
 def test_normalize_converts_unsynced_lines_and_removes_word_sync_tags() -> None:
    text = "\n".join(
        [
@@ -257,6 +274,21 @@ def test_to_plain_sorts_lines_by_timestamp_across_lines() -> None:
    assert plain == "\n".join(["early", "middle", "late"])


+def test_to_plain_preserves_input_order_for_equal_timestamps() -> None:
+    text = "\n".join(
+        [
+            "[00:00.00]first",
+            "[00:00.00]second",
+            "[00:00.00]third",
+            "[00:01.00]later",
+        ]
+    )
+
+    plain = LRCData(text).to_plain()
+
+    assert plain == "\n".join(["first", "second", "third", "later"])
+
+
 def test_to_plain_deduplicate_collapses_only_consecutive_equals() -> None:
    text = "\n".join(
        [
@@ -153,7 +153,7 @@ wheels = [

 [[package]]
 name = "lrx-cli"
-version = "0.6.3"
+version = "0.6.4"
 source = { editable = "." }
 dependencies = [
    { name = "cyclopts" },