From f505702dc7d311ef6bf960be536fa1b44b50791e Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E9=99=B3=E9=88=9E?= <jim60105@gmail.com>
Date: Sat, 26 Aug 2023 06:48:35 +0800
Subject: [PATCH 1/2] chore(writer): Join words without spaces for ja, zh

fix #248, fix #310
---
 whisperx/transcribe.py | 1 +
 whisperx/utils.py      | 6 +++++-
 2 files changed, 6 insertions(+), 1 deletion(-)

diff --git a/whisperx/transcribe.py b/whisperx/transcribe.py
index 6a2dcb6..fa400a3 100644
--- a/whisperx/transcribe.py
+++ b/whisperx/transcribe.py
@@ -213,6 +213,7 @@ def cli():
             results.append((result, input_audio_path))
     # >> Write
     for result, audio_path in results:
+        result["language"] = align_language
         writer(result, audio_path, writer_args)
 
 if __name__ == "__main__":
diff --git a/whisperx/utils.py b/whisperx/utils.py
index 86beea4..37792d3 100644
--- a/whisperx/utils.py
+++ b/whisperx/utils.py
@@ -123,6 +123,7 @@ TO_LANGUAGE_CODE = {
     "castilian": "es",
 }
 
+LANGUAGES_WITHOUT_SPACES = ["ja", "zh"]
 
 system_encoding = sys.getdefaultencoding()
 
@@ -283,7 +284,10 @@ class SubtitlesWriter(ResultWriter):
                 sstart, ssend, speaker = _[0]
                 subtitle_start = self.format_timestamp(sstart)
                 subtitle_end = self.format_timestamp(ssend)
-                subtitle_text = " ".join([word["word"] for word in subtitle])
+                if result["language"] in LANGUAGES_WITHOUT_SPACES:
+                    subtitle_text = "".join([word["word"] for word in subtitle])
+                else:
+                    subtitle_text = " ".join([word["word"] for word in subtitle])
                 has_timing = any(["start" in word for word in subtitle])
 
                 # add [$SPEAKER_ID]: to each subtitle if speaker is available

From 5223de2a417228f671524106b8bc79301176dd18 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E9=99=B3=E9=88=9E?= <jim60105@gmail.com>
Date: Sat, 26 Aug 2023 08:32:24 +0800
Subject: [PATCH 2/2] fix: UnboundLocalError: local variable 'align_language'
 referenced before assignment

---
 whisperx/transcribe.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/whisperx/transcribe.py b/whisperx/transcribe.py
index fa400a3..162eb0d 100644
--- a/whisperx/transcribe.py
+++ b/whisperx/transcribe.py
@@ -118,6 +118,7 @@ def cli():
                 f"{model_name} is an English-only model but receipted '{args['language']}'; using English instead."
             )
         args["language"] = "en"
+    align_language = args["language"] if args["language"] is not None else "en" # default to loading english if not specified
 
     temperature = args.pop("temperature")
     if (increment := args.pop("temperature_increment_on_fallback")) is not None:
@@ -174,7 +175,6 @@ def cli():
     if not no_align:
         tmp_results = results
         results = []
-        align_language = args["language"] if args["language"] is not None else "en" # default to loading english if not specified
         align_model, align_metadata = load_align_model(align_language, device, model_name=align_model)
         for result, audio_path in tmp_results:
             # >> Align