2 年之前 · 9a97a9b254
--- a/whisper/transcribe.py
+++ b/whisper/transcribe.py
@@ -10,7 +10,7 @@ import tqdm
 
															 from .audio import SAMPLE_RATE, N_FRAMES, HOP_LENGTH, pad_or_trim, log_mel_spectrogram
														
 
															 from .decoding import DecodingOptions, DecodingResult
														
 
															 from .tokenizer import LANGUAGES, TO_LANGUAGE_CODE, get_tokenizer
														
 
															-from .utils import exact_div, format_timestamp, make_safe, optional_int, optional_float, str2bool, get_writer
														
 
															+from .utils import exact_div, format_timestamp, make_safe, optional_int, optional_float, str2bool, get_writer, remove_leading_spaces
														
 
															 if TYPE_CHECKING:
														
 
															     from .model import Whisper
														
@@ -250,11 +250,16 @@ def transcribe(
 
															             pbar.update(min(num_frames, seek) - previous_seek_value)
														
 
															             previous_seek_value = seek
														
 
															-    return dict(
														
 
															-        text=tokenizer.decode(all_tokens[len(initial_prompt_tokens):]),
														
 
															-        segments=all_segments,
														
 
															-        language=language
														
 
															-    )
														
 
															+            result = dict(
														
 
															+                text=tokenizer.decode(all_tokens[len(initial_prompt_tokens):]),
														
 
															+                segments=all_segments,
														
 
															+                language=language
														
 
															+            )
														
 
															+
														
 
															+            if decode_options["language"] == "ko":
														
 
															+                result = remove_leading_spaces(result)
														
 
															+
														
 
															+    return result
														
 
															 def cli():
														
--- a/whisper/utils.py
+++ b/whisper/utils.py
@@ -161,3 +161,20 @@ def get_writer(output_format: str, output_dir: str) -> Callable[[dict, TextIO],
 
															     return writers[output_format](output_dir)
														
 
															+
														
 
															+def remove_leading_spaces(
														
 
															+        result: dict
														
 
															+) -> dict:
														
 
															+    """
														
 
															+    Removes unwanted leading spaces from the main 'text' field and each 'text' field in the 'segments' list.
														
 
															+    This function is currently applied specifically to some languages to correct formatting issues.
														
 
															+    Currently monitored language: Korean
														
 
															+    """
														
 
															+    if result['text'].startswith(' '):
														
 
															+        result['text'] = result['text'][1:]
														
 
															+
														
 
															+    for segment in result['segments']:
														
 
															+        if segment['text'].startswith(' '):
														
 
															+            segment['text'] = segment['text'][1:]
														
 
															+
														
 
															+    return result