Spaces:

mantrakp
/

aai

Runtime error

App Files Files Community

barreloflube committed on Sep 20, 2024

Commit

7de38d8

1 Parent(s): 11e2df6

Refactor code to remove unused function and commented-out code

Browse files

Files changed (1) hide show

tabs/audios/events.py +36 -35

tabs/audios/events.py CHANGED Viewed

@@ -22,46 +22,47 @@ def create_temp_file():
 def assign_language_tags(text):
-    # Process the text
-    # based on the language assign <|zh|><|en|><|jp|><|yue|><|ko|> for Chinese/English/Japanese/Cantonese/Korean
-    # at the start of the text for that language
-    # e.g. input: 你好 Hello こんにちは 你好 안녕하세요
-    # output: <|zh|>你好<|en|>Hello<|jp|>こんにちは<|yue|>你好<|ko|>안녕하세요
-    # Define language patterns
-    patterns = {
-        'zh': r'[\u4e00-\u9fff]+',  # Chinese characters
-        'en': r'[a-zA-Z]+',         # English letters
-        'jp': r'[\u3040-\u30ff\u31f0-\u31ff]+',  # Japanese characters
-        'ko': r'[\uac00-\ud7a3]+',  # Korean characters
-    }
-    # Find all matches
-    matches = []
-    for lang, pattern in patterns.items():
-        for match in re.finditer(pattern, text):
-            matches.append((match.start(), match.end(), lang, match.group()))
-    # Sort matches by start position
-    matches.sort(key=lambda x: x[0])
-    # Build the result string
-    result = []
-    last_end = 0
-    zh_count = 0
-    for start, end, lang, content in matches:
-        if start > last_end:
-            result.append(text[last_end:start])
-        if lang == 'zh':
-            zh_count += 1
-            if zh_count > 1:
-                lang = 'yue'
-        result.append(f'<|{lang}|>{content}')
-        last_end = end
-    if last_end < len(text):
-        result.append(text[last_end:])
-    return ''.join(result)
 def update_mode(mode, sft_speaker, speaker_audio, voice_instructions):

 def assign_language_tags(text):
+    return text
+    # # Process the text
+    # # based on the language assign <|zh|><|en|><|jp|><|yue|><|ko|> for Chinese/English/Japanese/Cantonese/Korean
+    # # at the start of the text for that language
+    # # e.g. input: 你好 Hello こんにちは 你好 안녕하세요
+    # # output: <|zh|>你好<|en|>Hello<|jp|>こんにちは<|yue|>你好<|ko|>안녕하세요
+    # # Define language patterns
+    # patterns = {
+    #     'zh': r'[\u4e00-\u9fff]+',  # Chinese characters
+    #     'en': r'[a-zA-Z]+',         # English letters
+    #     'jp': r'[\u3040-\u30ff\u31f0-\u31ff]+',  # Japanese characters
+    #     'ko': r'[\uac00-\ud7a3]+',  # Korean characters
+    # }
+    # # Find all matches
+    # matches = []
+    # for lang, pattern in patterns.items():
+    #     for match in re.finditer(pattern, text):
+    #         matches.append((match.start(), match.end(), lang, match.group()))
+    # # Sort matches by start position
+    # matches.sort(key=lambda x: x[0])
+    # # Build the result string
+    # result = []
+    # last_end = 0
+    # zh_count = 0
+    # for start, end, lang, content in matches:
+    #     if start > last_end:
+    #         result.append(text[last_end:start])
+    #     if lang == 'zh':
+    #         zh_count += 1
+    #         if zh_count > 1:
+    #             lang = 'yue'
+    #     result.append(f'<|{lang}|>{content}')
+    #     last_end = end
+    # if last_end < len(text):
+    #     result.append(text[last_end:])
+    # return ''.join(result)
 def update_mode(mode, sft_speaker, speaker_audio, voice_instructions):