Spaces:

LichtLiu
/

Groq-GPT

Sleeping

App Files Community

LichtLiu committed on Oct 6

Commit

81766a7

•

1 Parent(s): 0d230cc

update audio split

Browse files

Files changed (2) hide show

app.py +18 -28
hell 3.10.15 +95 -0

app.py CHANGED Viewed

@@ -46,42 +46,32 @@ vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan").to(devic
 embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
 speaker_embeddings = torch.tensor(embeddings_dataset[7306]["xvector"]).unsqueeze(0).to(device)
-def split_text_into_chunks(text, max_length):
-    # Split text into chunks that fit within the maximum token limit
-    words = text.split()  # Split the text into words
-    chunks = []
-    current_chunk = []
-    for word in words:
-        if len(current_chunk) + len(word) + 1 <= max_length:  # +1 accounts for space between words
-            current_chunk.append(word)
-        else:
-            # Join the current chunk into a string and append it to the list of chunks
-            chunks.append(' '.join(current_chunk))
-            # Start a new chunk
-            current_chunk = [word]
-    # Append the last chunk
-    if current_chunk:
-        chunks.append(' '.join(current_chunk))
-    return chunks
 def textToSpeech(expression):
-    # Split the input text into smaller chunks if necessary
-    max_token_limit = 600  # Set the token limit for your model
-    chunks = split_text_into_chunks(expression, max_token_limit)
     # Initialize an empty list to store the generated speech chunks
     audio_chunks = []
-    # Process each chunk through the model
-    for chunk in chunks:
-        inputs = processor(text=chunk, return_tensors="pt").to(device)
-        speech = model.generate_speech(inputs["input_ids"], speaker_embeddings, vocoder=vocoder)
         audio_chunks.append(speech.cpu().numpy())
-    # Concatenate the audio chunks into a single file
     final_audio = np.concatenate(audio_chunks)
     # Get the current date and time for unique file naming

 embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
 speaker_embeddings = torch.tensor(embeddings_dataset[7306]["xvector"]).unsqueeze(0).to(device)
+def split_text_into_chunks(text, processor, max_length):
+    # Tokenize the input text
+    tokens = processor(text, return_tensors="pt", truncation=False).input_ids[0]
+    # Split tokens into chunks
+    chunked_tokens = [tokens[i:i + max_length] for i in range(0, len(tokens), max_length)]
+    return chunked_tokens
 def textToSpeech(expression):
+    # Set the maximum token limit for your model
+    max_token_limit = 600  # The maximum token length the model can handle
+    # Tokenize and split the text into chunks based on tokens
+    token_chunks = split_text_into_chunks(expression, processor, max_token_limit)
     # Initialize an empty list to store the generated speech chunks
     audio_chunks = []
+    # Process each token chunk through the model
+    for token_chunk in token_chunks:
+        # Generate speech from the token chunk
+        speech = model.generate_speech(token_chunk.unsqueeze(0), speaker_embeddings, vocoder=vocoder)
         audio_chunks.append(speech.cpu().numpy())
+    # Concatenate the audio chunks into a single array
     final_audio = np.concatenate(audio_chunks)
     # Get the current date and time for unique file naming

hell 3.10.15 ADDED Viewed

	@@ -0,0 +1,95 @@

+[33mcommit b8c7a08b2bbcfdee152786b6a7212a047c50fc85[m[33m ([m[1;36mHEAD -> [m[1;32mmain[m[33m, [m[1;31morigin/main[m[33m, [m[1;31morigin/HEAD[m[33m)[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 14:21:55 2024 +0200
+    state
+[33mcommit 469ea347d5b8ea6d5404d7e88c4b4ab3f4abea07[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 14:15:30 2024 +0200
+    update history
+[33mcommit 3665a4d6ca95c3a000e58ce1cb8a96fd34ecd9ce[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 14:11:30 2024 +0200
+    print
+[33mcommit 96ad9b6e84215b238a689f0a5e4d33971114a2d7[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 14:08:38 2024 +0200
+    update history return
+[33mcommit 46e5c3d007799e62d711648538998e777fabca81[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 14:02:18 2024 +0200
+    delete history
+[33mcommit a997e436dc12c9d1c0824216b9c274ffee7371f8[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 13:53:47 2024 +0200
+    update history
+[33mcommit a743d0417f8168714ec629191b0d0c228c5b236e[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 13:51:41 2024 +0200
+    update
+[33mcommit 2c12fc659c9e0f58f725b751b244de305ef31423[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 13:48:20 2024 +0200
+    update
+[33mcommit c1aaa3ef2578af41e237a507c82ba8810b23129f[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 13:45:29 2024 +0200
+    update new_history
+[33mcommit cbc1d5399d3c2b2ea2385503a96194c2aea7e5c7[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 13:41:12 2024 +0200
+    update
+[33mcommit 5605340f569f7de28844f49d7c8216159326240a[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Oct 6 13:26:52 2024 +0200
+    update 20241006
+[33mcommit 9819d723446298f3846c4eca55c081d1ab6083a4[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Mon Sep 30 16:22:08 2024 +0200
+    update markdown
+[33mcommit 60c04ae96546d672b6804699cd99623e15dea0b1[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Mon Sep 30 15:24:05 2024 +0200
+    call print
+[33mcommit 08681846ade0af0fa2323113c1416fc0c2a5e345[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Mon Sep 30 15:06:04 2024 +0200
+    update
+[33mcommit d99be9e3ac9f8e8148f3da866f94ae539e29d363[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Mon Sep 30 14:47:27 2024 +0200
+    edit prompt
+[33mcommit 23136538c718c9a7683a5f9f729790050986066b[m[33m ([m[1;34mgrafted[m[33m)[m
+Author: LichtLiu <LichtLiu@users.noreply.huggingface.co>
+Date:   Sun Sep 29 19:22:47 2024 +0200
+    update