normalizing entries

Browse files

Files changed (3) hide show

prepare_model.py +86 -0
vctk_speakers.json → speakers-log.json +0 -0
speakers.md +18 -24

prepare_model.py ADDED Viewed

	@@ -0,0 +1,86 @@

+import ast
+import json
+import os
+import subprocess
+def generate_html_output(data, repository_path):
+    with open('speakers.md', 'a') as file:
+        for speaker_id, speaker_info in data.items():
+            out_path = f"{repository_path}/samples/{speaker_id}.wav"
+            age = speaker_info['age']
+            gender = speaker_info['gender']
+            if gender == 'F':
+                gender = 'female'
+            elif gender == "M":
+                gender = 'male'
+            accents = speaker_info['accents']
+            region = speaker_info['region']
+            file.write(f"<p>VCTK_{speaker_id}: {age} year old {gender}, {accents} accent ({region})<audio controls><source src=\"{out_path}\" type=\"audio/wav\"></audio> </p>\n")
+# Load the data from the provided dictionary
+data = {
+    "p225": {"age": 23, "gender": "F", "accents": "English", "region": "Southern England", "comments": ""},
+    "p228": {"age": 22, "gender": "F", "accents": "English", "region": "Southern England", "comments": ""},
+    "p229": {"age": 23, "gender": "F", "accents": "English", "region": "Southern England", "comments": ""},
+    "p230": {"age": 22, "gender": "F", "accents": "English", "region": "Stockton-on-tees", "comments": ""},
+    "p231": {"age": 23, "gender": "F", "accents": "English", "region": "Southern England", "comments": ""},
+    "p233": {"age": 23, "gender": "F", "accents": "English", "region": "Staffordshire", "comments": ""},
+    "p236": {"age": 23, "gender": "F", "accents": "English", "region": "Manchester", "comments": ""},
+    "p239": {"age": 22, "gender": "F", "accents": "English", "region": "Southwest England", "comments": ""},
+    "p240": {"age": 21, "gender": "F", "accents": "English", "region": "Southern England", "comments": ""},
+    "p244": {"age": 22, "gender": "F", "accents": "English", "region": "Manchester", "comments": ""},
+    "p250": {"age": 22, "gender": "F", "accents": "English", "region": "Southeast England", "comments": ""},
+    "p257": {"age": 24, "gender": "F", "accents": "English", "region": "Southern England", "comments": ""},
+    "p267": {"age": 23, "gender": "F", "accents": "English", "region": "Yorkshire", "comments": ""},
+    "p268": {"age": 23, "gender": "F", "accents": "English", "region": "Southern England", "comments": ""},
+    "p269": {"age": 20, "gender": "F", "accents": "English", "region": "Newcastle", "comments": ""},
+    "p276": {"age": 24, "gender": "F", "accents": "English", "region": "Oxford", "comments": ""},
+    "p277": {"age": 23, "gender": "F", "accents": "English", "region": "Northeast England", "comments": ""},
+    "p282": {"age": 23, "gender": "F", "accents": "English", "region": "Newcastle", "comments": ""}
+}
+# Convert the data to JSON format
+json_data = json.dumps(data, indent=2)
+# Save the JSON data to a file
+with open('speakers-log.json', 'w') as file:
+    file.write(json_data)
+# Run the TTS command to get the speaker indices
+command = "tts --model_path checkpoint_85000.pth --config_path config.json --list_speaker_idxs | grep -vE '^(\s*\||\s*>|\s*$)'"
+output = subprocess.check_output(command, shell=True, text=True)
+# Parse the JSON output into a Python dictionary
+speaker_indices = eval(output)
+# Load the speaker IDs from speakers.json
+with open('speakers-log.json', 'r') as file:
+    speaker_ids = json.load(file)
+# Create the speakers.md file
+with open('speakers.md', 'w') as file:
+    for speaker_idx in speaker_indices:
+        # Remove the 'VCTK_' prefix
+        speaker_id = speaker_idx.replace('VCTK_', '')
+        # Lookup the speaker ID in the loaded speaker IDs
+        if speaker_id in speaker_ids:
+            speaker_id_json = speaker_ids[speaker_id]
+        else:
+            continue
+        # # Generate the TTS command to create the audio file
+        # text = f"Hello, I am from {speaker_id_json['region']}. I hope that you will select my voice for your project. Thank you."
+        # # make samples directory if it doesn't exist
+        # if not os.path.exists("samples"):
+        #     os.makedirs("samples")
+        out_path = f"samples/{speaker_id}.wav"
+        tts_command = f"tts --text \"{text}\" --model_path checkpoint_85000.pth --language_idx en --config_path config.json --speaker_idx \"VCTK_{speaker_id}\" --out_path {out_path}"
+        Execute the TTS command
+        os.system(tts_command)
+        # Write the speaker information to the speakers.md file
+        generate_html_output({speaker_id: speaker_id_json}, "https://huggingface.co/voices/VCTK_European_English_Females/resolve/main")

vctk_speakers.json → speakers-log.json RENAMED Viewed

File without changes

speakers.md CHANGED Viewed

@@ -1,24 +1,18 @@
- <audio controls>
-  <source src="horse.ogg" type="audio/ogg">
-  <source src="horse.mp3" type="audio/mpeg">
-Your browser does not support the audio element.
-</audio>
-[p225](samples/p225.wav) Age 23 Gender F Accents English Region Southern England Comments
-[p228](samples/p228.wav) Age 22 Gender F Accents English Region Southern England Comments
-[p229](samples/p229.wav) Age 23 Gender F Accents English Region Southern England Comments
-[p230](samples/p230.wav) Age 22 Gender F Accents English Region Stockton-on-tees Comments
-[p231](samples/p231.wav) Age 23 Gender F Accents English Region Southern England Comments
-[p233](samples/p233.wav) Age 23 Gender F Accents English Region Staffordshire Comments
-[p236](samples/p236.wav) Age 23 Gender F Accents English Region Manchester Comments
-[p239](samples/p239.wav) Age 22 Gender F Accents English Region Southwest England Comments
-[p240](samples/p240.wav) Age 21 Gender F Accents English Region Southern England Comments
-[p244](samples/p244.wav) Age 22 Gender F Accents English Region Manchester Comments
-[p250](samples/p250.wav) Age 22 Gender F Accents English Region Southeast England Comments
-[p257](samples/p257.wav) Age 24 Gender F Accents English Region Southern England Comments
-[p267](samples/p267.wav) Age 23 Gender F Accents English Region Yorkshire Comments
-[p268](samples/p268.wav) Age 23 Gender F Accents English Region Southern England Comments
-[p269](samples/p269.wav) Age 20 Gender F Accents English Region Newcastle Comments
-[p276](samples/p276.wav) Age 24 Gender F Accents English Region Oxford Comments
-[p277](samples/p277.wav) Age 23 Gender F Accents English Region Northeast England Comments
-[p282](samples/p282.wav) Age 23 Gender F Accents English Region Newcastle Comments

+<p>VCTK_p225: 23 year old female, English accent (Southern England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p225.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p228: 22 year old female, English accent (Southern England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p228.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p229: 23 year old female, English accent (Southern England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p229.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p230: 22 year old female, English accent (Stockton-on-tees)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p230.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p231: 23 year old female, English accent (Southern England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p231.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p233: 23 year old female, English accent (Staffordshire)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p233.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p236: 23 year old female, English accent (Manchester)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p236.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p239: 22 year old female, English accent (Southwest England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p239.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p240: 21 year old female, English accent (Southern England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p240.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p244: 22 year old female, English accent (Manchester)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p244.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p250: 22 year old female, English accent (Southeast England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p250.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p257: 24 year old female, English accent (Southern England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p257.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p267: 23 year old female, English accent (Yorkshire)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p267.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p268: 23 year old female, English accent (Southern England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p268.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p269: 20 year old female, English accent (Newcastle)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p269.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p276: 24 year old female, English accent (Oxford)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p276.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p277: 23 year old female, English accent (Northeast England)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p277.wav" type="audio/wav"></audio> </p>
+<p>VCTK_p282: 23 year old female, English accent (Newcastle)<audio controls><source src="https://huggingface.co/voices/VCTK_European_English_Females/resolve/main/samples/p282.wav" type="audio/wav"></audio> </p>