ryanlinjui commited on
Commit
bd05f58
·
1 Parent(s): 6377b99

Add application file

Browse files
Files changed (4) hide show
  1. .gitignore +15 -0
  2. app.py +40 -0
  3. pyproject.toml +16 -0
  4. taiko.py +104 -0
.gitignore ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # python cache
2
+ __pycache__
3
+
4
+ # poetry
5
+ .venv
6
+ poetry.lock
7
+
8
+ # gradio
9
+ flagged
10
+
11
+ # test
12
+ *.wav
13
+ *.ogg
14
+ *.json
15
+ *.tja
app.py ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import json
2
+ import gradio as gr
3
+ import numpy as np
4
+
5
+ from taiko import (
6
+ preprocess,
7
+ generate_taiko_wav,
8
+ COURSE
9
+ )
10
+
11
+ def handle(chart_path, music_path):
12
+ data = json.loads(open(chart_path, "r").read())
13
+
14
+ if len(data["data"]) < 0 and len(data["data"]) > 5:
15
+ raise("Issue occur: Json data")
16
+
17
+ for d in data["data"]:
18
+ chart = preprocess(d["chart"])
19
+ audio = generate_taiko_wav(chart, music_path)
20
+ COURSE[d["course"]]["audio"] = audio
21
+
22
+ c = 2
23
+ if music_path is None: c = 1
24
+
25
+ return \
26
+ (COURSE[0]["audio"].frame_rate * c, np.array(COURSE[0]["audio"].get_array_of_samples())), \
27
+ (COURSE[1]["audio"].frame_rate * c, np.array(COURSE[1]["audio"].get_array_of_samples())), \
28
+ (COURSE[2]["audio"].frame_rate * c, np.array(COURSE[2]["audio"].get_array_of_samples())), \
29
+ (COURSE[3]["audio"].frame_rate * c, np.array(COURSE[3]["audio"].get_array_of_samples())), \
30
+ (COURSE[4]["audio"].frame_rate * c, np.array(COURSE[4]["audio"].get_array_of_samples()))
31
+
32
+ if __name__ == "__main__":
33
+ inputs = [
34
+ gr.File(label="太鼓達人譜面Json/Taiko Chart Json Data"),
35
+ gr.File(label="譜面音樂/Chart Music (Optional)")
36
+ ]
37
+ outputs = [gr.Audio(label=course["label"]) for course in COURSE]
38
+
39
+ demo = gr.Interface(fn=handle, inputs=inputs, outputs=outputs, title="`程設二作業HW0105 / Taiko Music Generator")
40
+ demo.launch(share=True)
pyproject.toml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [tool.poetry]
2
+ name = "taiko-music-generator"
3
+ version = "0.1.0"
4
+ description = ""
5
+ authors = ["ryanlinjui <ryanlinjui@gmail.com>"]
6
+ readme = "README.md"
7
+ packages = [{include = "taiko_music_generator"}]
8
+
9
+ [tool.poetry.dependencies]
10
+ python = "^3.10"
11
+ gradio = "^4.19.2"
12
+
13
+
14
+ [build-system]
15
+ requires = ["poetry-core"]
16
+ build-backend = "poetry.core.masonry.api"
taiko.py ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from pydub import AudioSegment
2
+ import numpy as np
3
+
4
+ DON_WAV = "./Arcade - Taiko no Tatsujin 2020 Version - Common Sound Effects/Don.wav"
5
+ KATSU_WAV = "./Arcade - Taiko no Tatsujin 2020 Version - Common Sound Effects/Katsu.wav"
6
+ BALLOON_BANG_WAV = "./Arcade - Taiko no Tatsujin 2020 Version - Common Sound Effects/Balloon.wav"
7
+
8
+ COURSE = [
9
+ {
10
+ "audio": AudioSegment.empty(),
11
+ "label": "かんたん/梅花(簡單)/Easy",
12
+ },
13
+ {
14
+ "audio": AudioSegment.empty(),
15
+ "label": "ふつう/竹子(普通)/Normal",
16
+ },
17
+ {
18
+ "audio": AudioSegment.empty(),
19
+ "label": "むずかしい/樹(困難)/Hard",
20
+ },
21
+ {
22
+ "audio": AudioSegment.empty(),
23
+ "label": "おに/魔王/Oni",
24
+ },
25
+ {
26
+ "audio": AudioSegment.empty(),
27
+ "label": "裏/Edit",
28
+ }
29
+ ]
30
+
31
+ HIT_PER_SEC = 30
32
+
33
+ def preprocess(data:list, offset:float=0):
34
+ chart = []
35
+ for m in data:
36
+ if m[0] in {1, 3}: # Don or Big Don
37
+ chart.append((DON_WAV, offset + m[1]))
38
+ elif m[0] in {2, 4}: # Katsu or Big Katsu
39
+ chart.append((KATSU_WAV, offset + m[1]))
40
+ elif m[0] in {5, 6}: # Drum Roll or Big Drum Roll
41
+ count = m[1]
42
+ while count < m[2]:
43
+ chart.append((DON_WAV, offset + count))
44
+ count += (1 / HIT_PER_SEC)
45
+
46
+ elif m[0] == 7: # Balloon
47
+ count = m[1]
48
+ balloon_count = 0
49
+ while count < m[2] and balloon_count < m[3]:
50
+ chart.append((DON_WAV, offset + count))
51
+ count += (1 / HIT_PER_SEC)
52
+ balloon_count += 1
53
+
54
+ if balloon_count >= m[3]:
55
+ chart.append((BALLOON_BANG_WAV, offset + m[1]))
56
+ else:
57
+ raise ValueError("Your json file has some problems.")
58
+
59
+ return chart
60
+
61
+ def resize_audio(file_path:str, target_duration:int, target_amplitude:int):
62
+ audio = AudioSegment.from_wav(file_path)
63
+
64
+ audio = audio[:target_duration * 1000]
65
+
66
+ if file_path == DON_WAV or file_path == BALLOON_BANG_WAV:
67
+ return audio
68
+
69
+ audio = audio - (audio.dBFS - target_amplitude)
70
+ return audio
71
+
72
+ def generate_taiko_wav(chart: list, music:str=None):
73
+ max_length = int(max([start_time + len(resize_audio(file_path, target_duration=1, target_amplitude=-20))
74
+ for file_path, start_time in chart]))
75
+
76
+ mixed_audio = np.zeros(max_length)
77
+
78
+ for file_path, start_time in chart:
79
+ audio = resize_audio(file_path, target_duration=0.5, target_amplitude=-20)
80
+ audio_array = np.array(audio.get_array_of_samples())
81
+
82
+ start_index = int(start_time * audio.frame_rate)
83
+ end_index = start_index + len(audio_array)
84
+
85
+ if len(mixed_audio) < end_index:
86
+ mixed_audio = np.pad(mixed_audio, (0, end_index - len(mixed_audio)))
87
+
88
+ mixed_audio[start_index:end_index] += audio_array
89
+
90
+ mixed_audio = np.clip(mixed_audio, -32768, 32767)
91
+
92
+ mixed_audio_segment = AudioSegment(
93
+ mixed_audio.astype(np.int16).tobytes(),
94
+ frame_rate=audio.frame_rate,
95
+ sample_width=2,
96
+ channels=1
97
+ )
98
+
99
+ if music is None:
100
+ return mixed_audio_segment
101
+ else:
102
+ background_music = AudioSegment.from_ogg(music)
103
+ mixed_audio_with_bg = background_music.overlay(mixed_audio_segment)
104
+ return mixed_audio_with_bg