-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathdivide_by_character.py
34 lines (31 loc) · 1.31 KB
/
divide_by_character.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
import os
OUTPUT_PATH = "raw-vocal-output"
METADATA_CSV_FILE = "meta.csv"
AUDIO_FORMAT = '.ogg'
csv_file = open(os.path.join(OUTPUT_PATH, METADATA_CSV_FILE), 'r', encoding='utf_8_sig')
for line in csv_file:
if line == "filename,character,content\n":
continue
assert line.count(',') == 2 or line.count(',') == 1
if line.count(',') != 2:
continue
filename, character, content = line[:-1].split(',') # [:-1] removes \n at the end of line
if character == '':
continue
character_path = os.path.join(OUTPUT_PATH, character)
if not os.path.exists(character_path):
os.mkdir(character_path)
original_voice_file_path = os.path.join(OUTPUT_PATH, filename)
if os.path.exists(original_voice_file_path):
os.rename(original_voice_file_path, os.path.join(character_path, filename))
character_directories = [i for i in os.listdir(OUTPUT_PATH) if os.path.isdir(os.path.join(OUTPUT_PATH, i))]
total_voice_count = 0
for i in character_directories:
character_voice_files = os.listdir(os.path.join(OUTPUT_PATH, i))
for file in character_voice_files:
assert file.endswith(AUDIO_FORMAT)
character_voice_count = len(character_voice_files)
total_voice_count += character_voice_count
print(i, character_voice_count)
print()
print('TOTAL:', total_voice_count)