split_csv/split-csv.sh
2024-07-05 14:54:39 +00:00

11 lines
837 B
Bash
Executable file

#!/bin/bash
#
# Split a pipe-delimited metadata file into shuffled validation / test /
# training filelists, plus variants that carry a pitch-file column.
#
# Usage: split-csv.sh [METADATA_CSV]
#   METADATA_CSV  input file (default: metadata.csv in the current directory)
#
# Files written to the current directory (<id> is column 1 and <text> is
# column 3 of the input; column 2 is discarded):
#   metadata-cut.csv              input with its 2nd column removed
#   ljs_audio_text.txt            wavs/<id>.wav|<text>
#   ljs_audio_text-shuf.txt       the same rows in random order
#   ljs_audio_text_val.txt        shuffled rows 1-50
#   ljs_audio_text_test.txt       shuffled rows 51-200
#   ljs_audio_text_train_v3.txt   shuffled rows 201-end
#   ljs_audio_pitch_text_{val,test,train_v3}.txt
#                                 wavs/<id>.wav|pitch/<id>.pt|<text>
#
# Requires GNU coreutils (cut --complement, shuf).

# Abort on the first failing step so a broken stage cannot silently feed
# empty data into the later ones.
set -euo pipefail

readonly VAL_ROWS=50    # rows 1-50 of the shuffle
readonly TEST_ROWS=150  # rows 51-200 of the shuffle

# Print a message to stderr and exit with status 1.
die() {
  printf '%s: %s\n' "${0##*/}" "$*" >&2
  exit 1
}

# Copy rows FIRST..LAST (1-based, inclusive) of SRC into DST.
# LAST may be '$' to mean "through the last row".
copy_rows() {
  local first=$1 last=$2 src=$3 dst=$4
  sed -n "${first},${last}p" "$src" > "$dst"
}

# Rewrite "wavs/<id>.wav|<text>" rows of SRC as
# "wavs/<id>.wav|pitch/<id>.pt|<text>" rows in DST.
add_pitch_column() {
  local src=$1 dst=$2
  # The id is recovered by stripping the "wavs/" prefix and ".wav" suffix
  # rather than by a fixed-width substr, so ids of any length work.
  # '$1 != ""' is a string comparison: a numeric-looking id such as "0"
  # is kept, whereas a bare '$1' pattern would treat it as false.
  awk -F '|' -v OFS='|' '
    $1 != "" {
      id = $1
      sub(/^wavs\//, "", id)
      sub(/\.wav$/, "", id)
      print $1, "pitch/" id ".pt", $2
    }
  ' "$src" > "$dst"
}

main() {
  local metadata=${1:-metadata.csv}
  [[ -f "$metadata" && -r "$metadata" ]] \
    || die "cannot read input file: $metadata"

  # Drop the 2nd column, then turn each remaining row into
  # "wavs/<id>.wav|<text>", skipping rows whose first field is empty.
  cut --complement -f 2 -d '|' -- "$metadata" > metadata-cut.csv
  awk -F '|' -v OFS='|' '$1 != "" { print "wavs/" $1 ".wav", $2 }' \
    metadata-cut.csv > ljs_audio_text.txt

  shuf ljs_audio_text.txt > ljs_audio_text-shuf.txt

  local total
  local held_out=$((VAL_ROWS + TEST_ROWS))
  total=$(wc -l < ljs_audio_text-shuf.txt)
  if (( total <= held_out )); then
    printf '%s: warning: only %d rows; the training split will be empty\n' \
      "${0##*/}" "$total" >&2
  fi

  copy_rows 1 "$VAL_ROWS" \
    ljs_audio_text-shuf.txt ljs_audio_text_val.txt
  copy_rows "$((VAL_ROWS + 1))" "$held_out" \
    ljs_audio_text-shuf.txt ljs_audio_text_test.txt
  copy_rows "$((held_out + 1))" '$' \
    ljs_audio_text-shuf.txt ljs_audio_text_train_v3.txt

  local split
  for split in val test train_v3; do
    add_pitch_column \
      "ljs_audio_text_${split}.txt" "ljs_audio_pitch_text_${split}.txt"
  done
}

main "$@"