Spaces:
Sleeping
Sleeping
File size: 272 Bytes
6fc683c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 |
# Encode every split/language file of a parallel corpus with spm_encode.
#
# Usage: <this-script> INPUT_DIR OUTPUT_DIR SPM_MODEL
#   INPUT_DIR   directory holding {train,valid,test}.{en,de}
#   OUTPUT_DIR  directory that receives the encoded files under the same
#               names (created if it does not exist)
#   SPM_MODEL   model file handed to `spm_encode --model=`
#
# -e: stop at the first failing command; -x: trace each command as it runs.
set -ex

# ${N:?msg} aborts with a readable message when an argument is missing or
# empty, instead of failing later inside mkdir with an obscure error.
input_dir=${1:?usage: INPUT_DIR OUTPUT_DIR SPM_MODEL}
output_dir=${2:?usage: INPUT_DIR OUTPUT_DIR SPM_MODEL}
SPM_MODEL=${3:?usage: INPUT_DIR OUTPUT_DIR SPM_MODEL}

mkdir -p -- "$output_dir"

for split in train valid test; do
  for lang in en de; do
    # Feed the input by redirection rather than `cat file | ...`: a missing
    # or unreadable input then fails this command (and, under `set -e`, the
    # whole script) instead of silently producing an empty output file.
    # All expansions are quoted so paths containing spaces or glob
    # characters are passed through intact.
    spm_encode --model="$SPM_MODEL" --output_format=piece \
      < "$input_dir/$split.$lang" \
      > "$output_dir/$split.$lang"
  done
done