#! /bin/bash -eu
# Last edited on 2026-04-21 18:34:26 by stolfi

# Driver for a line-breaking experiment.  For each token-stream type (0, 1):
#   1. generate_sample_text.py writes a token stream to
#        ${out_dir}/text_<type>_<min_wlen>_<max_wlen>.txt
#   2. for each algorithm (TLA, SLA), line_breaking_algorithm.py reads that
#      stream and writes
#        ${out_dir}/text_<type>_<min_wlen>_<max_wlen>_<alg>_<max_tlen>.txt
#   3. analyze_word_breaks.py reads the broken text and writes the matching
#        ..._<alg>_<max_tlen>_stats.txt
# Finally make_comparative_plots.sh is run with the three numeric parameters.
# All progress messages go to stderr.

# Re-assert the strict-mode flags from the shebang line: they are ignored when
# the script is started as `bash <script>` instead of being executed directly.
set -eu

# Directory that receives every generated file.
out_dir="res"
mkdir -p -- "${out_dir}"

# Secondary working directory; this script only creates it and purges stale
# text_* files from it.
ex_dir="work/VoynichNinja/005"
mkdir -p -- "${ex_dir}"

# Remove the results of previous runs.  The `:?` guards abort the script
# rather than expanding to `/text_*` if a directory variable is ever empty.
rm -f -- "${out_dir:?}"/text_* "${ex_dir:?}"/text_*

# Parameters passed to the helper programs and embedded in the file names.
# NOTE(review): presumably minimum/maximum word length and maximum text-line
# length -- confirm against the helper scripts.
min_wlen=2
max_wlen=7
max_tlen=60

for text_type in 0 1; do
  tok_stream_prefix="text_${text_type}_${min_wlen}_${max_wlen}"
  tok_stream_file="${out_dir}/${tok_stream_prefix}.txt"

  echo "generating token stream of type ${text_type}..." 1>&2
  generate_sample_text.py "${text_type}" "${min_wlen}" "${max_wlen}" \
    > "${tok_stream_file}"

  for alg in TLA SLA; do
    just_text_prefix="${tok_stream_prefix}_${alg}_${max_tlen}"
    just_text_file="${out_dir}/${just_text_prefix}.txt"

    echo "breaking lines with ${alg}..." 1>&2
    line_breaking_algorithm.py "${alg}" "${max_tlen}" \
      < "${tok_stream_file}" \
      > "${just_text_file}"

    stats_out_prefix="${just_text_prefix}_stats"
    echo "collecting statistcs ..." 1>&2
    analyze_word_breaks.py \
      < "${just_text_file}" \
      > "${out_dir}/${stats_out_prefix}.txt"
  done

done

# NOTE(review): the plotting script is not told where the result files are;
# presumably it reads them from "res" itself -- keep it in sync if out_dir
# is ever changed.
echo "plotting ..." 1>&2
make_comparative_plots.sh \
  "${min_wlen}" "${max_wlen}" "${max_tlen}"
echo "done." 1>&2
