#!/usr/bin/env bash
#
# Train a Stanza dependency parser on the UD_Swedish-diachronic treebank
# using a pretrained BERT model, and log the whole run to a timestamped
# file under logs/.
#
# Steps, in order:
#   1. python prepare-train-val-SILVER.py <language codes>
#   2. source scripts/config.sh
#   3. python -m stanza.utils.datasets.prepare_depparse_treebank
#   4. python -m stanza.utils.training.run_depparse
#   5. point logs/latest.txt at the new log file
#   6. python loss.py
#
# Every path below is relative, so run this from the directory that
# contains prepare-train-val-SILVER.py, loss.py, scripts/ and ud/.
set -euo pipefail

# Language codes passed to the data preparation script and embedded in
# the log file name.
LANGCODES=("sv")

# Defined once so that the log file name, the banner and the training
# command cannot drift apart. Lower-case names are used to reduce the
# chance of clashing with variables set by scripts/config.sh (sourced
# further down; its contents are not visible from this script).
bert_model="KBLab/bert-base-swedish-cased"
treebank="UD_Swedish-diachronic"

mkdir -p logs

timestamp=$(date +"%Y%m%d_%H%M%S")

# Join the language codes with underscores, e.g. ("sv" "da") -> "sv_da".
# The IFS change is confined to the command-substitution subshell.
LANG_JOINED=$(IFS=_; printf '%s' "${LANGCODES[*]}")

# The file name uses only the part of the model id after the last '/'.
LOGFILE="logs/log_${bert_model##*/}_${LANG_JOINED}_${timestamp}.txt"

# From here on, stdout and stderr are both shown on the terminal and
# appended to the log file.
exec > >(tee -a "$LOGFILE") 2>&1

echo "=== LOGFILE: $LOGFILE ==="
echo "Language codes: ${LANGCODES[*]}"
echo "Using pretrained model: ${bert_model}"
echo

# Step 1: build the train/validation data for the selected languages.
echo "Running: python prepare-train-val-SILVER.py ${LANGCODES[*]}"
python prepare-train-val-SILVER.py "${LANGCODES[@]}"

# Step 2: load the project configuration into this shell.
# NOTE(review): under `set -u` this aborts if config.sh reads an unset
# variable - confirm config.sh is safe to source in strict mode.
echo "Sourcing scripts/config.sh"
source scripts/config.sh

# Step 3: prepare the treebank for the dependency parser.
echo "Running stanza dataset preparation…"
python -m stanza.utils.datasets.prepare_depparse_treebank "${treebank}" \
  --gold

# Step 4: train the dependency parser with the BERT model and the
# additional silver training file.
echo "Running stanza dependency parser training…"
python -m stanza.utils.training.run_depparse "${treebank}" \
  --batch_size 32 \
  --dropout 0.33 \
  --use_bert \
  --bert_model "${bert_model}" \
  --silver_file "ud/${treebank}/sv_diachronic-ud-train-silver.conllu"

echo "DONE."
echo "Full log saved to: $LOGFILE"

# Step 5: refresh logs/latest.txt. The link target is the bare file name
# because the symlink lives in logs/ next to the log file itself.
# Because of `set -e`, this is only reached when every step above
# succeeded.
ln -sf "$(basename "$LOGFILE")" logs/latest.txt
echo "Symlink updated: logs/latest.txt → $(basename "$LOGFILE")"

# Step 6: post-processing. What loss.py reads is not visible from this
# script (presumably the log written above - verify).
python loss.py