work in progress

This commit is contained in:
三洋三洋
2024-04-12 03:20:04 +00:00
parent 1538cb73f8
commit 7d1d8ddd77
2 changed files with 3 additions and 3 deletions

View File

@@ -96,7 +96,7 @@ if __name__ == '__main__':
collate_fn_with_tokenizer = partial(collate_fn, tokenizer=tokenizer)
# model = TexTeller()
-model = TexTeller.from_pretrained('/home/lhy/code/TexTeller/src/models/ocr_model/model/ckpt')
+model = TexTeller.from_pretrained('/home/lhy/code/TexTeller/src/models/ocr_model/train/train_result/TexTellerv3/checkpoint-440000')
# ================= debug =======================
# foo = train_dataset[:50]

View File

@@ -1,8 +1,8 @@
#!/usr/bin/env bash
set -exu
-# export CHECKPOINT_DIR="/home/lhy/code/TexTeller/src/models/ocr_model/model/ckpt"
-export CHECKPOINT_DIR="default"
+export CHECKPOINT_DIR="/home/lhy/code/TexTeller/src/models/ocr_model/train/train_result/TexTellerv3/checkpoint-460000"
+# export CHECKPOINT_DIR="default"
export TOKENIZER_DIR="/home/lhy/code/TexTeller/src/models/tokenizer/roberta-tokenizer-7Mformulas"
export USE_CUDA=True # True or False (case-sensitive)
export NUM_BEAM=3