You need to install the additional `train` extra.
pip install -U 'pilota[ja-line,train] @ git+https://github.com/megagonlabs/pilota'
- Needed corpus
    - asdc
    - (optional, internal only) `scud_internal`
OUTPUT=/path/to/output
make -j1 -f ./train.mk \
OUTPUT="${OUTPUT}" \
T5BASE=megagonlabs/t5-base-japanese-web-8k \
BATCH=100 BATCH_DEV=100 EPOCH=20 IN_LEN=128 OUT_LEN=64 BATCH_PRED=100 \
all
- Needed corpus
OUTPUT=/path/to/output
make -j1 -f ./train.mk \
OUTPUT="${OUTPUT}" \
T5BASE=megagonlabs/t5-base-japanese-web-8k \
BATCH=86 BATCH_DEV=112 EPOCH=20 IN_LEN=128 OUT_LEN=64 BATCH_PRED=120 JALAN=1 \
all
- Needed corpus
OUTPUT=/path/to/output
make -j1 -f ./train.mk \
OUTPUT="${OUTPUT}" \
T5BASE=megagonlabs/t5-base-japanese-web-8k \
BATCH=86 BATCH_DEV=112 EPOCH=20 IN_LEN=128 OUT_LEN=64 BATCH_PRED=120 SCUD2QUERY=1 \
all