Spaces:
Sleeping
Sleeping
File size: 1,319 Bytes
6fc683c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 |
#!/usr/bin/env bash
#
# Prepare the variables used by the rest of this script, which runs
# src/inference/rerank_main.py and then misc/dpr/format_and_evaluate.py.
#
# Usage:
#   <script> [MODEL_NAME_OR_PATH] [RERANK_IN_PATH] [SPLIT] [--extra-flag ...]
#
# Positional arguments are consumed left to right until the first argument
# that starts with "--" (or until they run out). Whatever remains in "$@" is
# left untouched for the commands further down.
#
# Environment:
#   OUTPUT_DIR  output directory; defaults to MODEL_NAME_OR_PATH when unset/empty
#   DATA_DIR    data directory; defaults to "${DIR}/data/dpr/" when unset/empty
set -x
set -euo pipefail

# Directory two levels above the one that contains this script.
DIR="$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" && cd ../../ && pwd)"
printf 'working directory: %s\n' "${DIR}"

MODEL_NAME_OR_PATH=""
RERANK_IN_PATH=""
SPLIT="nq_dev"

# Fill the positional slots in order. Stop at the first "--flag" so that it and
# everything after it stay in "$@".
for positional in MODEL_NAME_OR_PATH RERANK_IN_PATH SPLIT; do
  if [[ $# -eq 0 || "$1" == "--"* ]]; then
    break
  fi
  printf -v "${positional}" '%s' "$1"
  shift
done

# ${VAR:-default} covers both "unset" and "set but empty", and is safe under -u.
OUTPUT_DIR="${OUTPUT_DIR:-${MODEL_NAME_OR_PATH}}"
DATA_DIR="${DATA_DIR:-${DIR}/data/dpr/}"

# Without this check an empty OUTPUT_DIR only surfaces as an opaque
# `mkdir -p ""` failure; report the real cause instead (same exit status).
if [[ -z "${OUTPUT_DIR}" ]]; then
  printf 'error: no output directory: pass MODEL_NAME_OR_PATH or set OUTPUT_DIR\n' >&2
  printf 'usage: %s [MODEL_NAME_OR_PATH] [RERANK_IN_PATH] [SPLIT] [--extra-flag ...]\n' \
    "${0##*/}" >&2
  exit 1
fi

mkdir -p -- "${OUTPUT_DIR}"
# Re-ranking step: run src/inference/rerank_main.py with a fixed set of flags,
# followed by any arguments still present in "$@".
# The script path and PYTHONPATH are relative, so they are resolved against the
# caller's current directory.
rerank_out_path="${OUTPUT_DIR}/rerank.${SPLIT}.msmarco.txt"

rerank_flags=(
  --model_name_or_path "${MODEL_NAME_OR_PATH}"
  --do_rerank
  --task_type qa
  --fp16
  --rerank_in_path "${RERANK_IN_PATH}"
  --rerank_out_path "${rerank_out_path}"
  --rerank_batch_size 128
  --rerank_max_length 224
  --rerank_split "${SPLIT}"
  --rerank_depth 100
  --dataloader_num_workers 1
  --output_dir "/tmp/"
  --data_dir "${DATA_DIR}"
  --report_to none
)

PYTHONPATH=src/ python -u src/inference/rerank_main.py "${rerank_flags[@]}" "$@"
# Evaluation step: run misc/dpr/format_and_evaluate.py on the re-ranking output
# file for this split and write "${SPLIT}.dpr.json" into OUTPUT_DIR.
# The script path is relative to the caller's current directory.
eval_input="${OUTPUT_DIR}/rerank.${SPLIT}.msmarco.txt"

eval_flags=(
  --data-dir "${DATA_DIR}"
  --topk 1 5 20 100
  --topics "${DATA_DIR}/${SPLIT}_queries.tsv"
  --input "${eval_input}"
  --output "${OUTPUT_DIR}/${SPLIT}.dpr.json"
)

python -u misc/dpr/format_and_evaluate.py "${eval_flags[@]}"
|