This is a repo for our hallucination detection and editing work in the finance domain. This repo includes information on synthetic data generation for training and evaluating our fine-tuned model on FinQA+TATQA.
## Data Preparation
cd data_preparation
python insert_errors.py \
--input_file {input_file_path} \
--output_file {output_file_path} \
--api_key {your_openai_key}

cd data_preparation
python verify_responses.py \
--input_file {input_file_path} \
--output_file {output_file_path}

cd data_preparation
python convert_format.py \
--input_file {input_file_path} \
--output_file {output_file_path}

## Inference
cd evalution
python phi_4_inference.py \
--input_file {input_file_path} \
--output_file {output_file_path}

cd evalution
python postprocess.py \
--input_file {input_file_path} \
--output_file {output_file_path}

cd evalution
python eval_detection.py \
--input_file {input_file_path} \
--output_file {output_file_path}

cd evalution
python eval_factscore.py \
--input_file {input_file_path} \