From 6a441799fd8ab7dd968b36001dcdbc73f02969c2 Mon Sep 17 00:00:00 2001
From: David Andrews
Date: Wed, 2 Apr 2025 10:58:13 -0400
Subject: [PATCH] Fix quickstart.md when running process_hotpotqa.py script

Since process_hotpotqa.py uses relative paths like "../../data/corpus",
we need to change directory before running it.
---
 docs/getting_started/quickstart.md | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/docs/getting_started/quickstart.md b/docs/getting_started/quickstart.md
index 9d1d772..b8a45ad 100644
--- a/docs/getting_started/quickstart.md
+++ b/docs/getting_started/quickstart.md
@@ -29,7 +29,8 @@ wget https://huggingface.co/datasets/BeIR/hotpotqa/resolve/main/corpus.jsonl.gz
 gunzip -c data/corpus/hotpotqa/corpus.jsonl.gz > data/corpus/hotpotqa/hpqa_corpus.jsonl
 
 # Process the corpus and build the search index
-python scripts/hotpotqa_search/process_hotpotqa.py
+cd scripts/hotpotqa_search
+python process_hotpotqa.py
 ```
 
 This script will:
@@ -46,4 +47,4 @@ bash run_ppo.sh
 bash run_rpp.sh
 # Run the GRPO training script
 bash run_grpo.sh
-```
\ No newline at end of file
+```