# Set up the Python environment used by the parsing scripts below.
# `python=3.12` (single `=`) lets conda resolve the 3.12 series; the previous
# `python==3.12` is an exact-version match spec.
conda create -n parser python=3.12
# Activate the environment created above; the name must match the `-n` value.
conda activate parser
# PDF extraction (pdfplumber, PyMuPDF) and progress-bar (tqdm) dependencies.
pip install pdfplumber PyMuPDF tqdm
-
python exam_parser
- input: Data/NPExam/*/*.pdf
- output: Data/exams/*.json
-
python ans_parser
- input: Data/NPExam/*/*.pdf
- output: Data/ans/*.json
-
python qset_merger.py
- input:
  - Data/ans/*.json
  - Data/exams/*.json
- output:
  - Data/NPQSet/*/*.json
- input:
  - figure question
  - department set