conda create -n parser python=3.12
conda activate parser
pip install pdfplumber
pip install PyMuPDF
pip install tqdm
-
python exam_parser.py
- input: `Data/NPExam/*/*.pdf`
- output: Data/exams/*.json
-
python ans_parser.py
- input: `Data/NPExam/*/*.pdf`
- output: Data/ans/*.json
-
python qset_merger.py
- input:
- Data/ans/*.json
- Data/exams/*.json
- output:
- `Data/NPQSet/*/*.json`
- input:
- figure question
- department set