# --- Environment setup ------------------------------------------------------
# Create an isolated virtualenv in ./venv and activate it BEFORE installing
# anything, so the packages below land inside the venv and every later
# `python3 -m ...` call resolves to that same interpreter.
python3 -m virtualenv venv
source venv/bin/activate

# Install Prodigy. `{.....}` is a redacted placeholder for the value passed to
# pip's -f (find-links) option; substitute the real value before running.
python3 -m pip install prodigy -f {.....}

# NOTE(review): presumably installed to provide the `ngrok` command used on the
# next line -- confirm that this package actually ships the CLI; otherwise the
# ngrok agent has to be installed separately.
python3 -m pip install ngrok

# Store the ngrok auth token in the local ngrok config
# (`{.....}` is a redacted placeholder for the token).
ngrok config add-authtoken {.....}

# --- Build the gold evaluation set ------------------------------------------
# Report document-level inter-annotator agreement for the annotations stored
# in dataset `project3eval`, restricted to the five labels listed after -l.
python3 -m prodigy metric.iaa.doc dataset:project3eval multiclass -l CapitalRequirements,ConsumerProtection,RiskManagement,ReportingAndCompliance,CorporateGovernance

# Start the review recipe on `project3eval`, saving decisions to
# `project3eval-review`. This launches the Prodigy web app and blocks until the
# server is stopped, so run it interactively.
# NOTE(review): "reviwer" looks like a misspelling of "reviewer". It is kept
# as-is because it is the session name annotators must use -- confirm before
# renaming.
PRODIGY_ALLOWED_SESSIONS=reviwer python3 -m prodigy review project3eval-review project3eval --auto-accept

# Export the reviewed dataset to a JSONL file.
python3 -m prodigy db-out project3eval-review > goldenEval.jsonl

# --- Import training and evaluation data ------------------------------------
# train200.jsonl is re-encoded from UTF-16 to UTF-8 first; the converted copy
# (train200a.jsonl) is the one imported, so the conversion has to run before
# db-in rather than after it.
iconv -f utf-16 -t utf-8 train200.jsonl > train200a.jsonl
python3 -m prodigy db-in prodigy3train train200a.jsonl

# Import the reviewed gold set as dataset `golden3`. The file name must match
# the `goldenEval.jsonl` written by the earlier db-out step exactly: on a
# case-sensitive filesystem `goldeneval.jsonl` would not be found.
python3 -m prodigy db-in golden3 goldenEval.jsonl

# --- Experiment 1: train on the 200-example set -----------------------------
# Train a multilabel text classifier on `prodigy3train`, evaluating against
# `golden3`; results are written to ./output/experiment1.
python3 -m prodigy train --textcat-multilabel prodigy3train,eval:golden3 ./output/experiment1

# Download the spaCy pipeline that is passed as --base-model below.
python3 -m spacy download en_core_web_lg

# Export the same train/eval datasets to ./corpus for use with spaCy directly.
python3 -m prodigy data-to-spacy --textcat-multilabel prodigy3train,eval:golden3 ./corpus --base-model en_core_web_lg

# Train with spaCy from the exported config and corpus files.
# NOTE(review): no --output is given, so presumably no trained pipeline is
# saved by this run -- confirm whether that is intended.
python3 -m spacy train corpus/config.cfg --paths.train corpus/train.spacy --paths.dev corpus/dev.spacy

# --- Project-local processing scripts ---------------------------------------
# Install via `python3 -m pip` so the package goes to the same interpreter that
# runs the scripts below.
python3 -m pip install jsonlines

# Run the four project scripts in order. Their contents are not part of this
# file; judging by the names they format, score, label and re-format the data.
# NOTE(review): presumably this sequence produces project3_trainComplete.jsonl,
# which is imported in the following step -- confirm.
python3 firstStep-format.py
python3 secondStep-score.py
python3 thirdStep-label.py
python3 finalStep-formatLabel.py

# --- Experiment 3: train on the complete training set -----------------------
# Import the complete training file as dataset `prodigy3trainComplete`.
python3 -m prodigy db-in prodigy3trainComplete project3_trainComplete.jsonl

# Train a multilabel text classifier on the complete set, evaluating against
# `golden3`; results are written to ./output/experiment3.
python3 -m prodigy train --textcat-multilabel prodigy3trainComplete,eval:golden3 ./output/experiment3

# Export to ./corpus again. This targets the same directory as the earlier
# export, so the previously generated corpus files are replaced.
python3 -m prodigy data-to-spacy --textcat-multilabel prodigy3trainComplete,eval:golden3 ./corpus --base-model en_core_web_lg

# Train with spaCy from the regenerated config and corpus files.
# NOTE(review): no --output is given, so presumably no trained pipeline is
# saved by this run -- confirm whether that is intended.
python3 -m spacy train corpus/config.cfg --paths.train corpus/train.spacy --paths.dev corpus/dev.spacy