hm_qc/profiles/HM.json
2025-09-30 10:37:12 -05:00

57 lines
2.2 KiB
JSON
Executable file

[
{
"id": "HM_parse",
"script": "checks.HM_parse",
"config": {
"description": "Parses document with Llamaparse, returning both text extraction and image of document",
"input_file": "supplied by launcher script",
"working_dir": "/tmp/HM_working"
}
},
{
"id": "HM_filename_parse",
"script": "checks.HM_filename_parse",
"config": {
"description": "Parses filename into constituent pieces",
"working_dir": "/tmp/HM_working",
"filename_path": "filename.txt"
}
},
{
"id": "HM_imprint_check",
"script": "checks.HM_imprint_check",
"config": {
"description": "Checks imprint on document against relevant portion of filename",
"working_dir": "/tmp/HM_working",
"test_image_path": "HM_working/parsed_test_image.jpg"
}
},
{
"id": "HM_language_validate",
"script": "checks.HM_language_validate",
"config": {
"description": "Validates language of document content against language code in file name",
"working_dir": "/tmp/HM_working",
"test_image_path": "HM_working/parsed_test_image.jpg"
}
},
{
"id": "HM_price_currency_check",
"script": "checks.HM_price_currency_check",
"config": {
"description": "Validates currency of pricing in document against language detected in previous check",
"working_dir": "/tmp/HM_working",
"test_image_path": "HM_working/parsed_test_image.jpg"
}
},
{
"id": "HM_censorship",
"script": "checks.HM_censorship",
"config": {
"description": "Checks CEN and GEN assets (primarily GEN) to determine whether the image(s) are actually censored for conservative markets. Examines images for full coverage of clothing on all body parts (except face and hands) and fail if too much skin is exposed.",
"images_dir": "/opt/QC/supporting/censorship_trainset",
"working_dir": "/tmp/HM_working",
"test_image_path": "HM_working/parsed_test_image.jpg"
}
}
]