| |
|
|
| |
| TESSERACT_FOLDER=tesseract/ |
| POPPLER_FOLDER=poppler/poppler-24.02.0/Library/bin/ |
|
|
| GRADIO_SERVER_NAME=127.0.0.1 |
| GRADIO_SERVER_PORT=7860 |
|
|
| USER_GUIDE_URL=<ENTER_URL> |
| CUSTOM_BOX_COLOUR=(128, 128, 128) |
| RUN_FASTAPI=False |
| FAVICON_PATH=favicon.png |
| INTRO_TEXT=intros/short_intro.txt |
|
|
| |
| SHOW_QUICKSTART=False |
| SHOW_SUMMARISATION=True |
| SHOW_EXAMPLES=True |
| SHOW_DIFFICULT_OCR_EXAMPLES=True |
| SHOW_LANGUAGE_SELECTION=True |
| SHOW_WHOLE_DOCUMENT_TEXTRACT_CALL_OPTIONS=False |
| SHOW_COSTS=True |
| SHOW_LOCAL_OCR_MODEL_OPTIONS=True |
| SHOW_ALL_OUTPUTS_IN_OUTPUT_FOLDER=True |
| SHOW_PII_IDENTIFICATION_OPTIONS=True |
| SHOW_LOCAL_PII_DETECTION_OPTIONS=True |
| SHOW_OCR_GUI_OPTIONS=True |
| EXTRACTION_AND_PII_OPTIONS_OPEN_BY_DEFAULT=True |
|
|
| |
| DEFAULT_LOCAL_OCR_MODEL=tesseract |
| OVERWRITE_EXISTING_OCR_RESULTS=False |
| PREPROCESS_LOCAL_OCR_IMAGES=False |
| MAX_WORKERS=4 |
|
|
| EFFICIENT_OCR=True |
| OVERWRITE_EXISTING_OCR_RESULTS=True |
| INCLUDE_OCR_VISUALISATION_IN_OUTPUT_FILES=True |
|
|
| |
| CUSTOM_BOX_COLOUR=(128, 128, 128) |
| USE_GUI_BOX_COLOURS_FOR_OUTPUTS=False |
|
|
| |
| SAVE_PAGE_OCR_VISUALISATIONS=True |
| SAVE_PREPROCESS_IMAGES=True |
|
|
| |
| SAVE_LOGS_TO_CSV=True |
| SESSION_OUTPUT_FOLDER=True |
| DISPLAY_FILE_NAMES_IN_LOGS=False |
|
|
| |
| SHOW_PADDLE_MODEL_OPTIONS=False |
| LOAD_PADDLE_AT_STARTUP=False |
| PADDLE_MAX_WORKERS=4 |
|
|
| |
| SHOW_HYBRID_MODELS=False |
| SHOW_CUSTOM_VLM_ENTITIES=False |
| SHOW_VLM_MODEL_OPTIONS=True |
| SHOW_INFERENCE_SERVER_PII_OPTIONS=False |
| SHOW_INFERENCE_SERVER_VLM_OPTIONS=False |
| SHOW_TRANSFORMERS_LLM_PII_DETECTION_OPTIONS=False |
|
|
| |
| SELECTED_LOCAL_TRANSFORMERS_VLM_MODEL=Qwen3.5-9B |
| QUANTISE_VLM_MODELS=False |
| USE_TRANSFORMERS_VLM_MODEL_AS_LLM=True |
| LOCAL_TRANSFORMERS_LLM_PII_MODEL_CHOICE=None |
| QUANTISE_TRANSFORMERS_LLM_MODELS=False |
| LOAD_TRANSFORMERS_LLM_PII_MODEL_AT_START=False |
| LOAD_TRANSFORMERS_VLM_MODEL_AT_START=True |
|
|
| |
| INFERENCE_SERVER_API_URL=http://192.168.0.220:8080 |
| USE_LLAMA_SWAP=True |
| INFERENCE_SERVER_LLM_PII_MODEL_CHOICE=qwen_3_5_27b |
|
|
| |
| VLM_DISABLE_QWEN3_5_THINKING=True |
| LLM_MAX_NEW_TOKENS=8192 |
| CUSTOM_VLM_BACKEND=bedrock_vlm |
|
|
| |
| RUN_AWS_FUNCTIONS=True |
| AWS_REGION=example-region |
| DOCUMENT_REDACTION_BUCKET=example-bucket |
|
|
| SHOW_AWS_TEXT_EXTRACTION_OPTIONS=True |
| SHOW_AWS_PII_DETECTION_OPTIONS=True |
|
|
| SHOW_AWS_EXAMPLES=True |
| RUN_ALL_EXAMPLES_THROUGH_AWS=True |
|
|
| SAVE_LOGS_TO_DYNAMODB=True |
| ACCESS_LOG_DYNAMODB_TABLE_NAME=example-dynamodb-access-log |
| USAGE_LOG_DYNAMODB_TABLE_NAME=example-dynamodb-usage |
| FEEDBACK_LOG_DYNAMODB_TABLE_NAME=example-dynamodb-feedback |
|
|
| |
| SHOW_WHOLE_DOCUMENT_TEXTRACT_CALL_OPTIONS=True |
| LOAD_PREVIOUS_TEXTRACT_JOBS_S3=True |
| TEXTRACT_WHOLE_DOCUMENT_ANALYSIS_BUCKET=example-bucket-output |
| INCLUDE_FORM_EXTRACTION_TEXTRACT_OPTION=False |
| INCLUDE_LAYOUT_EXTRACTION_TEXTRACT_OPTION=False |
| INCLUDE_TABLE_EXTRACTION_TEXTRACT_OPTION=False |
| INCLUDE_FACE_IDENTIFICATION_TEXTRACT_OPTION=False |
|
|
| |
| SHOW_BEDROCK_VLM_MODELS=False |
| SHOW_AWS_BEDROCK_LLM_MODELS=False |
| HYBRID_TEXTRACT_BEDROCK_VLM=False |
|
|
| CLOUD_LLM_PII_MODEL_CHOICE=amazon.nova-pro-v1:0 |
| CLOUD_LLM_PII_CUSTOM_INSTRUCTIONS_MODEL_CHOICE=anthropic.claude-sonnet-4-6 |
| CLOUD_VLM_MODEL_CHOICE=amazon.nova-pro-v1:0 |
| CLOUD_SUMMARISATION_MODEL_CHOICE=amazon.nova-lite-v1:0 |
|
|
| |
| SHOW_COSTS=True |
| GET_COST_CODES=True |
| COST_CODES_PATH=config/cost_codes.csv |
| ENFORCE_COST_CODES=True |
| DEFAULT_COST_CODE=example_cost_code |
|
|
| |
| S3_COST_CODES_PATH=cost_codes.csv |