refactor: Update image description minimum word threshold in get_content_of_website_optimized

This commit is contained in:
unclecode
2024-08-02 14:53:11 +08:00
parent 8ae6c43ca4
commit 9ee988753d
2 changed files with 4 additions and 1 deletions

View File

@@ -27,6 +27,7 @@ WORD_TOKEN_RATE = 1.3
# Threshold for the minimum number of words in an HTML tag to be considered
MIN_WORD_THRESHOLD = 1
IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD = 1
# Threshold for the Image extraction - Range is 1 to 6
# Images are scored using a point-based system so they can be filtered by usefulness. Points are assigned