Merge branch 'hotfix-reading-order' into 'main'

hotfix: threshold adjustments

See merge request fforesight/layout-parser!192
This commit is contained in:
Dominique Eifländer 2024-08-12 14:59:20 +02:00
commit 173911b840

View File

@ -27,11 +27,12 @@ public class TextPositionOperations {
public static final double MAX_LINE_HEIGHT_FACTOR = 0.66; // multiplied with max word height
public static final double MAX_WORD_DISTANCE_FACTOR = 3.5; // multiplied with max word width
private static final double THRESHOLD = 5;
private static final double Y_THRESHOLD = 6;
private static final double X_THRESHOLD = 3;
private static final Comparator<TextBoundingBox> COMPARATOR_DIR_ADJ = //
Comparator.comparing(TextBoundingBox::getDir)
.thenComparing(TextBoundingBox::getCenterYDirAdj, (o1, o2) -> DoubleUtils.compareDouble(o1, o2, THRESHOLD))
.thenComparing(TextBoundingBox::getCenterXDirAdj, (o1, o2) -> DoubleUtils.compareDouble(o1, o2, THRESHOLD));
.thenComparing(TextBoundingBox::getMaxYDirAdj, (o1, o2) -> DoubleUtils.compareDouble(o1, o2, Y_THRESHOLD))
.thenComparing(TextBoundingBox::getXDirAdj, (o1, o2) -> DoubleUtils.compareDouble(o1, o2, X_THRESHOLD));
public List<TextPositionSequence> mergeAndSort(List<TextPageBlock> textBlocks) {