mirror of
https://github.com/jzillmann/pdf-to-markdown.git
synced 2024-11-21 15:23:26 +01:00
Prevent headline detection from assigning headline levels greater than 6
This commit is contained in:
parent
908f0b4be1
commit
ecde2ea0f5
@ -67,16 +67,19 @@ export default class DetectHeaders extends ToLineItemTransformation {
|
||||
heights.sort((a, b) => b - a);
|
||||
|
||||
heights.forEach((height, i) => {
|
||||
const headlineType = headlineByLevel(2 + i);
|
||||
parseResult.pages.forEach(page => {
|
||||
page.items.forEach(item => {
|
||||
if (!item.type && item.height == height && !isListItem(item.text())) {
|
||||
detectedHeaders++;
|
||||
item.annotation = DETECTED_ANNOTATION;
|
||||
item.type = headlineType;
|
||||
}
|
||||
const headlineLevel = i + 2;
|
||||
if (headlineLevel <= 6) {
|
||||
const headlineType = headlineByLevel(2 + i);
|
||||
parseResult.pages.forEach(page => {
|
||||
page.items.forEach(item => {
|
||||
if (!item.type && item.height == height && !isListItem(item.text())) {
|
||||
detectedHeaders++;
|
||||
item.annotation = DETECTED_ANNOTATION;
|
||||
item.type = headlineType;
|
||||
}
|
||||
});
|
||||
});
|
||||
});
|
||||
}
|
||||
});
|
||||
}
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user