todo
This commit is contained in:
@@ -36,6 +36,7 @@ class Chars:
|
|||||||
result[-1].merge_in(char)
|
result[-1].merge_in(char)
|
||||||
else:
|
else:
|
||||||
result.append(Chars([char], self.page))
|
result.append(Chars([char], self.page))
|
||||||
|
# TODO remove headers, footers; maybe median font size vs. max of cluster?
|
||||||
result = [i for i in result if i.n > 2]
|
result = [i for i in result if i.n > 2]
|
||||||
|
|
||||||
# merge all vertically overlapping boxes
|
# merge all vertically overlapping boxes
|
||||||
|
|||||||
Reference in New Issue
Block a user