@@ -1,4 +1,5 @@
demeter-lib
+tornado==6.2
redis
requests
gevent
@@ -43,7 +43,8 @@ class Pdf(Base):
for i, b in enumerate(blocks):
y_top = b["bbox"][1]
y_bottom = b["bbox"][3]
- if y_top < page_height * 0.05 or y_bottom > page_height * 0.95:
+ block_height = y_bottom - y_top
+ if (y_top < page_height * 0.02 or y_bottom > page_height * 0.98) and block_height < 20:
continue
if b['type'] == 0: