#!/usr/bin/env python # -*- coding: utf-8 -*- import ConfigParser import json import os import re from re import sub import sys import time import requests from pdfminer.converter import PDFPageAggregator from pdfminer.layout import LTTextBoxHorizont