I am unable to extract table data from a PDF into a table in Python; my attempt fails with the errors shown below.
This is my code:
from tabula import read_pdf

# Remote PDF whose tables should be extracted.
url = "https://www.dsf.unica.it/~fiore/BasicPlanetaryData.pdf"

# Only the extraction and printing are guarded. The import above runs
# outside the try block, so an error raised while importing tabula is
# not caught by this handler.
try:
    df = read_pdf(url)
    print(df)
except Exception as e:
    print(f"Error{e}")
The error is:
Traceback (most recent call last):
File "C:\Users\Mukesh Nayal\pycharm project\Python\pdftotext.py", line 1, in <module>
from tabula import read_pdf
File "C:\Users\Mukesh Nayal\AppData\Local\Programs\Python\Python39\lib\site-packages\tabula\__init__.py", line 1, in <module>
from pkg_resources import DistributionNotFound, get_distribution
File "C:\Users\Mukesh Nayal\AppData\Local\Programs\Python\Python39\lib\site-packages\pkg_resources\__init__.py", line 33, in <module>
import email.parser
File "C:\Users\Mukesh Nayal\AppData\Local\Programs\Python\Python39\lib\email\parser.py", line 12, in <module>
from email.feedparser import FeedParser, BytesFeedParser
File "C:\Users\Mukesh Nayal\AppData\Local\Programs\Python\Python39\lib\email\feedparser.py", line 27, in <module>
from email._policybase import compat32
File "C:\Users\Mukesh Nayal\AppData\Local\Programs\Python\Python39\lib\email\_policybase.py", line 7, in <module>
from email import header
File "C:\Users\Mukesh Nayal\AppData\Local\Programs\Python\Python39\lib\email\header.py", line 16, in <module>
import email.quoprimime
File "C:\Users\Mukesh Nayal\AppData\Local\Programs\Python\Python39\lib\email\quoprimime.py", line 44, in <module>
from string import ascii_letters, digits, hexdigits
ImportError: cannot import name 'ascii_letters' from 'string' (C:\Users\Mukesh Nayal\pycharm project\Python\string.py)