1# 1. Download and install Java
2# 2. Install the Python library 'tabula-py' using pip
3pip install tabula-py
4# If this is the first time you are installing Java and tabula-py,
5# add your Java installation folder to the PATH variable.
6# If you don't, you will get the following error message:
7tabula.errors.JavaNotFoundError: `java` command is not found from this
8Python process.Please ensure Java is installed and PATH is set for `java`
9# 3. Import tabula and run its read_pdf function on the desired page of the PDF file.
10import tabula
11df = tabula.read_pdf('data.pdf', pages = 3, lattice = True)[1]