import PyPDF2 import pandas import numpy import re import os,sys import nltk from io import StringIO from nltk import word_tokenize,sent_tokenize from nltk.tokenize imp