# Program to measure the similarity between
# two sentences using cosine similarity.
#
# This section only prepares the inputs: it fetches the NLTK 'punkt'
# resource, extracts the tables of a PDF with tabula, exports them to CSV,
# and loads an Excel sheet into a pandas DataFrame.
import nltk
import numpy as np
import pandas as pd
import tabula
from nltk.corpus import stopwords
from nltk.tokenize import word_tokenize
from scipy import spatial
#import module_wrapper

# File locations used below. The relative paths are resolved against the
# current working directory.
PDF_PATH = 'datacrypt.pdf'
CSV_PATH = 'data.csv'
EXCEL_PATH = 'C:/Users/User/Desktop/datacrypt.xls'

# Fetch the 'punkt' resource through the NLTK downloader (presumably needed
# by word_tokenize later in the program).
nltk.download('punkt')

# Read the tables from every page of the PDF; the result is kept in
# `tables` for later use.
tables = tabula.io.read_pdf(PDF_PATH, pages="all")

# Export the tables from every page of the same PDF to a CSV file on disk.
tabula.convert_into(PDF_PATH, CSV_PATH, output_format="csv", pages='all')

# NOTE(review): this loads a separate .xls file from an absolute path rather
# than the CSV_PATH file generated just above - confirm that is intended.
df = pd.read_excel(EXCEL_PATH)