# [web-page residue, not part of the script] You are on page 1 of 1

# Load the full text of the two input documents into `data` and `data2`.
# Each file is read inside its own context manager so the handle is closed
# as soon as its contents have been read.
with open('cotidian1.txt', 'r') as myfile:
    data = myfile.read()

with open('cotidian2.txt', 'r') as myfile:
    data2 = myfile.read()

import numpy as np
from sklearn.feature_extraction.text import TfidfVectorizer
import pandas as pd

# Create text: a small in-memory corpus, one document per array element.
text_data = np.array([
    'I love Brazil. Brazil!',
    'Sweden is best',
    'Germany beats both',
])

# Create the tf-idf feature matrix by fitting the vectorizer on the corpus.
tfidf = TfidfVectorizer()
feature_matrix = tfidf.fit_transform(text_data)

# The original script opened "rezultat.txt" for writing but never wrote to it
# or closed it. Keep the create/truncate side effect, but release the handle
# immediately instead of leaking it.
with open("rezultat.txt", "w") as file:
    pass

# scikit-learn 1.0 introduced get_feature_names_out() and 1.2 removed
# get_feature_names(); use whichever one this installation provides.
if hasattr(tfidf, "get_feature_names_out"):
    feature_names = tfidf.get_feature_names_out()
else:
    feature_names = tfidf.get_feature_names()

# Export the dense matrix as a tab-separated table whose column headers are
# the vocabulary terms learned by the vectorizer.
pd.DataFrame(feature_matrix.toarray(), columns=feature_names).to_csv(
    "lalka.csv", sep="\t"
)

# [web-page residue, not part of the script] You may also like