Documentation
Data Preprocessing
Text
Vectorize

Module: vectorize.py

Functions

from sklearn.feature_extraction.text import TfidfVectorizer, CountVectorizer
 
def vectorize_text_tfidf(texts):
    """
    Vectorize text data using TF-IDF method.

    A new ``TfidfVectorizer`` with default settings is fitted on ``texts``
    and then used to transform those same documents. The fitted vectorizer
    is local to this call and is not returned, so the learned vocabulary is
    not available to the caller afterwards.

    Parameters:
        texts (list): List of text documents, one string per document.

    Returns:
        scipy.sparse.csr_matrix: TF-IDF feature matrix with one row per
            document and one column per vocabulary term.

    Raises:
        ValueError: Propagated from scikit-learn, e.g. when ``texts`` is a
            single string rather than a collection of documents, or when
            no vocabulary can be built (empty input, only stop words).
    """
    # fit_transform learns the vocabulary/IDF weights and produces the
    # document-term matrix in a single pass over the documents.
    return TfidfVectorizer().fit_transform(texts)
 
 
def vectorize_text_count(texts):
    """
    Vectorize text data using Count Vectorizer method.

    A new ``CountVectorizer`` with default settings is fitted on ``texts``
    and then used to transform those same documents. The fitted vectorizer
    is local to this call and is not returned, so the learned vocabulary is
    not available to the caller afterwards.

    Parameters:
        texts (list): List of text documents, one string per document.

    Returns:
        scipy.sparse.csr_matrix: Count Vector feature matrix with one row
            per document and one column per vocabulary term; each entry is
            the number of occurrences of that term in that document.

    Raises:
        ValueError: Propagated from scikit-learn, e.g. when ``texts`` is a
            single string rather than a collection of documents, or when
            no vocabulary can be built (empty input, only stop words).
    """
    # fit_transform learns the vocabulary and produces the document-term
    # count matrix in a single pass over the documents.
    return CountVectorizer().fit_transform(texts)