# Source code for transfer_nlp.loaders.vectorizers

import string
from collections import Counter
from typing import Dict, Tuple, List, Any

import numpy as np
import pandas as pd

from transfer_nlp.common.tokenizers import CustomTokenizer
from transfer_nlp.loaders.vocabulary import Vocabulary, SequenceVocabulary
from transfer_nlp.plugins.config import register_plugin


class Vectorizer:
    """Base class for vectorizers built around a data file.

    The constructor only records the path of the data file. The base
    ``vectorize`` always raises ``NotImplementedError``, so concrete
    vectorizers presumably override it.
    """

    def __init__(self, data_file: str) -> None:
        """Store the path of the data file.

        Args:
            data_file: Path to the data file associated with this vectorizer.
        """
        # Only the path is kept; the file itself is not read here.
        self.data_file = data_file

    def vectorize(self, input_string: str):
        """Vectorize ``input_string``.

        Args:
            input_string: The text to vectorize.

        Raises:
            NotImplementedError: Always, in this base class.
        """
        raise NotImplementedError