srivarshan committed on
Commit
45674cb
·
1 Parent(s): c2f034e

Add vectorizer

Browse files
Files changed (3) hide show
  1. app.py +2 -1
  2. preprocess.py +8 -0
  3. vectorizers/count_vectorizer.pkl +0 -0
app.py CHANGED
@@ -1,6 +1,6 @@
1
  import gradio as gr
2
  from model import CustomModel
3
- from preprocess import preprocess_pipeline
4
  import os
5
 
6
  os.system("cp -r ./nltk_data/ /home/user/nltk_data")
@@ -8,6 +8,7 @@ os.system("cp -r ./nltk_data/ /home/user/nltk_data")
8
  def analyze(text):
9
  model = CustomModel()
10
  text = preprocess_pipeline(text)
 
11
  return text
12
 
13
  app = gr.Interface(fn=analyze, inputs="text", outputs="text")
 
1
  import gradio as gr
2
  from model import CustomModel
3
+ from preprocess import preprocess_pipeline, vectorizer
4
  import os
5
 
6
  os.system("cp -r ./nltk_data/ /home/user/nltk_data")
 
8
  def analyze(text):
9
  model = CustomModel()
10
  text = preprocess_pipeline(text)
11
+ text = vectorizer(text)
12
  return text
13
 
14
  app = gr.Interface(fn=analyze, inputs="text", outputs="text")
preprocess.py CHANGED
@@ -1,4 +1,7 @@
1
  import re
 
 
 
2
  from nltk.corpus import stopwords
3
  from nltk.stem import SnowballStemmer
4
 
@@ -20,3 +23,8 @@ def clean_text(text):
20
 
21
  def preprocess_pipeline(text):
22
  return clean_text(text)
 
 
 
 
 
 
1
  import re
2
+ from nltk.corpus.reader import pickle
3
+ import pandas as pd
4
+ import numpy as np
5
  from nltk.corpus import stopwords
6
  from nltk.stem import SnowballStemmer
7
 
 
23
 
24
  def preprocess_pipeline(text):
25
  return clean_text(text)
26
+
27
def vectorizer(text):
    """Transform preprocessed text with the pickled count vectorizer.

    Args:
        text: A single document as a ``str``, or an iterable of document
            strings.

    Returns:
        The result of the unpickled object's ``transform`` call on the
        documents (presumably a sparse document-term matrix with one row
        per document -- confirm against the pickled estimator).

    Raises:
        FileNotFoundError: If ``vectorizers/count_vectorizer.pkl`` does not
            exist relative to the current working directory.
    """
    # Use the standard-library module directly instead of relying on the
    # name that happens to be re-exported by ``nltk.corpus.reader``.
    import pickle

    # A bare string is wrapped into a one-document list. The pickled object
    # is presumably a scikit-learn CountVectorizer, whose ``transform``
    # expects an iterable of documents and rejects a plain ``str``.
    documents = [text] if isinstance(text, str) else text

    # NOTE(security): unpickling can execute arbitrary code. This is only
    # acceptable because the file is shipped with the repository; never
    # point it at user-supplied data.
    with open("vectorizers/count_vectorizer.pkl", "rb") as handle:
        count_vectorizer = pickle.load(handle)

    return count_vectorizer.transform(documents)
30
+
vectorizers/count_vectorizer.pkl ADDED
Binary file (23.1 kB). View file