OxbridgeEconomics committed on
Commit
741bcee
·
unverified ·
1 Parent(s): 1177da7

Update vectorizer.py

Browse files
Files changed (1) hide show
  1. controllers/vectorizer.py +2 -0
controllers/vectorizer.py CHANGED
@@ -41,6 +41,8 @@ def vectorize(article):
41
  df = df[['id','site','title','titleCN','category','author','content',
42
  'publishDate','link','attachment','sentimentScore','sentimentLabel']]
43
  df['sentimentScore'] = df['sentimentScore'].round(2)
 
 
44
  loader = DataFrameLoader(df, page_content_column="content")
45
  documents = loader.load()
46
  text_splitter = RecursiveCharacterTextSplitter(
 
41
  df = df[['id','site','title','titleCN','category','author','content',
42
  'publishDate','link','attachment','sentimentScore','sentimentLabel']]
43
  df['sentimentScore'] = df['sentimentScore'].round(2)
44
+ df['sentimentScore'] = df['sentimentScore'].astype(float)
45
+ df['publishDate'] = pd.to_datetime(df['publishDate'])
46
  loader = DataFrameLoader(df, page_content_column="content")
47
  documents = loader.load()
48
  text_splitter = RecursiveCharacterTextSplitter(