OxbridgeEconomics
committed on
Update vectorizer.py
Browse files
controllers/vectorizer.py
CHANGED
@@ -41,6 +41,8 @@ def vectorize(article):
|
|
41 |
df = df[['id','site','title','titleCN','category','author','content',
|
42 |
'publishDate','link','attachment','sentimentScore','sentimentLabel']]
|
43 |
df['sentimentScore'] = df['sentimentScore'].round(2)
|
|
|
|
|
44 |
loader = DataFrameLoader(df, page_content_column="content")
|
45 |
documents = loader.load()
|
46 |
text_splitter = RecursiveCharacterTextSplitter(
|
|
|
41 |
df = df[['id','site','title','titleCN','category','author','content',
|
42 |
'publishDate','link','attachment','sentimentScore','sentimentLabel']]
|
43 |
df['sentimentScore'] = df['sentimentScore'].round(2)
|
44 |
+
df['sentimentScore'] = df['sentimentScore'].astype(float)
|
45 |
+
df['publishDate'] = pd.to_datetime(df['publishDate'])
|
46 |
loader = DataFrameLoader(df, page_content_column="content")
|
47 |
documents = loader.load()
|
48 |
text_splitter = RecursiveCharacterTextSplitter(
|