Compare commits

...

2 Commits

Author SHA1 Message Date
Simon Moisy
885f51b83d cleanup 2025-03-22 04:47:52 +08:00
Simon Moisy
4f665db568 .gitignore 2025-03-22 04:46:59 +08:00
2 changed files with 11 additions and 4 deletions

4
.gitignore vendored
View File

@@ -3,8 +3,8 @@
.idea/*
data/
-.zip
-.db
+*.zip
+*.db
plots/
results/

View File

@@ -74,5 +74,12 @@ class ArticleAnalyzer:
     def classify_article_finbert(self, article_html):
         article_md = self.convert_to_markdown(article_html)
-        result = self.classifier(article_md)
-        return result
+        chunk_size = 512
+        chunks = [article_md[i:i + chunk_size] for i in range(0, len(article_md), chunk_size)]
+        results = []
+        for chunk in chunks:
+            result = self.classifier(chunk)
+            results.append(result)
+        return results