add summarization for documents

This commit is contained in:
2025-01-20 20:34:23 +01:00
parent 0594fb8aeb
commit 637a5ebb0c
6 changed files with 270 additions and 9 deletions

View File

@@ -6,6 +6,7 @@ import (
"crowsnest/internal/middleware"
"crowsnest/internal/model"
"crowsnest/internal/model/database"
"crowsnest/internal/util"
"log"
"net/http"
@@ -18,6 +19,21 @@ func main() {
log.Fatal("failed to connect to database due to", err.Error())
}
// Fill in missing document summaries. The Map call is launched in its own
// goroutine, so it does not hold up the rest of main.
// NOTE(review): presumably Map visits every stored document and persists the
// value the callback returns — confirm against DocumentRepository.Map.
documents := &database.DocumentRepository{DB: db}
go documents.Map(func(doc *model.Document) *model.Document {
	// Documents that already carry a summary are passed through untouched.
	if doc.Summary != "" {
		return doc
	}

	summary, err := util.Summarize(doc.Content)
	if err != nil {
		// Best effort: log the failure and hand the document back unchanged.
		log.Println(err.Error())
		return doc
	}

	doc.Summary = summary
	return doc
})
// run web crawlers
articles := &database.ArticleRepository{DB: db}
crawler := crawler.CrawlerFacade{}