mirror of
https://github.com/opencloud-eu/opencloud.git
synced 2026-01-03 03:28:03 -05:00
33 lines
805 B
Go
33 lines
805 B
Go
package content
|
|
|
|
import (
|
|
"strings"
|
|
|
|
"github.com/bbalet/stopwords"
|
|
libregraph "github.com/opencloud-eu/libre-graph-api-go"
|
|
)
|
|
|
|
func init() {
|
|
stopwords.OverwriteWordSegmenter(`[^ ]+`)
|
|
}
|
|
|
|
// Document wraps all resource meta fields,
|
|
// it is used as a content extraction result.
|
|
type Document struct {
|
|
Title string
|
|
Name string
|
|
Content string
|
|
Size uint64
|
|
Mtime string
|
|
MimeType string
|
|
Tags []string
|
|
Audio *libregraph.Audio `json:"audio,omitempty"`
|
|
Image *libregraph.Image `json:"image,omitempty"`
|
|
Location *libregraph.GeoCoordinates `json:"location,omitempty"`
|
|
Photo *libregraph.Photo `json:"photo,omitempty"`
|
|
}
|
|
|
|
func CleanString(content, langCode string) string {
|
|
return strings.TrimSpace(stopwords.CleanString(content, langCode, true))
|
|
}
|