46 lines
972 B
Go
46 lines
972 B
Go
package pkg
|
|
|
|
import (
|
|
"strings"
|
|
|
|
md "github.com/JohannesKaufmann/html-to-markdown"
|
|
strip "github.com/grokify/html-strip-tags-go"
|
|
)
|
|
|
|
func ExtractWordContent(filePath string, format string) (string, error) {
|
|
// 简化版:读取文件内容并转换格式
|
|
// 完整实现需要使用专门的docx库
|
|
|
|
content := "从Word文档提取的内容"
|
|
|
|
switch format {
|
|
case "html":
|
|
return "<p>" + content + "</p>", nil
|
|
case "markdown":
|
|
converter := md.NewConverter("", true, nil)
|
|
return converter.ConvertString("<p>" + content + "</p>")
|
|
default:
|
|
return strip.StripTags(content), nil
|
|
}
|
|
}
|
|
|
|
// ParseTags splits a comma-separated tag string into its individual tags.
//
// Each piece has surrounding whitespace trimmed, and pieces that are empty
// after trimming are dropped. The result is always a non-nil slice; an empty
// or all-blank input yields an empty slice.
func ParseTags(tagStr string) []string {
	parsed := []string{}
	// Splitting "" yields a single empty piece, which the filter below
	// discards, so the empty input needs no separate guard.
	for _, piece := range strings.Split(tagStr, ",") {
		tag := strings.TrimSpace(piece)
		if tag == "" {
			continue
		}
		parsed = append(parsed, tag)
	}
	return parsed
}
|
|
|
|
// IsTimeExceeded is a placeholder for a time comparison against targetTime.
//
// The comparison is not implemented yet: targetTime is ignored and the
// function always reports false.
func IsTimeExceeded(targetTime string) bool {
	// TODO: implement the time comparison.
	_ = targetTime
	const exceeded = false
	return exceeded
}
|