feat: add content filter and code processing module (v0.3.0)

- Add content filter module (internal/content/)
- Implement basic character filtering (control chars, line breaks, symbols)
- Implement code block and inline code detection
- Implement comment detection for 30+ languages (JS/Python/Go/HTML/etc)
- Add go-enry dependency for intelligent language detection
- Add SkipKeywords config option (default: TODO/FIXME/HACK/XXX/etc)
- Integrate content processing into Translator
- Update config.yaml with skip_keywords
This commit is contained in:
2026-03-29 18:41:25 +08:00
parent 1bce2d9c7a
commit 6807371c5e
8 changed files with 625 additions and 8 deletions

View File

@@ -0,0 +1,17 @@
package content
import (
"github.com/go-enry/go-enry/v2"
)
// Version is the version string exported by the content package.
//
// NOTE(review): the commit that introduces this file is labelled v0.3.0,
// while this constant reads "1.0.0" — confirm the package is meant to be
// versioned independently of the application.
const Version = "1.0.0"
// DetectLanguage returns the language name that go-enry reports for text.
//
// An empty filename is passed to enry.GetLanguage, so no file name or
// extension is available to the detector; only the content of text is
// supplied. Whatever enry returns is passed through unchanged
// (presumably an empty string when no language can be determined —
// confirm against the go-enry documentation).
func DetectLanguage(text string) string {
	content := []byte(text)
	lang := enry.GetLanguage("", content)
	return lang
}
// Filter runs text through FilterBasic and returns the result.
//
// The second argument to FilterBasic is always nil here; presumably that
// selects FilterBasic's default behavior — verify against its definition.
func Filter(text string) string {
	filtered := FilterBasic(text, nil)
	return filtered
}