summaryrefslogtreecommitdiff
path: root/internal/text/plain_test.go
diff options
context:
space:
mode:
authorLibravatar Vyr Cossont <VyrCossont@users.noreply.github.com>2025-01-31 02:42:55 -0800
committerLibravatar GitHub <noreply@github.com>2025-01-31 11:42:55 +0100
commitb9e0689359f347edc47487a8043c9004ead0770a (patch)
tree514077f83214533ec359a79e0033dcd9015d4ff2 /internal/text/plain_test.go
parent[feature] Add system message wrappers for pending replies and placeholder att... (diff)
downloadgotosocial-b9e0689359f347edc47487a8043c9004ead0770a.tar.xz
[bugfix] Extend parser to handle more non-Latin hashtags (#3700)
* Allow marks after NFC normalization Includes regression test for the Tamil example from #3618 * Disallow just numbers + marks + underscore as hashtag
Diffstat (limited to 'internal/text/plain_test.go')
-rw-r--r--internal/text/plain_test.go41
1 files changed, 25 insertions, 16 deletions
diff --git a/internal/text/plain_test.go b/internal/text/plain_test.go
index fac54a38e..ffa64ce44 100644
--- a/internal/text/plain_test.go
+++ b/internal/text/plain_test.go
@@ -118,20 +118,20 @@ func (suite *PlainTestSuite) TestDeriveHashtagsOK() {
`
tags := suite.FromPlain(statusText).Tags
- suite.Len(tags, 13)
- suite.Equal("testing123", tags[0].Name)
- suite.Equal("also", tags[1].Name)
- suite.Equal("thisshouldwork", tags[2].Name)
- suite.Equal("dupe", tags[3].Name)
- suite.Equal("ThisShouldAlsoWork", tags[4].Name)
- suite.Equal("this_should_not_be_split", tags[5].Name)
- suite.Equal("111111", tags[6].Name)
- suite.Equal("alimentación", tags[7].Name)
- suite.Equal("saúde", tags[8].Name)
- suite.Equal("lävistää", tags[9].Name)
- suite.Equal("ö", tags[10].Name)
- suite.Equal("네", tags[11].Name)
- suite.Equal("ThisOneIsThirteyCharactersLong", tags[12].Name)
+ if suite.Len(tags, 12) {
+ suite.Equal("testing123", tags[0].Name)
+ suite.Equal("also", tags[1].Name)
+ suite.Equal("thisshouldwork", tags[2].Name)
+ suite.Equal("dupe", tags[3].Name)
+ suite.Equal("ThisShouldAlsoWork", tags[4].Name)
+ suite.Equal("this_should_not_be_split", tags[5].Name)
+ suite.Equal("alimentación", tags[6].Name)
+ suite.Equal("saúde", tags[7].Name)
+ suite.Equal("lävistää", tags[8].Name)
+ suite.Equal("ö", tags[9].Name)
+ suite.Equal("네", tags[10].Name)
+ suite.Equal("ThisOneIsThirteyCharactersLong", tags[11].Name)
+ }
statusText = `#올빼미 hej`
tags = suite.FromPlain(statusText).Tags
@@ -170,8 +170,17 @@ func (suite *PlainTestSuite) TestDeriveMultiple() {
func (suite *PlainTestSuite) TestZalgoHashtag() {
statusText := `yo who else loves #praying to #z̸͉̅a̸͚͋l̵͈̊g̸̫͌ỏ̷̪?`
f := suite.FromPlain(statusText)
- suite.Len(f.Tags, 1)
- suite.Equal("praying", f.Tags[0].Name)
+ if suite.Len(f.Tags, 2) {
+ suite.Equal("praying", f.Tags[0].Name)
+ // NFC doesn't do much for Zalgo text, but it's difficult to strip marks without affecting non-Latin text.
+ suite.Equal("z̸͉̅a̸͚͋l̵͈̊g̸̫͌ỏ̷̪", f.Tags[1].Name)
+ }
+}
+
+func (suite *PlainTestSuite) TestNumbersAreNotHashtags() {
+ statusText := `yo who else thinks #19_98 is #1?`
+ f := suite.FromPlain(statusText)
+ suite.Len(f.Tags, 0)
}
func TestPlainTestSuite(t *testing.T) {