Convert EOL to UNIX-style to render MD properly (#8925)

author guillep2k <18600385+guillep2k@users.noreply.github.com>

Wed, 13 Nov 2019 02:27:11 +0000 (23:27 -0300)

committer Antoine GIRARD <sapk@users.noreply.github.com>

Wed, 13 Nov 2019 02:27:11 +0000 (03:27 +0100)
author guillep2k <18600385+guillep2k@users.noreply.github.com>
Wed, 13 Nov 2019 02:27:11 +0000 (23:27 -0300)
committer Antoine GIRARD <sapk@users.noreply.github.com>
Wed, 13 Nov 2019 02:27:11 +0000 (03:27 +0100)
diff --git a/modules/markup/markdown/markdown.go b/modules/markup/markdown/markdown.go

index ff78d7ea3a8e44535d14b8732edf309e64b9a585..fc704243e2d7f28997ea2a54c8844fa228e6b58d 100644 (file)
--- a/modules/markup/markdown/markdown.go
+++ b/modules/markup/markdown/markdown.go
@@ -157,7 +157,8 @@ func RenderRaw(body []byte, urlPrefix string, wikiMarkdown bool) []byte {
                 exts |= blackfriday.HardLineBreak
         }
  
-       body = blackfriday.Run(body, blackfriday.WithRenderer(renderer), blackfriday.WithExtensions(exts))
+       // Need to normalize EOL to UNIX LF to have consistent results in rendering
+       body = blackfriday.Run(util.NormalizeEOL(body), blackfriday.WithRenderer(renderer), blackfriday.WithExtensions(exts))
         return markup.SanitizeBytes(body)
  }
  
diff --git a/modules/markup/markdown/markdown_test.go b/modules/markup/markdown/markdown_test.go

index b29f870ce52685e4002335aeb13e1c22f403d14e..e80173c6cf3225a8dea9aa3ba756921a405bd5f0 100644 (file)
--- a/modules/markup/markdown/markdown_test.go
+++ b/modules/markup/markdown/markdown_test.go
@@ -294,3 +294,25 @@ func TestTotal_RenderString(t *testing.T) {
                 assert.Equal(t, testCases[i+1], line)
         }
  }
+
+func TestRender_RenderParagraphs(t *testing.T) {
+       test := func(t *testing.T, str string, cnt int) {
+               unix := []byte(str)
+               res := string(RenderRaw(unix, "", false))
+               assert.Equal(t, strings.Count(res, "<p"), cnt)
+
+               mac := []byte(strings.ReplaceAll(str, "\n", "\r"))
+               res = string(RenderRaw(mac, "", false))
+               assert.Equal(t, strings.Count(res, "<p"), cnt)
+
+               dos := []byte(strings.ReplaceAll(str, "\n", "\r\n"))
+               res = string(RenderRaw(dos, "", false))
+               assert.Equal(t, strings.Count(res, "<p"), cnt)
+       }
+
+       test(t, "\nOne\nTwo\nThree", 1)
+       test(t, "\n\nOne\nTwo\nThree", 1)
+       test(t, "\n\nOne\nTwo\nThree\n\n\n", 1)
+       test(t, "A\n\nB\nC\n", 2)
+       test(t, "A\n\n\nB\nC\n", 2)
+}
diff --git a/modules/util/util.go b/modules/util/util.go

index 4203b5eb517321026dbf2a5b3b171263d5a448e0..6d02b5f52fa737cff540eebc090545c47170e916 100644 (file)
--- a/modules/util/util.go
+++ b/modules/util/util.go
@@ -5,6 +5,7 @@
  package util
  
  import (
+       "bytes"
         "strings"
  )
  
@@ -63,3 +64,39 @@ func Min(a, b int) int {
  func IsEmptyString(s string) bool {
         return len(strings.TrimSpace(s)) == 0
  }
+
+// NormalizeEOL will convert Windows (CRLF) and Mac (CR) EOLs to UNIX (LF)
+func NormalizeEOL(input []byte) []byte {
+       var right, left, pos int
+       if right = bytes.IndexByte(input, '\r'); right == -1 {
+               return input
+       }
+       length := len(input)
+       tmp := make([]byte, length)
+
+       // We know that left < length because otherwise right would be -1 from IndexByte.
+       copy(tmp[pos:pos+right], input[left:left+right])
+       pos += right
+       tmp[pos] = '\n'
+       left += right + 1
+       pos++
+
+       for left < length {
+               if input[left] == '\n' {
+                       left++
+               }
+
+               right = bytes.IndexByte(input[left:], '\r')
+               if right == -1 {
+                       copy(tmp[pos:], input[left:])
+                       pos += length - left
+                       break
+               }
+               copy(tmp[pos:pos+right], input[left:left+right])
+               pos += right
+               tmp[pos] = '\n'
+               left += right + 1
+               pos++
+       }
+       return tmp[:pos]
+}
diff --git a/modules/util/util_test.go b/modules/util/util_test.go

index 2475065059e88a8ec292fb2c2cfc2d0bb2679bfa..04ab42f29253bb39cbf443df35405126a7d44cc4 100644 (file)
--- a/modules/util/util_test.go
+++ b/modules/util/util_test.go
@@ -5,6 +5,7 @@
  package util
  
  import (
+       "strings"
         "testing"
  
         "code.gitea.io/gitea/modules/setting"
@@ -94,3 +95,61 @@ func TestIsEmptyString(t *testing.T) {
                 assert.Equal(t, v.expected, IsEmptyString(v.s))
         }
  }
+
+func Test_NormalizeEOL(t *testing.T) {
+       data1 := []string{
+               "",
+               "This text starts with empty lines",
+               "another",
+               "",
+               "",
+               "",
+               "Some other empty lines in the middle",
+               "more.",
+               "And more.",
+               "Ends with empty lines too.",
+               "",
+               "",
+               "",
+       }
+
+       data2 := []string{
+               "This text does not start with empty lines",
+               "another",
+               "",
+               "",
+               "",
+               "Some other empty lines in the middle",
+               "more.",
+               "And more.",
+               "Ends without EOLtoo.",
+       }
+
+       buildEOLData := func(data []string, eol string) []byte {
+               return []byte(strings.Join(data, eol))
+       }
+
+       dos := buildEOLData(data1, "\r\n")
+       unix := buildEOLData(data1, "\n")
+       mac := buildEOLData(data1, "\r")
+
+       assert.Equal(t, unix, NormalizeEOL(dos))
+       assert.Equal(t, unix, NormalizeEOL(mac))
+       assert.Equal(t, unix, NormalizeEOL(unix))
+
+       dos = buildEOLData(data2, "\r\n")
+       unix = buildEOLData(data2, "\n")
+       mac = buildEOLData(data2, "\r")
+
+       assert.Equal(t, unix, NormalizeEOL(dos))
+       assert.Equal(t, unix, NormalizeEOL(mac))
+       assert.Equal(t, unix, NormalizeEOL(unix))
+
+       assert.Equal(t, []byte("one liner"), NormalizeEOL([]byte("one liner")))
+       assert.Equal(t, []byte("\n"), NormalizeEOL([]byte("\n")))
+       assert.Equal(t, []byte("\ntwo liner"), NormalizeEOL([]byte("\ntwo liner")))
+       assert.Equal(t, []byte("two liner\n"), NormalizeEOL([]byte("two liner\n")))
+       assert.Equal(t, []byte{}, NormalizeEOL([]byte{}))
+
+       assert.Equal(t, []byte("mix\nand\nmatch\n."), NormalizeEOL([]byte("mix\r\nand\rmatch\n.")))
+}
author	guillep2k <18600385+guillep2k@users.noreply.github.com>
	Wed, 13 Nov 2019 02:27:11 +0000 (23:27 -0300)
committer	Antoine GIRARD <sapk@users.noreply.github.com>
	Wed, 13 Nov 2019 02:27:11 +0000 (03:27 +0100)
modules/markup/markdown/markdown.go		patch \| blob \| history
modules/markup/markdown/markdown_test.go		patch \| blob \| history
modules/util/util.go		patch \| blob \| history
modules/util/util_test.go		patch \| blob \| history