You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

markdown.go 9.7 kB

12 years ago
12 years ago
10 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
10 years ago
10 years ago
10 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357
  1. // Copyright 2014 The Gogs Authors. All rights reserved.
  2. // Use of this source code is governed by a MIT-style
  3. // license that can be found in the LICENSE file.
  4. package base
  5. import (
  6. "bytes"
  7. "fmt"
  8. "io"
  9. "net/http"
  10. "path"
  11. "path/filepath"
  12. "regexp"
  13. "strings"
  14. "github.com/Unknwon/com"
  15. "github.com/russross/blackfriday"
  16. "golang.org/x/net/html"
  17. "github.com/gogits/gogs/modules/setting"
  18. )
  19. // TODO: put this into 'markdown' module.
  20. func isletter(c byte) bool {
  21. return (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z')
  22. }
  23. func isalnum(c byte) bool {
  24. return (c >= '0' && c <= '9') || isletter(c)
  25. }
  26. var validLinks = [][]byte{[]byte("http://"), []byte("https://"), []byte("ftp://"), []byte("mailto://")}
  27. func isLink(link []byte) bool {
  28. for _, prefix := range validLinks {
  29. if len(link) > len(prefix) && bytes.Equal(bytes.ToLower(link[:len(prefix)]), prefix) && isalnum(link[len(prefix)]) {
  30. return true
  31. }
  32. }
  33. return false
  34. }
  35. func IsMarkdownFile(name string) bool {
  36. name = strings.ToLower(name)
  37. switch filepath.Ext(name) {
  38. case ".md", ".markdown", ".mdown", ".mkd":
  39. return true
  40. }
  41. return false
  42. }
  43. func IsTextFile(data []byte) (string, bool) {
  44. contentType := http.DetectContentType(data)
  45. if strings.Index(contentType, "text/") != -1 {
  46. return contentType, true
  47. }
  48. return contentType, false
  49. }
  50. func IsImageFile(data []byte) (string, bool) {
  51. contentType := http.DetectContentType(data)
  52. if strings.Index(contentType, "image/") != -1 {
  53. return contentType, true
  54. }
  55. return contentType, false
  56. }
  57. // IsReadmeFile returns true if given file name suppose to be a README file.
  58. func IsReadmeFile(name string) bool {
  59. name = strings.ToLower(name)
  60. if len(name) < 6 {
  61. return false
  62. } else if len(name) == 6 {
  63. if name == "readme" {
  64. return true
  65. }
  66. return false
  67. }
  68. if name[:7] == "readme." {
  69. return true
  70. }
  71. return false
  72. }
  73. var (
  74. MentionPattern = regexp.MustCompile(`(\s|^)@[0-9a-zA-Z_\.]+`)
  75. commitPattern = regexp.MustCompile(`(\s|^)https?.*commit/[0-9a-zA-Z]+(#+[0-9a-zA-Z-]*)?`)
  76. issueFullPattern = regexp.MustCompile(`(\s|^)https?.*issues/[0-9]+(#+[0-9a-zA-Z-]*)?`)
  77. issueIndexPattern = regexp.MustCompile(`( |^|\()#[0-9]+\b`)
  78. sha1CurrentPattern = regexp.MustCompile(`\b[0-9a-f]{40}\b`)
  79. )
  80. type CustomRender struct {
  81. blackfriday.Renderer
  82. urlPrefix string
  83. }
  84. func (r *CustomRender) Link(out *bytes.Buffer, link []byte, title []byte, content []byte) {
  85. if len(link) > 0 && !isLink(link) {
  86. if link[0] == '#' {
  87. // link = append([]byte(options.urlPrefix), link...)
  88. } else {
  89. link = []byte(path.Join(r.urlPrefix, string(link)))
  90. }
  91. }
  92. r.Renderer.Link(out, link, title, content)
  93. }
  94. func (r *CustomRender) AutoLink(out *bytes.Buffer, link []byte, kind int) {
  95. if kind != 1 {
  96. r.Renderer.AutoLink(out, link, kind)
  97. return
  98. }
  99. // This method could only possibly serve one link at a time, no need to find all.
  100. m := commitPattern.Find(link)
  101. if m != nil {
  102. m = bytes.TrimSpace(m)
  103. i := strings.Index(string(m), "commit/")
  104. j := strings.Index(string(m), "#")
  105. if j == -1 {
  106. j = len(m)
  107. }
  108. out.WriteString(fmt.Sprintf(` <code><a href="%s">%s</a></code>`, m, ShortSha(string(m[i+7:j]))))
  109. return
  110. }
  111. m = issueFullPattern.Find(link)
  112. if m != nil {
  113. m = bytes.TrimSpace(m)
  114. i := strings.Index(string(m), "issues/")
  115. j := strings.Index(string(m), "#")
  116. if j == -1 {
  117. j = len(m)
  118. }
  119. out.WriteString(fmt.Sprintf(` <a href="%s">#%s</a>`, m, ShortSha(string(m[i+7:j]))))
  120. return
  121. }
  122. r.Renderer.AutoLink(out, link, kind)
  123. }
  124. func (options *CustomRender) ListItem(out *bytes.Buffer, text []byte, flags int) {
  125. switch {
  126. case bytes.HasPrefix(text, []byte("[ ] ")):
  127. text = append([]byte(`<input type="checkbox" disabled="" />`), text[3:]...)
  128. case bytes.HasPrefix(text, []byte("[x] ")):
  129. text = append([]byte(`<input type="checkbox" disabled="" checked="" />`), text[3:]...)
  130. }
  131. options.Renderer.ListItem(out, text, flags)
  132. }
  133. var (
  134. svgSuffix = []byte(".svg")
  135. svgSuffixWithMark = []byte(".svg?")
  136. )
  137. func (r *CustomRender) Image(out *bytes.Buffer, link []byte, title []byte, alt []byte) {
  138. prefix := strings.Replace(r.urlPrefix, "/src/", "/raw/", 1)
  139. if len(link) > 0 {
  140. if isLink(link) {
  141. // External link with .svg suffix usually means CI status.
  142. if bytes.HasSuffix(link, svgSuffix) || bytes.Contains(link, svgSuffixWithMark) {
  143. r.Renderer.Image(out, link, title, alt)
  144. return
  145. }
  146. } else {
  147. if link[0] != '/' {
  148. prefix += "/"
  149. }
  150. link = []byte(prefix + string(link))
  151. }
  152. }
  153. out.WriteString(`<a href="`)
  154. out.Write(link)
  155. out.WriteString(`">`)
  156. r.Renderer.Image(out, link, title, alt)
  157. out.WriteString("</a>")
  158. }
  159. func cutoutVerbosePrefix(prefix string) string {
  160. count := 0
  161. for i := 0; i < len(prefix); i++ {
  162. if prefix[i] == '/' {
  163. count++
  164. }
  165. if count >= 3+setting.AppSubUrlDepth {
  166. return prefix[:i]
  167. }
  168. }
  169. return prefix
  170. }
  171. func RenderIssueIndexPattern(rawBytes []byte, urlPrefix string, metas map[string]string) []byte {
  172. urlPrefix = cutoutVerbosePrefix(urlPrefix)
  173. ms := issueIndexPattern.FindAll(rawBytes, -1)
  174. for _, m := range ms {
  175. var space string
  176. m2 := m
  177. if m2[0] != '#' {
  178. space = string(m2[0])
  179. m2 = m2[1:]
  180. }
  181. if metas == nil {
  182. rawBytes = bytes.Replace(rawBytes, m, []byte(fmt.Sprintf(`%s<a href="%s/issues/%s">%s</a>`,
  183. space, urlPrefix, m2[1:], m2)), 1)
  184. } else {
  185. // Support for external issue tracker
  186. metas["index"] = string(m2[1:])
  187. rawBytes = bytes.Replace(rawBytes, m, []byte(fmt.Sprintf(`%s<a href="%s">%s</a>`,
  188. space, com.Expand(metas["format"], metas), m2)), 1)
  189. }
  190. }
  191. return rawBytes
  192. }
  193. func RenderSpecialLink(rawBytes []byte, urlPrefix string, metas map[string]string) []byte {
  194. ms := MentionPattern.FindAll(rawBytes, -1)
  195. for _, m := range ms {
  196. m = bytes.TrimSpace(m)
  197. rawBytes = bytes.Replace(rawBytes, m,
  198. []byte(fmt.Sprintf(`<a href="%s/%s">%s</a>`, setting.AppSubUrl, m[1:], m)), -1)
  199. }
  200. rawBytes = RenderIssueIndexPattern(rawBytes, urlPrefix, metas)
  201. rawBytes = RenderSha1CurrentPattern(rawBytes, urlPrefix)
  202. return rawBytes
  203. }
  204. func RenderSha1CurrentPattern(rawBytes []byte, urlPrefix string) []byte {
  205. ms := sha1CurrentPattern.FindAll(rawBytes, -1)
  206. for _, m := range ms {
  207. rawBytes = bytes.Replace(rawBytes, m, []byte(fmt.Sprintf(
  208. `<a href="%s/commit/%s"><code>%s</code></a>`, urlPrefix, m, ShortSha(string(m)))), -1)
  209. }
  210. return rawBytes
  211. }
  212. func RenderRawMarkdown(body []byte, urlPrefix string) []byte {
  213. htmlFlags := 0
  214. htmlFlags |= blackfriday.HTML_SKIP_STYLE
  215. htmlFlags |= blackfriday.HTML_OMIT_CONTENTS
  216. renderer := &CustomRender{
  217. Renderer: blackfriday.HtmlRenderer(htmlFlags, "", ""),
  218. urlPrefix: urlPrefix,
  219. }
  220. // set up the parser
  221. extensions := 0
  222. extensions |= blackfriday.EXTENSION_NO_INTRA_EMPHASIS
  223. extensions |= blackfriday.EXTENSION_TABLES
  224. extensions |= blackfriday.EXTENSION_FENCED_CODE
  225. extensions |= blackfriday.EXTENSION_AUTOLINK
  226. extensions |= blackfriday.EXTENSION_STRIKETHROUGH
  227. extensions |= blackfriday.EXTENSION_SPACE_HEADERS
  228. extensions |= blackfriday.EXTENSION_NO_EMPTY_LINE_BEFORE_BLOCK
  229. if setting.Markdown.EnableHardLineBreak {
  230. extensions |= blackfriday.EXTENSION_HARD_LINE_BREAK
  231. }
  232. body = blackfriday.Markdown(body, renderer, extensions)
  233. return body
  234. }
  235. var (
  236. leftAngleBracket = []byte("</")
  237. rightAngleBracket = []byte(">")
  238. )
  239. var noEndTags = []string{"img", "input", "br", "hr"}
  240. // PostProcessMarkdown treats different types of HTML differently,
  241. // and only renders special links for plain text blocks.
  242. func PostProcessMarkdown(rawHtml []byte, urlPrefix string, metas map[string]string) []byte {
  243. startTags := make([]string, 0, 5)
  244. var buf bytes.Buffer
  245. tokenizer := html.NewTokenizer(bytes.NewReader(rawHtml))
  246. OUTER_LOOP:
  247. for html.ErrorToken != tokenizer.Next() {
  248. token := tokenizer.Token()
  249. switch token.Type {
  250. case html.TextToken:
  251. buf.Write(RenderSpecialLink([]byte(token.String()), urlPrefix, metas))
  252. case html.StartTagToken:
  253. buf.WriteString(token.String())
  254. tagName := token.Data
  255. // If this is an excluded tag, we skip processing all output until a close tag is encountered.
  256. if strings.EqualFold("a", tagName) || strings.EqualFold("code", tagName) || strings.EqualFold("pre", tagName) {
  257. stackNum := 1
  258. for html.ErrorToken != tokenizer.Next() {
  259. token = tokenizer.Token()
  260. // Copy the token to the output verbatim
  261. buf.WriteString(token.String())
  262. if token.Type == html.StartTagToken {
  263. stackNum++
  264. }
  265. // If this is the close tag to the outer-most, we are done
  266. if token.Type == html.EndTagToken && strings.EqualFold(tagName, token.Data) {
  267. stackNum--
  268. if stackNum == 0 {
  269. break
  270. }
  271. }
  272. }
  273. continue OUTER_LOOP
  274. }
  275. if !com.IsSliceContainsStr(noEndTags, token.Data) {
  276. startTags = append(startTags, token.Data)
  277. }
  278. case html.EndTagToken:
  279. if len(startTags) == 0 {
  280. buf.WriteString(token.String())
  281. break
  282. }
  283. buf.Write(leftAngleBracket)
  284. buf.WriteString(startTags[len(startTags)-1])
  285. buf.Write(rightAngleBracket)
  286. startTags = startTags[:len(startTags)-1]
  287. default:
  288. buf.WriteString(token.String())
  289. }
  290. }
  291. if io.EOF == tokenizer.Err() {
  292. return buf.Bytes()
  293. }
  294. // If we are not at the end of the input, then some other parsing error has occurred,
  295. // so return the input verbatim.
  296. return rawHtml
  297. }
  298. func RenderMarkdown(rawBytes []byte, urlPrefix string, metas map[string]string) []byte {
  299. result := RenderRawMarkdown(rawBytes, urlPrefix)
  300. result = PostProcessMarkdown(result, urlPrefix, metas)
  301. result = Sanitizer.SanitizeBytes(result)
  302. return result
  303. }
  304. func RenderMarkdownString(raw, urlPrefix string, metas map[string]string) string {
  305. return string(RenderMarkdown([]byte(raw), urlPrefix, metas))
  306. }