Fix parsing edge case of frontmatter
authorNoah Campbell <noahcampbell@gmail.com>
Wed, 18 Sep 2013 16:15:46 +0000 (09:15 -0700)
committerNoah Campbell <noahcampbell@gmail.com>
Wed, 18 Sep 2013 16:15:46 +0000 (09:15 -0700)
When the frontmatter contains a - (or other delimiter) close to the
closing frontmatter delimiter, frontmatter detection would fail.

hugolib/page.go
hugolib/page_test.go
hugolib/site.go
hugolib/site_url_test.go
parser/page.go
parser/parse_frontmatter_test.go
transform/post.go
transform/posttrans_test.go

index 3738483c7c1c12a235ea46957de9de1482e3b870..79c414aaf6d1fd36d99de2d23ef0fd55b49af3d2 100644 (file)
@@ -19,10 +19,10 @@ import (
        "errors"
        "fmt"
        "github.com/BurntSushi/toml"
+       "github.com/spf13/hugo/parser"
        helper "github.com/spf13/hugo/template"
        "github.com/spf13/hugo/template/bundle"
        "github.com/theplant/blackfriday"
-       "github.com/spf13/hugo/parser"
        "html/template"
        "io"
        "launchpad.net/goyaml"
index a2a4999dfe5e5c09c66a77729dd6e2aa8a2d6ced..64395decfa9a2a5e3a93205115122ab3366d177e 100644 (file)
@@ -10,13 +10,8 @@ import (
 
 var EMPTY_PAGE = ""
 
-var SIMPLE_PAGE = `---
-title: Simple
----
-Simple Page
-`
-
-var INVALID_FRONT_MATTER_MISSING = `This is a test`
+var SIMPLE_PAGE = "---\ntitle: Simple\n---\nSimple Page\n"
+var INVALID_FRONT_MATTER_MISSING = "This is a test"
 
 var INVALID_FRONT_MATTER_SHORT_DELIM = `
 --
@@ -95,7 +90,7 @@ type and layout set`
 var SIMPLE_PAGE_WITH_SUMMARY_DELIMITER = `---
 title: Simple
 ---
-Simple Page
+Summary Next Line
 
 <!--more-->
 Some more text
@@ -104,7 +99,7 @@ Some more text
 var SIMPLE_PAGE_WITH_SUMMARY_DELIMITER_SAME_LINE = `---
 title: Simple
 ---
-Simple Page<!--more-->
+Summary Same Line<!--more-->
 
 Some more text
 `
@@ -144,7 +139,7 @@ func checkPageTitle(t *testing.T, page *Page, title string) {
 
 func checkPageContent(t *testing.T, page *Page, content string) {
        if page.Content != template.HTML(content) {
-               t.Fatalf("Page content is: %s.  Expected %s", page.Content, content)
+               t.Fatalf("Page content mismatch\nexp: %q\ngot: %q", content, page.Content)
        }
 }
 
@@ -190,8 +185,8 @@ func TestPageWithDelimiter(t *testing.T) {
                t.Fatalf("Unable to create a page with frontmatter and body content: %s", err)
        }
        checkPageTitle(t, p, "Simple")
-       checkPageContent(t, p, "<p>Simple Page</p>\n\n<p>Some more text</p>\n")
-       checkPageSummary(t, p, "<p>Simple Page</p>\n")
+       checkPageContent(t, p, "<p>Summary Next Line</p>\n\n<p>Some more text</p>\n")
+       checkPageSummary(t, p, "<p>Summary Next Line</p>\n")
        checkPageType(t, p, "page")
        checkPageLayout(t, p, "page/single.html")
 
@@ -203,8 +198,8 @@ func TestPageWithMoreTag(t *testing.T) {
                t.Fatalf("Unable to create a page with frontmatter and body content: %s", err)
        }
        checkPageTitle(t, p, "Simple")
-       checkPageContent(t, p, "<p>Simple Page</p>\n\n<p>Some more text</p>\n")
-       checkPageSummary(t, p, "<p>Simple Page</p>\n")
+       checkPageContent(t, p, "<p>Summary Same Line</p>\n\n<p>Some more text</p>\n")
+       checkPageSummary(t, p, "<p>Summary Same Line</p>\n")
        checkPageType(t, p, "page")
        checkPageLayout(t, p, "page/single.html")
 }
@@ -243,7 +238,7 @@ func TestDegenerateInvalidFrontMatterShortDelim(t *testing.T) {
                err string
        }{
                {INVALID_FRONT_MATTER_SHORT_DELIM, "Unable to locate frontmatter"},
-               {INVALID_FRONT_MATTER_SHORT_DELIM_ENDING, "EOF"},
+               {INVALID_FRONT_MATTER_SHORT_DELIM_ENDING, "Unable to read frontmatter at filepos 45: EOF"},
                {INVALID_FRONT_MATTER_MISSING, "Unable to locate frontmatter"},
        }
        for _, test := range tests {
index bfbb4ab24d1fce7411db62f8093f5c7639f39ec9..2c81655431b9071a8ca3af9161e35740dce2c1b8 100644 (file)
@@ -14,7 +14,6 @@
 package hugolib
 
 import (
-       "io"
        "bitbucket.org/pkg/inflect"
        "bytes"
        "fmt"
@@ -25,6 +24,7 @@ import (
        "github.com/spf13/hugo/transform"
        "github.com/spf13/nitro"
        "html/template"
+       "io"
        "os"
        "path"
        "strings"
@@ -68,18 +68,18 @@ func PrintErr(str string, a ...interface{}) {
 //
 // 5. The entire collection of files is written to disk.
 type Site struct {
-       Config     Config
-       Pages      Pages
-       Tmpl       bundle.Template
-       Indexes    IndexList
-       Source     source.Input
-       Sections   Index
-       Info       SiteInfo
-       Shortcodes map[string]ShortcodeFunc
-       timer      *nitro.B
+       Config      Config
+       Pages       Pages
+       Tmpl        bundle.Template
+       Indexes     IndexList
+       Source      source.Input
+       Sections    Index
+       Info        SiteInfo
+       Shortcodes  map[string]ShortcodeFunc
+       timer       *nitro.B
        Transformer *transform.Transformer
-       Target     target.Output
-       Alias      target.AliasPublisher
+       Target      target.Output
+       Alias       target.AliasPublisher
 }
 
 type SiteInfo struct {
index ef226fe7f59c1f2e2f4e24d5b27334eafa512b55..b9c30fec4e80357fb209f3adfc983571edd96b2d 100644 (file)
@@ -10,7 +10,12 @@ import (
 
 const SLUG_DOC_1 = "---\ntitle: slug doc 1\nslug: slug-doc-1\naliases:\n - sd1/foo/\n - sd2\n - sd3/\n - sd4.html\n---\nslug doc 1 content\n"
 
-const SLUG_DOC_2 = "---\ntitle: slug doc 2\nslug: slug-doc-2\n---\nslug doc 2 content\n"
+const SLUG_DOC_2 = `---
+title: slug doc 2
+slug: slug-doc-2
+---
+slug doc 2 content
+`
 
 const INDEX_TEMPLATE = "{{ range .Data.Pages }}.{{ end }}"
 
@@ -58,7 +63,7 @@ func (t *InMemoryAliasTarget) Publish(label string, permalink template.HTML) (er
 
 var urlFakeSource = []byteSource{
        {"content/blue/doc1.md", []byte(SLUG_DOC_1)},
-//     {"content/blue/doc2.md", []byte(SLUG_DOC_2)},
+       {"content/blue/doc2.md", []byte(SLUG_DOC_2)},
 }
 
 func TestPageCount(t *testing.T) {
@@ -95,7 +100,7 @@ func TestPageCount(t *testing.T) {
                t.Errorf("No indexed rendered. %v", target.files)
        }
 
-       expected := "<html><head></head><body>.</body></html>"
+       expected := "<html><head></head><body>..</body></html>"
        if string(blueIndex) != expected {
                t.Errorf("Index template does not match expected: %q, got: %q", expected, string(blueIndex))
        }
index 2df4ce635a2faf915a438feafe31d8a888f37db7..eb8672bd4faedda27e8189e1fb665f912dce65d7 100644 (file)
@@ -2,9 +2,9 @@ package parser
 
 import (
        "bufio"
-       "fmt"
        "bytes"
        "errors"
+       "fmt"
        "io"
        "unicode"
 )
@@ -164,22 +164,34 @@ func determineDelims(firstLine []byte) (left, right []byte) {
 }
 
 func extractFrontMatterDelims(r *bufio.Reader, left, right []byte) (fm FrontMatter, err error) {
-       var level int = 0
-       var sameDelim = bytes.Equal(left, right)
+       var (
+               c         byte
+               level     int = 0
+               bytesRead int = 0
+               sameDelim     = bytes.Equal(left, right)
+       )
+
        wr := new(bytes.Buffer)
        for {
-               c, err := r.ReadByte()
-               if err != nil {
-                       return nil, err
+               if c, err = r.ReadByte(); err != nil {
+                       return nil, fmt.Errorf("Unable to read frontmatter at filepos %d: %s", bytesRead, err)
                }
+               bytesRead += 1
 
                switch c {
                case left[0]:
-                       match, err := matches(r, wr, []byte{c}, left)
-                       if err != nil {
+                       var (
+                               buf       []byte = []byte{c}
+                               remaining []byte
+                       )
+
+                       if remaining, err = r.Peek(len(left) - 1); err != nil {
                                return nil, err
                        }
-                       if match {
+
+                       buf = append(buf, remaining...)
+
+                       if bytes.Equal(buf, left) {
                                if sameDelim {
                                        if level == 0 {
                                                level = 1
@@ -190,6 +202,19 @@ func extractFrontMatterDelims(r *bufio.Reader, left, right []byte) (fm FrontMatt
                                        level += 1
                                }
                        }
+
+                       if _, err = wr.Write([]byte{c}); err != nil {
+                               return nil, err
+                       }
+
+                       if level == 0 {
+                               if _, err = r.Read(remaining); err != nil {
+                                       return nil, err
+                               }
+                               if _, err = wr.Write(remaining); err != nil {
+                                       return nil, err
+                               }
+                       }
                case right[0]:
                        match, err := matches(r, wr, []byte{c}, right)
                        if err != nil {
@@ -216,6 +241,10 @@ func extractFrontMatterDelims(r *bufio.Reader, left, right []byte) (fm FrontMatt
        return nil, errors.New("Could not find front matter.")
 }
 
+func matches_quick(buf, expected []byte) (ok bool, err error) {
+       return bytes.Equal(expected, buf), nil
+}
+
 func matches(r *bufio.Reader, wr io.Writer, c, expected []byte) (ok bool, err error) {
        if len(expected) == 1 {
                if _, err = wr.Write(c); err != nil {
@@ -223,16 +252,13 @@ func matches(r *bufio.Reader, wr io.Writer, c, expected []byte) (ok bool, err er
                }
                return bytes.Equal(c, expected), nil
        }
+
        buf := make([]byte, len(expected)-1)
-       if _, err = r.Read(buf); err != nil {
+       if buf, err = r.Peek(len(expected) - 1); err != nil {
                return
        }
 
        buf = append(c, buf...)
-       if _, err = wr.Write(buf); err != nil {
-               return
-       }
-
        return bytes.Equal(expected, buf), nil
 }
 
index 1da38a1850c3e4e452b6dec269ad6bd45795af47..6d65d9dcb54d9f45f36dd504126d9bc2ac134d26 100644 (file)
@@ -24,12 +24,15 @@ var (
        CONTENT_INCOMPLETE_BEG_FM_DELIM = "--\ntitle: incomplete beg fm delim\n---\nincomplete frontmatter delim"
        CONTENT_INCOMPLETE_END_FM_DELIM = "---\ntitle: incomplete end fm delim\n--\nincomplete frontmatter delim"
        CONTENT_MISSING_END_FM_DELIM    = "---\ntitle: incomplete end fm delim\nincomplete frontmatter delim"
+       CONTENT_SLUG_WORKING            = "---\ntitle: slug doc 2\nslug: slug-doc-2\n\n---\nslug doc 2 content"
+       CONTENT_SLUG_WORKING_VARIATION  = "---\ntitle: slug doc 3\nslug: slug-doc 3\n---\nslug doc 3 content"
+       CONTENT_SLUG_BUG                = "---\ntitle: slug doc 2\nslug: slug-doc-2\n---\nslug doc 2 content"
        CONTENT_FM_NO_DOC               = "---\ntitle: no doc\n---"
-       CONTENT_WITH_JS_FM = "{\n  \"categories\": \"d\",\n  \"tags\": [\n    \"a\", \n    \"b\", \n    \"c\"\n  ]\n}\nJSON Front Matter with tags and categories"
+       CONTENT_WITH_JS_FM              = "{\n  \"categories\": \"d\",\n  \"tags\": [\n    \"a\", \n    \"b\", \n    \"c\"\n  ]\n}\nJSON Front Matter with tags and categories"
 )
 
 var lineEndings = []string{"\n", "\r\n"}
-var delimiters = []string{"-", "+"}
+var delimiters = []string{"---", "+++"}
 
 func pageMust(p Page, err error) *page {
        if err != nil {
@@ -83,13 +86,13 @@ func checkPageFrontMatterContent(t *testing.T, p *page, frontMatter string) {
                return
        }
        if !bytes.Equal(p.frontmatter, []byte(frontMatter)) {
-               t.Errorf("expected frontmatter %q, got %q", frontMatter, p.frontmatter)
+               t.Errorf("frontmatter mismatch\nexp: %q\ngot: %q", frontMatter, p.frontmatter)
        }
 }
 
 func checkPageContent(t *testing.T, p *page, expected string) {
        if !bytes.Equal(p.content, []byte(expected)) {
-               t.Errorf("expected content %q, got %q", expected, p.content)
+               t.Errorf("content mismatch\nexp: %q\ngot: %q", expected, p.content)
        }
 }
 
@@ -101,6 +104,7 @@ func TestStandaloneCreatePageFrom(t *testing.T) {
                frontMatter        string
                bodycontent        string
        }{
+
                {CONTENT_NO_FRONTMATTER, true, true, "", "a page with no front matter"},
                {CONTENT_WITH_FRONTMATTER, true, false, "---\ntitle: front matter\n---\n", "Content with front matter"},
                {CONTENT_HTML_NODOCTYPE, false, true, "", "<html>\n\t<body>\n\t</body>\n</html>"},
@@ -109,6 +113,9 @@ func TestStandaloneCreatePageFrom(t *testing.T) {
                {CONTENT_LWS_HTML, false, true, "", "<html><body></body></html>"},
                {CONTENT_LWS_LF_HTML, false, true, "", "<html><body></body></html>"},
                {CONTENT_WITH_JS_FM, true, false, "{\n  \"categories\": \"d\",\n  \"tags\": [\n    \"a\", \n    \"b\", \n    \"c\"\n  ]\n}", "JSON Front Matter with tags and categories"},
+               {CONTENT_SLUG_WORKING, true, false, "---\ntitle: slug doc 2\nslug: slug-doc-2\n\n---\n", "slug doc 2 content"},
+               {CONTENT_SLUG_WORKING_VARIATION, true, false, "---\ntitle: slug doc 3\nslug: slug-doc 3\n---\n", "slug doc 3 content"},
+               {CONTENT_SLUG_BUG, true, false, "---\ntitle: slug doc 2\nslug: slug-doc-2\n---\n", "slug doc 2 content"},
        }
 
        for _, test := range tests {
@@ -224,6 +231,7 @@ func TestExtractFrontMatter(t *testing.T) {
                {"---\nralb\n---\n", []byte("---\nralb\n---\n"), true},
                {"---\nminc\n---\ncontent", []byte("---\nminc\n---\n"), true},
                {"---\ncnim\n---\ncontent\n", []byte("---\ncnim\n---\n"), true},
+               {"---\ntitle: slug doc 2\nslug: slug-doc-2\n---\ncontent\n", []byte("---\ntitle: slug doc 2\nslug: slug-doc-2\n---\n"), true},
        }
 
        for _, test := range tests {
@@ -231,8 +239,8 @@ func TestExtractFrontMatter(t *testing.T) {
                        test.frontmatter = strings.Replace(test.frontmatter, "\n", ending, -1)
                        test.extracted = bytes.Replace(test.extracted, []byte("\n"), []byte(ending), -1)
                        for _, delim := range delimiters {
-                               test.frontmatter = strings.Replace(test.frontmatter, "-", delim, -1)
-                               test.extracted = bytes.Replace(test.extracted, []byte("-"), []byte(delim), -1)
+                               test.frontmatter = strings.Replace(test.frontmatter, "---", delim, -1)
+                               test.extracted = bytes.Replace(test.extracted, []byte("---"), []byte(delim), -1)
                                line, err := peekLine(bufio.NewReader(strings.NewReader(test.frontmatter)))
                                if err != nil {
                                        continue
@@ -245,8 +253,7 @@ func TestExtractFrontMatter(t *testing.T) {
                                        continue
                                }
                                if !bytes.Equal(fm, test.extracted) {
-                                       t.Logf("\n%q\n", string(test.frontmatter))
-                                       t.Errorf("Expected front matter %q. got %q", string(test.extracted), fm)
+                                       t.Errorf("Frontmatter did not match:\nexp: %q\ngot: %q", string(test.extracted), fm)
                                }
                        }
                }
@@ -285,8 +292,7 @@ func TestExtractFrontMatterDelim(t *testing.T) {
                }
                if !bytes.Equal(fm, []byte(test.extracted)) {
                        t.Logf("\n%q\n", string(test.frontmatter))
-                       t.Errorf("Expected front matter %q. got %q", string(test.extracted), fm)
+                       t.Errorf("Frontmatter did not match:\nexp: %q\ngot: %q", string(test.extracted), fm)
                }
        }
 }
-
index f63f1683b5a5d5537265575d31976bbf60dff9f1..369b2d6cac86cbe9bcb970bcfa10311b37692870 100644 (file)
@@ -1,9 +1,9 @@
 package transform
 
 import (
+       htmltran "code.google.com/p/go-html-transform/html/transform"
        "io"
        "net/url"
-       htmltran "code.google.com/p/go-html-transform/html/transform"
 )
 
 type Transformer struct {
index de2d2277c34608633d8ac0aaded5689d0f653628..08fe18c11d0a99377d8956e6392060395f203e4f 100644 (file)
@@ -1,23 +1,23 @@
 package transform
 
 import (
-       "testing"
-       "strings"
        "bytes"
+       "strings"
+       "testing"
 )
 
 const H5_JS_CONTENT_DOUBLE_QUOTE = "<!DOCTYPE html><html><head><script src=\"foobar.js\"></script></head><body><nav><h1>title</h1></nav><article>content <a href='/foobar'>foobar</a>. Follow up</article></body></html>"
 const H5_JS_CONTENT_SINGLE_QUOTE = "<!DOCTYPE html><html><head><script src='foobar.js'></script></head><body><nav><h1>title</h1></nav><article>content <a href='/foobar'>foobar</a>. Follow up</article></body></html>"
 const H5_JS_CONTENT_ABS_URL = "<!DOCTYPE html><html><head><script src=\"http://user@host:10234/foobar.js\"></script></head><body><nav><h1>title</h1></nav><article>content <a href=\"https://host/foobar\">foobar</a>. Follow up</article></body></html>"
+
 // URL doesn't recognize authorities.  BUG?
 //const H5_JS_CONTENT_ABS_URL = "<!DOCTYPE html><html><head><script src=\"//host/foobar.js\"></script></head><body><nav><h1>title</h1></nav><article>content <a href=\"https://host/foobar\">foobar</a>. Follow up</article></body></html>"
 
 const CORRECT_OUTPUT_SRC_HREF = "<!DOCTYPE html><html><head><script src=\"http://base/foobar.js\"></script></head><body><nav><h1>title</h1></nav><article>content <a href=\"http://base/foobar\">foobar</a>. Follow up</article></body></html>"
 
-
 func TestAbsUrlify(t *testing.T) {
        tests := []struct {
-               content string
+               content  string
                expected string
        }{
                {H5_JS_CONTENT_DOUBLE_QUOTE, CORRECT_OUTPUT_SRC_HREF},
@@ -29,13 +29,13 @@ func TestAbsUrlify(t *testing.T) {
                tr := &Transformer{
                        BaseURL: "http://base",
                }
-       out := new(bytes.Buffer)
-       err := tr.Apply(strings.NewReader(test.content), out)
-       if err != nil {
-               t.Errorf("Unexpected error: %s", err)
-       }
-       if test.expected != string(out.Bytes()) {
-               t.Errorf("Expected:\n%s\nGot:\n%s", test.expected, string(out.Bytes()))
+               out := new(bytes.Buffer)
+               err := tr.Apply(strings.NewReader(test.content), out)
+               if err != nil {
+                       t.Errorf("Unexpected error: %s", err)
+               }
+               if test.expected != string(out.Bytes()) {
+                       t.Errorf("Expected:\n%s\nGot:\n%s", test.expected, string(out.Bytes()))
+               }
        }
 }
-}