diff --git a/main.go b/main.go
index b578fa1..f516d8d 100644
--- a/main.go
+++ b/main.go
@@ -1,7 +1,7 @@
 package main
 
-import "github.com/fengxxc/wechatmp2markdown/parse"
+import "github.com/fengxxc/wechatmp2markdown/test"
 
 func main() {
-	parse.Test()
+	test.Test1()
 }
diff --git a/parse/parse.go b/parse/parse.go
index 9bb0ee2..3a4b58c 100644
--- a/parse/parse.go
+++ b/parse/parse.go
@@ -1,9 +1,12 @@
 package parse
 
 import (
+	"bytes"
 	"fmt"
 	"io"
+	"io/ioutil"
 	"log"
+	"os"
 	"regexp"
 	"strings"
 
@@ -92,6 +95,22 @@ func ParseFromHTMLString(s string) Article {
 	return ParseFromReader(strings.NewReader(s))
 }
 
+// ParseFromHTMLFile opens the file at filepath, reads its entire contents and
+// passes them to ParseFromReader, returning the resulting Article. It panics
+// with the underlying error if the file cannot be opened or read.
+func ParseFromHTMLFile(filepath string) Article {
+	file, err := os.Open(filepath)
+	if err != nil {
+		panic(err)
+	}
+	defer file.Close()
+	content, err2 := ioutil.ReadAll(file)
+	if err2 != nil {
+		panic(err2)
+	}
+	return ParseFromReader(bytes.NewReader(content))
+}
+
 func removeBrAndBlank(s string) string {
 	regstr := "\\s{2,}"
 	reg, _ := regexp.Compile(regstr)
@@ -104,68 +123,3 @@ func removeBrAndBlank(s string) string {
 	}
 	return strings.Replace(string(sb), "\n", " ", -1)
 }
-
-var testHTML = `
-
写公众号一年了,一直盼着能有人喷喷我,今天终于被我碰到了!