Skip to content

saihon/gohtml

Repository files navigation

gohtml

JavaScript-like HTML parser for Go language. If function names, etc. are the same as in JavaScript, it will be easier for JavaScript users to use.


GoDoc Test



Usage

import (
    "github.com/saihon/gohtml"
)

func main() {
    text := "<html><head></head><body></body></html>"

    // Parse text HTML
    document, err := gohtml.Parse(strings.NewReader(text))
    if err != nil {
       return
    }

    documentElement := document.DocumentElement()
    all     := document.All()
    body    := document.Body()
    title   := document.Title() // title string
    head    := document.Head()
    form    := document.Form()
    images  := document.Images()
    links   := document.Links()
    anchors := document.Anchors()


    element := document.GetElementById("id")
    element = document.QuerySelector("div > p")
    // Must be check if element is nil.
    if element != nil {
        textContent := element.TextContent()
        // ...
    }

    // Get HTML collection
    elements := document.GetElementsByClassName("class")
    elements = document.QuerySelectorAll("div > p")
    elements = document.GetElementsByName("name")
    elements = document.GetElementsByTagName("p")

    // for loop (Recommended because fast)
    for i := 0; i < elements.Length(); i++ {
        outerHtml := elements.Get(i).OuterHTML()
        // ...
    }
    // or 
    for element := range elements.Enumerator() {
        outerHtml := element.OuterHTML()
        // ...
    }
    // or 
    elements.ForEach(func(element *Element, index int, collection Collection) {
        outerHtml := element.OuterHTML()
        // ...
    })


    // Set text content
    element.TextContent("hello")
    // Get text content
    textContent := element.TextContent()
    // Set HTML
    element.InnerHTML("<p>hello</p>")
    // Get
    innerHtml := element.InnerHTML()

    // Get id attribute
    id := element.HasAttribute("id")
    // Get class name attribute
    className := element.GetAttribute("class")
    // Set attribute
    element.SetAttribute("key", "value")
    // Remove attribute
    element.RemoveAttribute("key")
}

For more detailed documentation is here.


License

MIT License