On May 19, 5:42 pm, Archos <raul....@sent.com> wrote:
> Use the package [html][1].
>
> import (
> "bytes"
> "exp/html"
> )
>
> var (
> anchorTag = []byte{'a'}
> )
>
> tkzer := html.NewTokenizer(page)
>
> for {
> switch tkzer.Next() {
> case html.ErrorToken:
> // HANDLE ERROR
>
> case html.StartTagToken:
> tag, hasAttr := tkzer.TagName()
> if hasAttr && bytes.Equal(anchorTag, tag) { // a
> // HANDLE ANCHOR
> }
> }
> }
>
> [1]: http://weekly.golang.org/pkg/exp/html/
And to match only the anchors whose href attribute is an http(s) link:
var (
anchorTag = []byte{'a'}
hrefTag = []byte("href")
httpTag = []byte("http")
)
// * * *
// HANDLE ANCHOR
key, val, _ := tkzer.TagAttr()
if bytes.Equal(hrefTag, key) && bytes.HasPrefix(val, httpTag) { // href, http(s)
// HREF TAG
}