mirror of
https://github.com/gocsaf/csaf.git
synced 2025-12-22 05:40:11 +01:00
Harvest only JSON files.
This commit is contained in:
parent
4428679822
commit
eaa2620eba
2 changed files with 11 additions and 5 deletions
|
|
@ -12,6 +12,7 @@ import (
|
|||
"io"
|
||||
"net/http"
|
||||
"net/url"
|
||||
"strings"
|
||||
|
||||
"github.com/PuerkitoBio/goquery"
|
||||
)
|
||||
|
|
@ -66,6 +67,10 @@ func linksOnPage(r io.Reader, resolve func(string) (string, error)) ([]string, e
|
|||
return
|
||||
}
|
||||
if link, ok := s.Attr("href"); ok {
|
||||
// Skip links that do not end in ".json"; only JSON files are harvested.
|
||||
if !strings.HasSuffix(link, ".json") {
|
||||
return
|
||||
}
|
||||
if link, err = resolve(link); err == nil {
|
||||
links = append(links, link)
|
||||
}
|
||||
|
|
|
|||
|
|
@ -8,14 +8,15 @@ import (
|
|||
|
||||
const page0 = `<html>
|
||||
<body>
|
||||
<a href="link0">link0</a>
|
||||
<a href="no-a-json">Not a JSON</a>
|
||||
<a href="link0.json">link0</a>
|
||||
<ol>
|
||||
<li><a href="link1">link1</a></li>
|
||||
<li><a href="link2">link2</a></li>
|
||||
<li><a href="link1.json">link1</a></li>
|
||||
<li><a href="link2.json">link1</a></li>
|
||||
</ol>
|
||||
<p>
|
||||
<div>
|
||||
<li><a href="link3">link3</a></li>
|
||||
<li><a href="link3.json">link1</a></li>
|
||||
</div>
|
||||
<p>
|
||||
</body>
|
||||
|
|
@ -36,7 +37,7 @@ func TestLinksOnPage(t *testing.T) {
|
|||
}
|
||||
|
||||
for i, link := range links {
|
||||
href := fmt.Sprintf("link%d", i)
|
||||
href := fmt.Sprintf("link%d.json", i)
|
||||
if href != link {
|
||||
t.Fatalf("Expected link '%s', got '%s'\n", href, link)
|
||||
}
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue