linkwallet/content/content_test.go

92 lines
2.0 KiB
Go
Raw Normal View History

2022-06-01 15:42:23 +09:30
package content
import (
"net/http"
"net/http/httptest"
"testing"
"github.com/tardisx/linkwallet/entity"
)
func newTestServer() *httptest.Server {
mux := http.NewServeMux()
mux.HandleFunc("/", func(w http.ResponseWriter, r *http.Request) {
w.Header().Set("Content-Type", "text/html")
w.Write([]byte(`<!DOCTYPE html>
<html>
<head>
<title>Test Page</title>
</head>
<body>
<h1>Hello World</h1>
<p class="description">This is a test page</p>
<p class="description">This is a test paragraph</p>
</body>
</html>
`))
})
return httptest.NewServer(mux)
}
func TestSimpleScrape(t *testing.T) {
ts := newTestServer()
defer ts.Close()
bm := entity.Bookmark{URL: ts.URL}
info := FetchPageInfo(bm)
if info.Title != "Test Page" {
t.Errorf("'%s' is wrong title (expected Test Page)", info.Title)
}
if info.Size != 208 {
t.Errorf("expected 208 bytes, got %d", info.Size)
}
if info.StatusCode != 200 {
t.Errorf("got status code %d not 200", info.StatusCode)
}
}
2025-04-25 23:57:04 +09:30
// func TestWords(t *testing.T) {
2022-06-01 15:42:23 +09:30
2025-04-25 23:57:04 +09:30
// bm := entity.Bookmark{
// // ID: 0,
// // URL: "",
// Info: entity.PageInfo{RawText: "the quick brown fox jumped over the lazy dog"},
// // Tags: []string{},
// }
// words := Words(&bm)
// if len(words) != 7 {
// t.Errorf("got %d words not 7", len(words))
// } else {
// if words[0] != "quick" ||
// words[1] != "brown" ||
// words[2] != "fox" ||
// words[3] != "jump" ||
// words[4] != "over" ||
// words[5] != "lazi" ||
// words[6] != "dog" {
// t.Error("incorrect words returned")
// }
// }
// }
2022-06-01 15:42:23 +09:30
2025-04-25 23:57:04 +09:30
// func TestStemmer(t *testing.T) {
// s := `quick quick fox 😂 smile http://google.com`
// words1 := StringToStemmedSearchWords(s)
// t.Log(words1)
// if len(words1) != 7 {
// t.Error("wrong number of words")
// }
// if words1[0] != "quick" ||
// words1[1] != "quick" ||
// words1[2] != "fox" ||
// words1[3] != "smile" ||
// words1[4] != "http" ||
// words1[5] != "googl" ||
// words1[6] != "com" {
// t.Error("bad words")
// }
2022-06-01 15:42:23 +09:30
2025-04-25 23:57:04 +09:30
// }