Add link expander
This commit is contained in:
parent
e71e32228c
commit
043a7fd66f
35
scraper/link_expander.go
Normal file
35
scraper/link_expander.go
Normal file
@ -0,0 +1,35 @@
|
||||
package scraper
|
||||
|
||||
import (
|
||||
"fmt"
|
||||
"time"
|
||||
"net/http"
|
||||
)
|
||||
|
||||
|
||||
/**
|
||||
* Return the expanded version of a short URL. Input must be a real short URL.
|
||||
*/
|
||||
func ExpandShortUrl(short_url string) string {
|
||||
// Create a client that doesn't follow redirects
|
||||
client := &http.Client{
|
||||
Timeout: 5 * time.Second,
|
||||
CheckRedirect: func(req *http.Request, via []*http.Request) error {
|
||||
return http.ErrUseLastResponse
|
||||
},
|
||||
}
|
||||
|
||||
resp, err := client.Get(short_url)
|
||||
if err != nil {
|
||||
panic(err) // TODO: handle timeouts
|
||||
}
|
||||
if resp.StatusCode != 301 {
|
||||
panic(fmt.Sprintf("Unknown status code returned when expanding short url %q: %s", short_url, resp.Status))
|
||||
}
|
||||
|
||||
long_url := resp.Header.Get("Location")
|
||||
if long_url == "" {
|
||||
panic(fmt.Sprintf("Header didn't have a Location field for short url %q", short_url))
|
||||
}
|
||||
return long_url
|
||||
}
|
25
scraper/link_expander_test.go
Normal file
25
scraper/link_expander_test.go
Normal file
@ -0,0 +1,25 @@
|
||||
package scraper_test
|
||||
|
||||
import (
|
||||
"testing"
|
||||
|
||||
"net/http"
|
||||
"net/http/httptest"
|
||||
|
||||
"offline_twitter/scraper"
|
||||
)
|
||||
|
||||
|
||||
func TestExpandShortUrl(t *testing.T) {
|
||||
redirecting_to := "redirect target"
|
||||
srvr := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, req *http.Request) {
|
||||
w.Header().Set("Location", redirecting_to)
|
||||
w.WriteHeader(301)
|
||||
}))
|
||||
defer srvr.Close()
|
||||
|
||||
result := scraper.ExpandShortUrl(srvr.URL)
|
||||
if result != redirecting_to {
|
||||
t.Errorf("Expected %q, got %q", redirecting_to, result)
|
||||
}
|
||||
}
|
Loading…
x
Reference in New Issue
Block a user