Revised fileserver Accept-Encoding and ETag (#1435)

* Revised fileserver Accept-Encoding and ETag

* calculateEtag improved following microbenchmarking
This commit is contained in:
Rick Beton 2017-02-18 22:52:50 +00:00 committed by Matt Holt
parent ce3580bf91
commit 6083871088
2 changed files with 144 additions and 33 deletions

View file

@ -1,7 +1,6 @@
package staticfiles package staticfiles
import ( import (
"fmt"
"math/rand" "math/rand"
"net/http" "net/http"
"os" "os"
@ -40,6 +39,14 @@ func (fs FileServer) ServeHTTP(w http.ResponseWriter, r *http.Request) (int, err
return fs.serveFile(w, r, r.URL.Path) return fs.serveFile(w, r, r.URL.Path)
} }
// calculateEtag produces a strong etag by default. Prefix the result with "W/" to convert this into a weak one.
// see https://tools.ietf.org/html/rfc7232#section-2.3
func calculateEtag(d os.FileInfo) string {
t := strconv.FormatInt(d.ModTime().Unix(), 36)
s := strconv.FormatInt(d.Size(), 36)
return `"` + t + s + `"`
}
// serveFile writes the specified file to the HTTP response. // serveFile writes the specified file to the HTTP response.
// name is '/'-separated, not filepath.Separator. // name is '/'-separated, not filepath.Separator.
func (fs FileServer) serveFile(w http.ResponseWriter, r *http.Request, name string) (int, error) { func (fs FileServer) serveFile(w http.ResponseWriter, r *http.Request, name string) (int, error) {
@ -138,9 +145,19 @@ func (fs FileServer) serveFile(w http.ResponseWriter, r *http.Request, name stri
} }
filename := d.Name() filename := d.Name()
etag := calculateEtag(d) // strong
for _, encoding := range staticEncodingPriority { for _, encoding := range staticEncodingPriority {
if !strings.Contains(r.Header.Get("Accept-Encoding"), encoding) { acceptEncoding := strings.Split(r.Header.Get("Accept-Encoding"), ",")
accepted := false
for _, acc := range acceptEncoding {
if accepted || strings.TrimSpace(acc) == encoding {
accepted = true
}
}
if !accepted {
continue continue
} }
@ -158,8 +175,7 @@ func (fs FileServer) serveFile(w http.ResponseWriter, r *http.Request, name stri
// Close previous file - release fd // Close previous file - release fd
f.Close() f.Close()
// Stat is needed for generating valid ETag etag = calculateEtag(encodedFileInfo)
d = encodedFileInfo
// Encoded file will be served // Encoded file will be served
f = encodedFile f = encodedFile
@ -169,12 +185,11 @@ func (fs FileServer) serveFile(w http.ResponseWriter, r *http.Request, name stri
defer f.Close() defer f.Close()
break break
} }
// Experimental ETag header // Set the ETag returned to the user-agent. Note that a conditional If-None-Match
e := fmt.Sprintf(`W/"%x-%x"`, d.ModTime().Unix(), d.Size()) // request is handled in http.ServeContent below, which checks against this ETag value.
w.Header().Set("ETag", e) w.Header().Set("ETag", etag)
// Note: Errors generated by ServeContent are written immediately // Note: Errors generated by ServeContent are written immediately
// to the response. This usually only happens if seeking fails (rare). // to the response. This usually only happens if seeking fails (rare).

View file

@ -19,6 +19,19 @@ var (
testWebRoot = filepath.Join(testDir, "webroot") testWebRoot = filepath.Join(testDir, "webroot")
) )
var (
webrootFile1Html = filepath.Join("webroot", "file1.html")
webrootDirFile2Html = filepath.Join("webroot", "dir", "file2.html")
webrootDirHiddenHtml = filepath.Join("webroot", "dir", "hidden.html")
webrootDirwithindexIndeHtml = filepath.Join("webroot", "dirwithindex", "index.html")
webrootSubGzippedHtml = filepath.Join("webroot", "sub", "gzipped.html")
webrootSubGzippedHtmlGz = filepath.Join("webroot", "sub", "gzipped.html.gz")
webrootSubGzippedHtmlBr = filepath.Join("webroot", "sub", "gzipped.html.br")
webrootSubBrotliHtml = filepath.Join("webroot", "sub", "brotli.html")
webrootSubBrotliHtmlGz = filepath.Join("webroot", "sub", "brotli.html.gz")
webrootSubBrotliHtmlBr = filepath.Join("webroot", "sub", "brotli.html.br")
)
// testFiles is a map with relative paths to test files as keys and file content as values. // testFiles is a map with relative paths to test files as keys and file content as values.
// The map represents the following structure: // The map represents the following structure:
// - $TEMP/caddy_testdir/ // - $TEMP/caddy_testdir/
@ -31,17 +44,17 @@ var (
// '------ file2.html // '------ file2.html
// '------ hidden.html // '------ hidden.html
var testFiles = map[string]string{ var testFiles = map[string]string{
"unreachable.html": "<h1>must not leak</h1>", "unreachable.html": "<h1>must not leak</h1>",
filepath.Join("webroot", "file1.html"): "<h1>file1.html</h1>", webrootFile1Html: "<h1>file1.html</h1>",
filepath.Join("webroot", "sub", "gzipped.html"): "<h1>gzipped.html</h1>", webrootDirFile2Html: "<h1>dir/file2.html</h1>",
filepath.Join("webroot", "sub", "gzipped.html.gz"): "gzipped.html.gz", webrootDirwithindexIndeHtml: "<h1>dirwithindex/index.html</h1>",
filepath.Join("webroot", "sub", "gzipped.html.gz"): "gzipped.html.gz", webrootDirHiddenHtml: "<h1>dir/hidden.html</h1>",
filepath.Join("webroot", "sub", "brotli.html"): "brotli.html", webrootSubGzippedHtml: "<h1>gzipped.html</h1>",
filepath.Join("webroot", "sub", "brotli.html.gz"): "brotli.html.gz", webrootSubGzippedHtmlGz: "1.gzipped.html.gz",
filepath.Join("webroot", "sub", "brotli.html.br"): "brotli.html.br", webrootSubGzippedHtmlBr: "2.gzipped.html.br",
filepath.Join("webroot", "dirwithindex", "index.html"): "<h1>dirwithindex/index.html</h1>", webrootSubBrotliHtml: "3.brotli.html",
filepath.Join("webroot", "dir", "file2.html"): "<h1>dir/file2.html</h1>", webrootSubBrotliHtmlGz: "4.brotli.html.gz",
filepath.Join("webroot", "dir", "hidden.html"): "<h1>dir/hidden.html</h1>", webrootSubBrotliHtmlBr: "5.brotli.html.br",
} }
// TestServeHTTP covers positive scenarios when serving files. // TestServeHTTP covers positive scenarios when serving files.
@ -58,11 +71,14 @@ func TestServeHTTP(t *testing.T) {
movedPermanently := "Moved Permanently" movedPermanently := "Moved Permanently"
tests := []struct { tests := []struct {
url string url string
acceptEncoding string
expectedStatus int expectedStatus int
expectedBodyContent string expectedBodyContent string
expectedEtag string expectedEtag string
expectedVary string
expectedEncoding string
}{ }{
// Test 0 - access without any path // Test 0 - access without any path
{ {
@ -78,15 +94,15 @@ func TestServeHTTP(t *testing.T) {
{ {
url: "https://foo/file1.html", url: "https://foo/file1.html",
expectedStatus: http.StatusOK, expectedStatus: http.StatusOK,
expectedBodyContent: testFiles[filepath.Join("webroot", "file1.html")], expectedBodyContent: testFiles[webrootFile1Html],
expectedEtag: `W/"1e240-13"`, expectedEtag: `"2n9cj"`,
}, },
// Test 3 - access folder with index file with trailing slash // Test 3 - access folder with index file with trailing slash
{ {
url: "https://foo/dirwithindex/", url: "https://foo/dirwithindex/",
expectedStatus: http.StatusOK, expectedStatus: http.StatusOK,
expectedBodyContent: testFiles[filepath.Join("webroot", "dirwithindex", "index.html")], expectedBodyContent: testFiles[webrootDirwithindexIndeHtml],
expectedEtag: `W/"1e240-20"`, expectedEtag: `"2n9cw"`,
}, },
// Test 4 - access folder with index file without trailing slash // Test 4 - access folder with index file without trailing slash
{ {
@ -125,8 +141,8 @@ func TestServeHTTP(t *testing.T) {
{ {
url: "https://foo/dirwithindex/index.html", url: "https://foo/dirwithindex/index.html",
expectedStatus: http.StatusOK, expectedStatus: http.StatusOK,
expectedBodyContent: testFiles[filepath.Join("webroot", "dirwithindex", "index.html")], expectedBodyContent: testFiles[webrootDirwithindexIndeHtml],
expectedEtag: `W/"1e240-20"`, expectedEtag: `"2n9cw"`,
}, },
// Test 11 - send a request with query params // Test 11 - send a request with query params
{ {
@ -152,6 +168,7 @@ func TestServeHTTP(t *testing.T) {
// Test 15 - attempt to bypass hidden file // Test 15 - attempt to bypass hidden file
{ {
url: "https://foo/dir/hidden.html%20.", url: "https://foo/dir/hidden.html%20.",
acceptEncoding: "br, gzip",
expectedStatus: http.StatusNotFound, expectedStatus: http.StatusNotFound,
}, },
// Test 16 - serve another file with same name as hidden file. // Test 16 - serve another file with same name as hidden file.
@ -167,16 +184,32 @@ func TestServeHTTP(t *testing.T) {
// Test 18 - try to get pre-gzipped file. // Test 18 - try to get pre-gzipped file.
{ {
url: "https://foo/sub/gzipped.html", url: "https://foo/sub/gzipped.html",
acceptEncoding: "gzip",
expectedStatus: http.StatusOK, expectedStatus: http.StatusOK,
expectedBodyContent: testFiles[filepath.Join("webroot", "sub", "gzipped.html.gz")], expectedBodyContent: testFiles[webrootSubGzippedHtmlGz],
expectedEtag: `W/"1e240-f"`, expectedEtag: `"2n9ch"`,
expectedVary: "Accept-Encoding",
expectedEncoding: "gzip",
}, },
// Test 19 - try to get pre-brotli encoded file. // Test 19 - try to get pre-brotli encoded file.
{ {
url: "https://foo/sub/brotli.html", url: "https://foo/sub/brotli.html",
acceptEncoding: "br,gzip",
expectedStatus: http.StatusOK, expectedStatus: http.StatusOK,
expectedBodyContent: testFiles[filepath.Join("webroot", "sub", "brotli.html.br")], expectedBodyContent: testFiles[webrootSubBrotliHtmlBr],
expectedEtag: `W/"1e240-e"`, expectedEtag: `"2n9cg"`,
expectedVary: "Accept-Encoding",
expectedEncoding: "br",
},
// Test 20 - not allowed to get pre-brotli encoded file.
{
url: "https://foo/sub/brotli.html",
acceptEncoding: "nicebrew", // contains "br" substring but not "br"
expectedStatus: http.StatusOK,
expectedBodyContent: testFiles[webrootSubBrotliHtml],
expectedEtag: `"2n9cd"`,
expectedVary: "",
expectedEncoding: "",
}, },
// Test 20 - treat existing file as a directory. // Test 20 - treat existing file as a directory.
{ {
@ -189,7 +222,7 @@ func TestServeHTTP(t *testing.T) {
responseRecorder := httptest.NewRecorder() responseRecorder := httptest.NewRecorder()
request, err := http.NewRequest("GET", test.url, nil) request, err := http.NewRequest("GET", test.url, nil)
request.Header.Add("Accept-Encoding", "br,gzip") request.Header.Add("Accept-Encoding", test.acceptEncoding)
if err != nil { if err != nil {
t.Errorf("Test %d: Error making request: %v", i, err) t.Errorf("Test %d: Error making request: %v", i, err)
@ -200,6 +233,9 @@ func TestServeHTTP(t *testing.T) {
} }
status, err := fileserver.ServeHTTP(responseRecorder, request) status, err := fileserver.ServeHTTP(responseRecorder, request)
etag := responseRecorder.Header().Get("Etag") etag := responseRecorder.Header().Get("Etag")
body := responseRecorder.Body.String()
vary := responseRecorder.Header().Get("Vary")
encoding := responseRecorder.Header().Get("Content-Encoding")
// check if error matches expectations // check if error matches expectations
if err != nil { if err != nil {
@ -216,9 +252,19 @@ func TestServeHTTP(t *testing.T) {
t.Errorf("Test %d: Expected Etag header %s, found %s", i, test.expectedEtag, etag) t.Errorf("Test %d: Expected Etag header %s, found %s", i, test.expectedEtag, etag)
} }
// check vary
if test.expectedVary != vary {
t.Errorf("Test %d: Expected Vary header %s, found %s", i, test.expectedVary, vary)
}
// check content-encoding
if test.expectedEncoding != encoding {
t.Errorf("Test %d: Expected Content-Encoding header %s, found %s", i, test.expectedEncoding, encoding)
}
// check body content // check body content
if !strings.Contains(responseRecorder.Body.String(), test.expectedBodyContent) { if !strings.Contains(body, test.expectedBodyContent) {
t.Errorf("Test %d: Expected body to contain %q, found %q", i, test.expectedBodyContent, responseRecorder.Body.String()) t.Errorf("Test %d: Expected body to contain %q, found %q", i, test.expectedBodyContent, body)
} }
} }
@ -418,3 +464,53 @@ func TestServeHTTPFailingStat(t *testing.T) {
} }
} }
} }
//-------------------------------------------------------------------------------------------------
type fileInfo struct {
name string
size int64
mode os.FileMode
modTime time.Time
isDir bool
}
func (fi fileInfo) Name() string {
return fi.name
}
func (fi fileInfo) Size() int64 {
return fi.size
}
func (fi fileInfo) Mode() os.FileMode {
return fi.mode
}
func (fi fileInfo) ModTime() time.Time {
return fi.modTime
}
func (fi fileInfo) IsDir() bool {
return fi.isDir
}
func (fi fileInfo) Sys() interface{} {
return nil
}
var _ os.FileInfo = fileInfo{}
//-------------------------------------------------------------------------------------------------
func BenchmarkEtag(b *testing.B) {
d := fileInfo{
size: 1234567890,
modTime: time.Now(),
}
b.ResetTimer()
for i := 0; i < b.N; i++ {
calculateEtag(d)
}
}