Files
EdgeNode/internal/nodes/http_request_cache.go

547 lines
15 KiB
Go
Raw Normal View History

2020-10-05 16:55:14 +08:00
package nodes
import (
"bytes"
2021-01-13 12:02:50 +08:00
"errors"
2021-10-17 20:23:10 +08:00
"github.com/TeaOSLab/EdgeCommon/pkg/rpc/pb"
2020-10-05 16:55:14 +08:00
"github.com/TeaOSLab/EdgeNode/internal/caches"
2022-02-22 19:29:27 +08:00
"github.com/TeaOSLab/EdgeNode/internal/compressions"
"github.com/TeaOSLab/EdgeNode/internal/goman"
"github.com/TeaOSLab/EdgeNode/internal/remotelogs"
2021-10-17 20:23:10 +08:00
"github.com/TeaOSLab/EdgeNode/internal/rpc"
2021-12-02 09:34:38 +08:00
"github.com/TeaOSLab/EdgeNode/internal/utils"
"io"
2020-10-05 16:55:14 +08:00
"net/http"
2021-10-03 18:00:57 +08:00
"path/filepath"
2020-10-05 16:55:14 +08:00
"strconv"
2021-08-26 15:48:09 +08:00
"strings"
2021-06-14 11:46:39 +08:00
"time"
2020-10-05 16:55:14 +08:00
)
// 读取缓存
2021-12-16 17:27:21 +08:00
func (this *HTTPRequest) doCacheRead(useStale bool) (shouldStop bool) {
this.cacheCanTryStale = false
2021-12-17 11:53:59 +08:00
2022-02-15 16:44:39 +08:00
var cachePolicy = this.ReqServer.HTTPCachePolicy
if cachePolicy == nil || !cachePolicy.IsOn {
return
}
if this.web.Cache == nil || !this.web.Cache.IsOn || (len(cachePolicy.CacheRefs) == 0 && len(this.web.Cache.CacheRefs) == 0) {
2020-10-05 16:55:14 +08:00
return
}
2021-08-26 15:48:09 +08:00
// 判断是否在预热
if (strings.HasPrefix(this.RawReq.RemoteAddr, "127.") || strings.HasPrefix(this.RawReq.RemoteAddr, "[::1]")) && this.RawReq.Header.Get("X-Cache-Action") == "preheat" {
2021-08-26 15:48:09 +08:00
return
}
2021-05-12 16:10:03 +08:00
var addStatusHeader = this.web.Cache.AddStatusHeader
if addStatusHeader {
defer func() {
cacheStatus := this.varMapping["cache.status"]
if cacheStatus != "HIT" {
this.writer.Header().Set("X-Cache", cacheStatus)
}
}()
}
2020-10-05 16:55:14 +08:00
// 检查服务独立的缓存条件
refType := ""
2020-10-05 16:55:14 +08:00
for _, cacheRef := range this.web.Cache.CacheRefs {
if !cacheRef.IsOn ||
cacheRef.Conds == nil ||
!cacheRef.Conds.HasRequestConds() {
continue
}
if cacheRef.Conds.MatchRequest(this.Format) {
2021-06-08 22:45:11 +08:00
if cacheRef.IsReverse {
return
}
2020-10-05 16:55:14 +08:00
this.cacheRef = cacheRef
refType = "server"
2020-10-05 16:55:14 +08:00
break
}
}
2022-02-24 20:39:43 +08:00
if this.cacheRef == nil && !this.web.Cache.DisablePolicyRefs {
// 检查策略默认的缓存条件
for _, cacheRef := range cachePolicy.CacheRefs {
if !cacheRef.IsOn ||
cacheRef.Conds == nil ||
!cacheRef.Conds.HasRequestConds() {
continue
}
if cacheRef.Conds.MatchRequest(this.Format) {
2021-06-08 22:45:11 +08:00
if cacheRef.IsReverse {
return
}
this.cacheRef = cacheRef
refType = "policy"
break
}
}
2022-02-24 20:39:43 +08:00
}
2022-02-24 20:39:43 +08:00
if this.cacheRef == nil {
return
2020-10-05 16:55:14 +08:00
}
2021-12-07 10:43:42 +08:00
// 校验请求
if !this.cacheRef.MatchRequest(this.RawReq) {
this.cacheRef = nil
return
}
2020-10-05 16:55:14 +08:00
// 相关变量
this.varMapping["cache.policy.name"] = cachePolicy.Name
this.varMapping["cache.policy.id"] = strconv.FormatInt(cachePolicy.Id, 10)
this.varMapping["cache.policy.type"] = cachePolicy.Type
2020-10-05 16:55:14 +08:00
// Cache-Pragma
if this.cacheRef.EnableRequestCachePragma {
if this.RawReq.Header.Get("Cache-Control") == "no-cache" || this.RawReq.Header.Get("Pragma") == "no-cache" {
this.cacheRef = nil
return
}
}
// TODO 支持Vary Header
// 缓存标签
var tags = []string{}
2020-10-05 16:55:14 +08:00
// 检查是否有缓存
var key = this.Format(this.cacheRef.Key)
2020-10-05 16:55:14 +08:00
if len(key) == 0 {
this.cacheRef = nil
return
}
var method = this.Method()
if method != http.MethodGet && method != http.MethodPost {
key += cacheMethodSuffix + method
tags = append(tags, strings.ToLower(method))
}
2021-10-03 18:00:57 +08:00
2020-10-05 16:55:14 +08:00
this.cacheKey = key
2021-12-07 09:28:15 +08:00
this.varMapping["cache.key"] = key
2020-10-05 16:55:14 +08:00
// 读取缓存
storage := caches.SharedManager.FindStorageWithPolicy(cachePolicy.Id)
2020-10-05 16:55:14 +08:00
if storage == nil {
this.cacheRef = nil
return
}
2022-02-22 19:29:27 +08:00
this.writer.cacheStorage = storage
2020-10-05 16:55:14 +08:00
2021-10-17 20:23:10 +08:00
// 判断是否在Purge
if this.web.Cache.PurgeIsOn && strings.ToUpper(this.RawReq.Method) == "PURGE" && this.RawReq.Header.Get("X-Edge-Purge-Key") == this.web.Cache.PurgeKey {
2021-12-02 09:34:38 +08:00
this.varMapping["cache.status"] = "PURGE"
2022-02-22 21:52:28 +08:00
var subKeys = []string{key, key + cacheMethodSuffix + "HEAD"}
2022-02-22 19:29:27 +08:00
// TODO 根据实际缓存的内容进行组合
for _, encoding := range compressions.AllEncodings() {
subKeys = append(subKeys, key+compressionCacheSuffix+encoding)
subKeys = append(subKeys, key+webpCacheSuffix+compressionCacheSuffix+encoding)
}
for _, subKey := range subKeys {
err := storage.Delete(subKey)
if err != nil {
remotelogs.Error("HTTP_REQUEST_CACHE", "purge failed: "+err.Error())
}
2021-10-17 20:23:10 +08:00
}
2022-02-22 19:29:27 +08:00
// 通过API节点清除别节点上的的Key
// TODO 改为队列不需要每个请求都使用goroutine
goman.New(func() {
2021-10-17 20:23:10 +08:00
rpcClient, err := rpc.SharedRPC()
if err == nil {
for _, rpcServerService := range rpcClient.ServerRPCList() {
_, err = rpcServerService.PurgeServerCache(rpcClient.Context(), &pb.PurgeServerCacheRequest{
2022-01-01 20:15:39 +08:00
Domains: []string{this.ReqHost},
2021-10-17 20:23:10 +08:00
Keys: []string{key},
Prefixes: nil,
})
if err != nil {
remotelogs.Error("HTTP_REQUEST_CACHE", "purge failed: "+err.Error())
}
}
}
})
2021-10-17 20:23:10 +08:00
return true
}
// 调用回调
this.onRequest()
if this.writer.isFinished {
return
}
2021-10-03 18:00:57 +08:00
var reader caches.Reader
var err error
2020-10-05 16:55:14 +08:00
2022-02-22 19:29:27 +08:00
// 检查是否支持WebP
var webPIsEnabled = false
var isHeadMethod = method == http.MethodHead
if !isHeadMethod &&
this.web.WebP != nil &&
2021-10-03 18:00:57 +08:00
this.web.WebP.IsOn &&
this.web.WebP.MatchRequest(filepath.Ext(this.Path()), this.Format) &&
2022-02-22 19:29:27 +08:00
this.web.WebP.MatchAccept(this.RawReq.Header.Get("Accept")) {
webPIsEnabled = true
}
// 检查压缩缓存
if !isHeadMethod && reader == nil {
2022-02-22 19:29:27 +08:00
if this.web.Compression != nil && this.web.Compression.IsOn {
_, encoding, ok := this.web.Compression.MatchAcceptEncoding(this.RawReq.Header.Get("Accept-Encoding"))
if ok {
// 检查支持WebP的压缩缓存
if webPIsEnabled {
reader, _ = storage.OpenReader(key+webpCacheSuffix+compressionCacheSuffix+encoding, useStale)
if reader != nil {
tags = append(tags, "webp", encoding)
}
}
// 检查普通缓存
if reader == nil {
reader, _ = storage.OpenReader(key+compressionCacheSuffix+encoding, useStale)
if reader != nil {
tags = append(tags, encoding)
}
}
}
}
}
// 检查WebP
if !isHeadMethod && reader == nil && webPIsEnabled {
2022-02-22 19:29:27 +08:00
reader, _ = storage.OpenReader(key+webpCacheSuffix, useStale)
if reader != nil {
2022-02-22 19:29:27 +08:00
this.writer.cacheReaderSuffix = webpCacheSuffix
tags = append(tags, "webp")
}
2021-10-03 18:00:57 +08:00
}
// 检查正常的文件
if reader == nil {
2021-12-16 17:27:21 +08:00
reader, err = storage.OpenReader(key, useStale)
2021-10-03 18:00:57 +08:00
if err != nil {
if err == caches.ErrNotFound {
// cache相关变量
this.varMapping["cache.status"] = "MISS"
2021-12-16 17:27:21 +08:00
if !useStale && this.web.Cache.Stale != nil && this.web.Cache.Stale.IsOn {
2021-12-16 17:27:21 +08:00
this.cacheCanTryStale = true
}
2021-10-03 18:00:57 +08:00
return
}
if !this.canIgnore(err) {
2022-02-17 17:24:35 +08:00
remotelogs.Warn("HTTP_REQUEST_CACHE", this.URL()+": read from cache failed: open cache failed: "+err.Error())
2021-10-03 18:00:57 +08:00
}
return
2021-05-23 15:50:21 +08:00
}
2021-01-13 12:02:50 +08:00
}
2021-01-13 12:02:50 +08:00
defer func() {
if !this.writer.DelayRead() {
_ = reader.Close()
}
2021-01-13 12:02:50 +08:00
}()
2020-10-05 16:55:14 +08:00
2021-12-17 11:53:59 +08:00
if useStale {
this.varMapping["cache.status"] = "STALE"
this.logAttrs["cache.status"] = "STALE"
} else {
this.varMapping["cache.status"] = "HIT"
this.logAttrs["cache.status"] = "HIT"
}
2020-10-05 16:55:14 +08:00
2021-12-16 17:27:21 +08:00
// 准备Buffer
2021-12-19 11:32:26 +08:00
var pool = this.bytePool(reader.BodySize())
var buf = pool.Get()
2021-12-16 17:27:21 +08:00
defer func() {
2021-12-19 11:32:26 +08:00
pool.Put(buf)
2021-12-16 17:27:21 +08:00
}()
2021-01-13 12:02:50 +08:00
// 读取Header
2021-12-19 11:32:26 +08:00
var headerBuf = []byte{}
2021-01-13 12:02:50 +08:00
err = reader.ReadHeader(buf, func(n int) (goNext bool, err error) {
headerBuf = append(headerBuf, buf[:n]...)
2020-10-05 16:55:14 +08:00
for {
2021-01-13 12:02:50 +08:00
nIndex := bytes.Index(headerBuf, []byte{'\n'})
if nIndex >= 0 {
row := headerBuf[:nIndex]
spaceIndex := bytes.Index(row, []byte{':'})
if spaceIndex <= 0 {
return false, errors.New("invalid header '" + string(row) + "'")
}
this.writer.Header().Set(string(row[:spaceIndex]), string(row[spaceIndex+1:]))
headerBuf = headerBuf[nIndex+1:]
} else {
2020-10-05 16:55:14 +08:00
break
}
}
2021-01-13 12:02:50 +08:00
return true, nil
2020-10-05 16:55:14 +08:00
})
if err != nil {
2021-05-23 16:16:56 +08:00
if !this.canIgnore(err) {
2022-02-17 17:24:35 +08:00
remotelogs.Warn("HTTP_REQUEST_CACHE", this.URL()+": read from cache failed: read header failed: "+err.Error())
2021-05-23 15:50:21 +08:00
}
2020-10-05 16:55:14 +08:00
return
}
2021-12-02 09:34:38 +08:00
// 设置cache.age变量
var age = strconv.FormatInt(reader.ExpiresAt()-utils.UnixTime(), 10)
this.varMapping["cache.age"] = age
2021-12-02 09:34:38 +08:00
2021-05-12 16:10:03 +08:00
if addStatusHeader {
2021-12-17 11:53:59 +08:00
if useStale {
this.writer.Header().Set("X-Cache", "STALE, "+refType+", "+reader.TypeName())
} else {
this.writer.Header().Set("X-Cache", "HIT, "+refType+", "+reader.TypeName())
}
} else {
this.writer.Header().Del("X-Cache")
2021-05-12 16:10:03 +08:00
}
if this.web.Cache.AddAgeHeader {
this.writer.Header().Set("Age", age)
}
2021-06-14 11:46:39 +08:00
// ETag
// 这里强制设置ETag如果先前源站设置了ETag将会被覆盖避免因为源站的ETag导致源站返回304 Not Modified
2021-06-14 11:46:39 +08:00
var respHeader = this.writer.Header()
var eTag = ""
2021-06-14 11:46:39 +08:00
var lastModifiedAt = reader.LastModified()
if lastModifiedAt > 0 {
2022-02-22 19:29:27 +08:00
if len(tags) > 0 {
eTag = "\"" + strconv.FormatInt(lastModifiedAt, 10) + "_" + strings.Join(tags, "_") + "\""
} else {
eTag = "\"" + strconv.FormatInt(lastModifiedAt, 10) + "\""
}
respHeader.Del("Etag")
respHeader["ETag"] = []string{eTag}
2021-06-14 11:46:39 +08:00
}
// 支持 Last-Modified
// 这里强制设置Last-Modified如果先前源站设置了Last-Modified将会被覆盖避免因为源站的Last-Modified导致源站返回304 Not Modified
var modifiedTime = ""
if lastModifiedAt > 0 {
modifiedTime = time.Unix(utils.GMTUnixTime(lastModifiedAt), 0).Format("Mon, 02 Jan 2006 15:04:05") + " GMT"
respHeader.Set("Last-Modified", modifiedTime)
2021-06-14 11:46:39 +08:00
}
// 支持 If-None-Match
if len(eTag) > 0 && this.requestHeader("If-None-Match") == eTag {
// 自定义Header
this.processResponseHeaders(http.StatusNotModified)
this.writer.WriteHeader(http.StatusNotModified)
this.isCached = true
2021-06-14 19:55:06 +08:00
this.cacheRef = nil
this.writer.SetOk()
2021-06-14 11:46:39 +08:00
return true
}
// 支持 If-Modified-Since
if len(modifiedTime) > 0 && this.requestHeader("If-Modified-Since") == modifiedTime {
// 自定义Header
this.processResponseHeaders(http.StatusNotModified)
this.writer.WriteHeader(http.StatusNotModified)
this.isCached = true
2021-06-14 19:55:06 +08:00
this.cacheRef = nil
this.writer.SetOk()
2021-06-14 11:46:39 +08:00
return true
}
2021-01-13 12:02:50 +08:00
this.processResponseHeaders(reader.Status())
this.addExpiresHeader(reader.ExpiresAt())
2021-01-13 12:02:50 +08:00
// 输出Body
2021-01-13 12:52:38 +08:00
if this.RawReq.Method == http.MethodHead {
this.writer.WriteHeader(reader.Status())
} else {
ifRangeHeaders, ok := this.RawReq.Header["If-Range"]
supportRange := true
if ok {
supportRange = false
for _, v := range ifRangeHeaders {
if v == this.writer.Header().Get("ETag") || v == this.writer.Header().Get("Last-Modified") {
supportRange = true
}
}
}
// 支持Range
rangeSet := [][]int64{}
if supportRange {
fileSize := reader.BodySize()
contentRange := this.RawReq.Header.Get("Range")
if len(contentRange) > 0 {
if fileSize == 0 {
this.processResponseHeaders(http.StatusRequestedRangeNotSatisfiable)
this.writer.WriteHeader(http.StatusRequestedRangeNotSatisfiable)
return true
}
set, ok := httpRequestParseContentRange(contentRange)
if !ok {
this.processResponseHeaders(http.StatusRequestedRangeNotSatisfiable)
this.writer.WriteHeader(http.StatusRequestedRangeNotSatisfiable)
return true
}
if len(set) > 0 {
rangeSet = set
for _, arr := range rangeSet {
if arr[0] == -1 {
arr[0] = fileSize + arr[1]
arr[1] = fileSize - 1
if arr[0] < 0 {
this.processResponseHeaders(http.StatusRequestedRangeNotSatisfiable)
this.writer.WriteHeader(http.StatusRequestedRangeNotSatisfiable)
return true
}
}
if arr[1] < 0 {
arr[1] = fileSize - 1
}
if arr[1] >= fileSize {
arr[1] = fileSize - 1
}
if arr[0] > arr[1] {
this.processResponseHeaders(http.StatusRequestedRangeNotSatisfiable)
this.writer.WriteHeader(http.StatusRequestedRangeNotSatisfiable)
return true
}
}
}
}
}
if len(rangeSet) == 1 {
respHeader.Set("Content-Range", "bytes "+strconv.FormatInt(rangeSet[0][0], 10)+"-"+strconv.FormatInt(rangeSet[0][1], 10)+"/"+strconv.FormatInt(reader.BodySize(), 10))
respHeader.Set("Content-Length", strconv.FormatInt(rangeSet[0][1]-rangeSet[0][0]+1, 10))
this.writer.WriteHeader(http.StatusPartialContent)
err = reader.ReadBodyRange(buf, rangeSet[0][0], rangeSet[0][1], func(n int) (goNext bool, err error) {
_, err = this.writer.Write(buf[:n])
if err != nil {
2021-06-16 08:29:38 +08:00
return false, errWritingToClient
2021-01-13 12:52:38 +08:00
}
return true, nil
})
2021-01-13 12:02:50 +08:00
if err != nil {
this.varMapping["cache.status"] = "MISS"
2021-01-13 12:52:38 +08:00
if err == caches.ErrInvalidRange {
this.processResponseHeaders(http.StatusRequestedRangeNotSatisfiable)
this.writer.WriteHeader(http.StatusRequestedRangeNotSatisfiable)
return true
}
2021-05-23 16:16:56 +08:00
if !this.canIgnore(err) {
remotelogs.Warn("HTTP_REQUEST_CACHE", this.URL()+": read from cache failed: "+err.Error())
2021-05-23 15:50:21 +08:00
}
2021-01-13 12:52:38 +08:00
return
}
} else if len(rangeSet) > 1 {
boundary := httpRequestGenBoundary()
respHeader.Set("Content-Type", "multipart/byteranges; boundary="+boundary)
respHeader.Del("Content-Length")
contentType := respHeader.Get("Content-Type")
this.writer.WriteHeader(http.StatusPartialContent)
for index, set := range rangeSet {
if index == 0 {
_, err = this.writer.WriteString("--" + boundary + "\r\n")
} else {
_, err = this.writer.WriteString("\r\n--" + boundary + "\r\n")
}
if err != nil {
2021-06-16 08:29:38 +08:00
// 不提示写入客户端错误
2021-01-13 12:52:38 +08:00
return true
}
_, err = this.writer.WriteString("Content-Range: " + "bytes " + strconv.FormatInt(set[0], 10) + "-" + strconv.FormatInt(set[1], 10) + "/" + strconv.FormatInt(reader.BodySize(), 10) + "\r\n")
if err != nil {
2021-06-16 08:29:38 +08:00
// 不提示写入客户端错误
2021-01-13 12:52:38 +08:00
return true
}
if len(contentType) > 0 {
_, err = this.writer.WriteString("Content-Type: " + contentType + "\r\n\r\n")
if err != nil {
2021-06-16 08:29:38 +08:00
// 不提示写入客户端错误
2021-01-13 12:52:38 +08:00
return true
}
}
err := reader.ReadBodyRange(buf, set[0], set[1], func(n int) (goNext bool, err error) {
_, err = this.writer.Write(buf[:n])
2021-06-16 08:29:38 +08:00
if err != nil {
return false, errWritingToClient
}
return true, nil
2021-01-13 12:52:38 +08:00
})
if err != nil {
2021-05-23 16:16:56 +08:00
if !this.canIgnore(err) {
remotelogs.Warn("HTTP_REQUEST_CACHE", this.URL()+": read from cache failed: "+err.Error())
2021-05-23 15:50:21 +08:00
}
2021-01-13 12:52:38 +08:00
return true
}
}
_, err = this.writer.WriteString("\r\n--" + boundary + "--\r\n")
if err != nil {
this.varMapping["cache.status"] = "MISS"
2021-06-16 08:29:38 +08:00
// 不提示写入客户端错误
2021-01-13 12:52:38 +08:00
return true
}
2021-01-13 16:11:28 +08:00
} else { // 没有Range
var resp = &http.Response{Body: reader}
this.writer.Prepare(resp, reader.BodySize(), reader.Status(), false)
2021-01-13 12:52:38 +08:00
this.writer.WriteHeader(reader.Status())
_, err = io.CopyBuffer(this.writer, resp.Body, buf)
if err == io.EOF {
err = nil
}
2021-01-13 12:52:38 +08:00
if err != nil {
this.varMapping["cache.status"] = "MISS"
2021-05-23 16:16:56 +08:00
if !this.canIgnore(err) {
2022-02-17 17:24:35 +08:00
remotelogs.Warn("HTTP_REQUEST_CACHE", this.URL()+": read from cache failed: read body failed: "+err.Error())
2021-05-23 15:50:21 +08:00
}
2021-01-13 12:52:38 +08:00
return
2021-01-13 12:02:50 +08:00
}
}
2020-10-05 16:55:14 +08:00
}
2021-06-08 11:24:41 +08:00
this.isCached = true
2021-06-14 19:55:06 +08:00
this.cacheRef = nil
this.writer.SetOk()
2020-10-05 16:55:14 +08:00
return true
}
// 设置Expires Header
func (this *HTTPRequest) addExpiresHeader(expiresAt int64) {
if this.cacheRef.ExpiresTime != nil && this.cacheRef.ExpiresTime.IsPrior && this.cacheRef.ExpiresTime.IsOn {
if this.cacheRef.ExpiresTime.Overwrite || len(this.writer.Header().Get("Expires")) == 0 {
if this.cacheRef.ExpiresTime.AutoCalculate {
this.writer.Header().Set("Expires", time.Unix(utils.GMTUnixTime(expiresAt), 0).Format("Mon, 2 Jan 2006 15:04:05")+" GMT")
} else if this.cacheRef.ExpiresTime.Duration != nil {
var duration = this.cacheRef.ExpiresTime.Duration.Duration()
if duration > 0 {
this.writer.Header().Set("Expires", utils.GMTTime(time.Now().Add(duration)).Format("Mon, 2 Jan 2006 15:04:05")+" GMT")
}
}
}
}
}