2019-06-30 16:07:58 -06:00
|
|
|
// Copyright 2015 Matthew Holt and The Caddy Authors
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
2019-05-23 13:16:34 -06:00
|
|
|
package rewrite
|
2019-05-20 23:48:43 -06:00
|
|
|
|
|
|
|
import (
|
2020-03-30 11:49:53 -06:00
|
|
|
"fmt"
|
2019-05-20 23:48:43 -06:00
|
|
|
"net/http"
|
|
|
|
"net/url"
|
2021-03-01 18:27:59 -07:00
|
|
|
"regexp"
|
2020-03-30 11:49:53 -06:00
|
|
|
"strconv"
|
2019-05-20 23:48:43 -06:00
|
|
|
"strings"
|
|
|
|
|
2019-07-02 12:37:06 -06:00
|
|
|
"github.com/caddyserver/caddy/v2"
|
|
|
|
"github.com/caddyserver/caddy/v2/modules/caddyhttp"
|
2019-10-28 14:39:37 -06:00
|
|
|
"go.uber.org/zap"
|
2019-05-20 23:48:43 -06:00
|
|
|
)
|
|
|
|
|
|
|
|
// init registers the Rewrite handler with Caddy's module system.
func init() {
	caddy.RegisterModule(Rewrite{})
}
|
|
|
|
|
|
|
|
// Rewrite is a middleware which can rewrite HTTP requests.
//
// The Method and URI properties are "setters": the request's method
// and URI will be set to the given values. Other properties are
// "modifiers": they modify existing values but do not explicitly
// specify what the result will be. It is atypical to combine the use
// of setters and modifiers in a single rewrite.
type Rewrite struct {
	// Changes the request's HTTP verb.
	Method string `json:"method,omitempty"`

	// Changes the request's URI, which consists of path and query string.
	// Only components of the URI that are specified will be changed.
	// For example, a value of "/foo.html" or "foo.html" will only change
	// the path and will preserve any existing query string. Similarly, a
	// value of "?a=b" will only change the query string and will not affect
	// the path. Both can also be changed: "/foo?a=b" - this sets both the
	// path and query string at the same time.
	//
	// You can also use placeholders. For example, to preserve the existing
	// query string, you might use: "?{http.request.uri.query}&a=b". Any
	// key-value pairs you add to the query string will not overwrite
	// existing values (individual pairs are append-only).
	//
	// To clear the query string, explicitly set an empty one: "?"
	URI string `json:"uri,omitempty"`

	// Strips the given prefix from the beginning of the URI path.
	StripPathPrefix string `json:"strip_path_prefix,omitempty"`

	// Strips the given suffix from the end of the URI path.
	StripPathSuffix string `json:"strip_path_suffix,omitempty"`

	// Performs substring replacements on the URI.
	URISubstring []substrReplacer `json:"uri_substring,omitempty"`

	// Performs regular expression replacements on the URI path.
	PathRegexp []*regexReplacer `json:"path_regexp,omitempty"`

	// logger is assigned in Provision and used by ServeHTTP to
	// report rewritten requests.
	logger *zap.Logger
}
|
|
|
|
|
2019-08-21 10:46:35 -06:00
|
|
|
// CaddyModule returns the Caddy module information.
|
|
|
|
func (Rewrite) CaddyModule() caddy.ModuleInfo {
|
|
|
|
return caddy.ModuleInfo{
|
2019-12-10 13:36:46 -07:00
|
|
|
ID: "http.handlers.rewrite",
|
|
|
|
New: func() caddy.Module { return new(Rewrite) },
|
2019-08-21 10:46:35 -06:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-10-28 14:39:37 -06:00
|
|
|
// Provision sets up rewr.
|
|
|
|
func (rewr *Rewrite) Provision(ctx caddy.Context) error {
|
|
|
|
rewr.logger = ctx.Logger(rewr)
|
2021-03-01 18:27:59 -07:00
|
|
|
|
|
|
|
for i, rep := range rewr.PathRegexp {
|
|
|
|
if rep.Find == "" {
|
|
|
|
return fmt.Errorf("path_regexp find cannot be empty")
|
|
|
|
}
|
|
|
|
re, err := regexp.Compile(rep.Find)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("compiling regular expression %d: %v", i, err)
|
|
|
|
}
|
|
|
|
rep.re = re
|
|
|
|
}
|
|
|
|
|
2019-10-28 14:39:37 -06:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2019-05-20 23:48:43 -06:00
|
|
|
func (rewr Rewrite) ServeHTTP(w http.ResponseWriter, r *http.Request, next caddyhttp.Handler) error {
|
2019-12-29 13:12:52 -07:00
|
|
|
repl := r.Context().Value(caddy.ReplacerCtxKey).(*caddy.Replacer)
|
2019-05-20 23:48:43 -06:00
|
|
|
|
2019-10-28 14:39:37 -06:00
|
|
|
logger := rewr.logger.With(
|
|
|
|
zap.Object("request", caddyhttp.LoggableHTTPRequest{Request: r}),
|
|
|
|
)
|
|
|
|
|
2019-12-12 14:32:35 -07:00
|
|
|
changed := rewr.rewrite(r, repl, logger)
|
|
|
|
|
|
|
|
if changed {
|
|
|
|
logger.Debug("rewrote request",
|
|
|
|
zap.String("method", r.Method),
|
|
|
|
zap.String("uri", r.RequestURI),
|
|
|
|
)
|
|
|
|
}
|
|
|
|
|
|
|
|
return next.ServeHTTP(w, r)
|
|
|
|
}
|
|
|
|
|
2020-01-10 16:59:57 -07:00
|
|
|
// rewrite performs the rewrites on r using repl, which should
|
|
|
|
// have been obtained from r, but is passed in for efficiency.
|
|
|
|
// It returns true if any changes were made to r.
|
2019-12-29 13:12:52 -07:00
|
|
|
func (rewr Rewrite) rewrite(r *http.Request, repl *caddy.Replacer, logger *zap.Logger) bool {
|
2019-12-12 14:32:35 -07:00
|
|
|
oldMethod := r.Method
|
|
|
|
oldURI := r.RequestURI
|
|
|
|
|
|
|
|
// method
|
2019-05-20 23:48:43 -06:00
|
|
|
if rewr.Method != "" {
|
|
|
|
r.Method = strings.ToUpper(repl.ReplaceAll(rewr.Method, ""))
|
|
|
|
}
|
|
|
|
|
2020-04-01 00:43:40 -06:00
|
|
|
// uri (path, query string and... fragment, because why not)
|
2020-01-10 16:59:57 -07:00
|
|
|
if uri := rewr.URI; uri != "" {
|
|
|
|
// find the bounds of each part of the URI that exist
|
|
|
|
pathStart, qsStart, fragStart := -1, -1, -1
|
|
|
|
pathEnd, qsEnd := -1, -1
|
|
|
|
for i, ch := range uri {
|
|
|
|
switch {
|
|
|
|
case ch == '?' && qsStart < 0:
|
|
|
|
pathEnd, qsStart = i, i+1
|
|
|
|
case ch == '#' && fragStart < 0:
|
|
|
|
qsEnd, fragStart = i, i+1
|
|
|
|
case pathStart < 0 && qsStart < 0 && fragStart < 0:
|
|
|
|
pathStart = i
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if pathStart >= 0 && pathEnd < 0 {
|
|
|
|
pathEnd = len(uri)
|
|
|
|
}
|
|
|
|
if qsStart >= 0 && qsEnd < 0 {
|
|
|
|
qsEnd = len(uri)
|
2019-05-20 23:48:43 -06:00
|
|
|
}
|
|
|
|
|
2020-04-01 00:43:40 -06:00
|
|
|
// isolate the three main components of the URI
|
|
|
|
var path, query, frag string
|
|
|
|
if pathStart > -1 {
|
|
|
|
path = uri[pathStart:pathEnd]
|
|
|
|
}
|
|
|
|
if qsStart > -1 {
|
|
|
|
query = uri[qsStart:qsEnd]
|
|
|
|
}
|
|
|
|
if fragStart > -1 {
|
|
|
|
frag = uri[fragStart:]
|
|
|
|
}
|
|
|
|
|
2020-01-15 11:44:21 -07:00
|
|
|
// build components which are specified, and store them
|
|
|
|
// in a temporary variable so that they all read the
|
|
|
|
// same version of the URI
|
|
|
|
var newPath, newQuery, newFrag string
|
2022-01-13 12:17:15 -05:00
|
|
|
|
2020-04-01 00:43:40 -06:00
|
|
|
if path != "" {
|
2022-01-13 12:17:15 -05:00
|
|
|
// Since the 'uri' placeholder performs a URL-encode,
|
|
|
|
// we need to intercept it so that it doesn't, because
|
|
|
|
// otherwise we risk a double-encode of the path.
|
|
|
|
uriPlaceholder := "{http.request.uri}"
|
|
|
|
if strings.Contains(path, uriPlaceholder) {
|
|
|
|
tmpUri := r.URL.Path
|
|
|
|
if r.URL.RawQuery != "" {
|
|
|
|
tmpUri += "?" + r.URL.RawQuery
|
|
|
|
}
|
|
|
|
path = strings.ReplaceAll(path, uriPlaceholder, tmpUri)
|
|
|
|
}
|
|
|
|
|
2020-04-01 00:43:40 -06:00
|
|
|
newPath = repl.ReplaceAll(path, "")
|
2019-05-20 23:48:43 -06:00
|
|
|
}
|
2020-04-01 00:43:40 -06:00
|
|
|
|
|
|
|
// before continuing, we need to check if a query string
|
|
|
|
// snuck into the path component during replacements
|
|
|
|
if quPos := strings.Index(newPath, "?"); quPos > -1 {
|
|
|
|
// recompute; new path contains a query string
|
|
|
|
var injectedQuery string
|
|
|
|
newPath, injectedQuery = newPath[:quPos], newPath[quPos+1:]
|
|
|
|
// don't overwrite explicitly-configured query string
|
|
|
|
if query == "" {
|
|
|
|
query = injectedQuery
|
|
|
|
}
|
2019-05-20 23:48:43 -06:00
|
|
|
}
|
2020-04-01 00:43:40 -06:00
|
|
|
|
|
|
|
if query != "" {
|
|
|
|
newQuery = buildQueryString(query, repl)
|
|
|
|
}
|
|
|
|
if frag != "" {
|
|
|
|
newFrag = repl.ReplaceAll(frag, "")
|
2020-01-15 11:44:21 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// update the URI with the new components
|
|
|
|
// only after building them
|
|
|
|
if pathStart >= 0 {
|
|
|
|
r.URL.Path = newPath
|
|
|
|
}
|
|
|
|
if qsStart >= 0 {
|
|
|
|
r.URL.RawQuery = newQuery
|
|
|
|
}
|
|
|
|
if fragStart >= 0 {
|
|
|
|
r.URL.Fragment = newFrag
|
2019-05-20 23:48:43 -06:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-10-19 19:22:29 -06:00
|
|
|
// strip path prefix or suffix
|
2020-01-11 13:47:42 -07:00
|
|
|
if rewr.StripPathPrefix != "" {
|
|
|
|
prefix := repl.ReplaceAll(rewr.StripPathPrefix, "")
|
2021-01-11 17:18:53 +01:00
|
|
|
r.URL.RawPath = strings.TrimPrefix(r.URL.RawPath, prefix)
|
|
|
|
if p, err := url.PathUnescape(r.URL.RawPath); err == nil && p != "" {
|
|
|
|
r.URL.Path = p
|
|
|
|
} else {
|
|
|
|
r.URL.Path = strings.TrimPrefix(r.URL.Path, prefix)
|
|
|
|
}
|
2019-10-19 19:22:29 -06:00
|
|
|
}
|
2020-01-11 13:47:42 -07:00
|
|
|
if rewr.StripPathSuffix != "" {
|
|
|
|
suffix := repl.ReplaceAll(rewr.StripPathSuffix, "")
|
2021-03-01 18:27:59 -07:00
|
|
|
changePath(r, func(pathOrRawPath string) string {
|
|
|
|
return strings.TrimSuffix(pathOrRawPath, suffix)
|
|
|
|
})
|
2019-10-19 19:22:29 -06:00
|
|
|
}
|
|
|
|
|
2019-12-12 14:32:35 -07:00
|
|
|
// substring replacements in URI
|
|
|
|
for _, rep := range rewr.URISubstring {
|
|
|
|
rep.do(r, repl)
|
2019-10-19 19:22:29 -06:00
|
|
|
}
|
|
|
|
|
2021-03-01 18:27:59 -07:00
|
|
|
// regular expression replacements on the path
|
|
|
|
for _, rep := range rewr.PathRegexp {
|
|
|
|
rep.do(r, repl)
|
|
|
|
}
|
|
|
|
|
2019-12-12 14:32:35 -07:00
|
|
|
// update the encoded copy of the URI
|
|
|
|
r.RequestURI = r.URL.RequestURI()
|
|
|
|
|
|
|
|
// return true if anything changed
|
|
|
|
return r.Method != oldMethod || r.RequestURI != oldURI
|
|
|
|
}
|
|
|
|
|
2020-01-10 16:59:57 -07:00
|
|
|
// buildQueryString takes an input query string and
|
|
|
|
// performs replacements on each component, returning
|
2020-01-11 11:40:03 -07:00
|
|
|
// the resulting query string. This function appends
|
|
|
|
// duplicate keys rather than replaces.
|
2020-01-10 16:59:57 -07:00
|
|
|
func buildQueryString(qs string, repl *caddy.Replacer) string {
|
|
|
|
var sb strings.Builder
|
2020-01-11 11:40:03 -07:00
|
|
|
|
|
|
|
// first component must be key, which is the same
|
|
|
|
// as if we just wrote a value in previous iteration
|
|
|
|
wroteVal := true
|
2020-01-10 16:59:57 -07:00
|
|
|
|
|
|
|
for len(qs) > 0 {
|
2020-01-11 11:40:03 -07:00
|
|
|
// determine the end of this component, which will be at
|
|
|
|
// the next equal sign or ampersand, whichever comes first
|
2020-01-10 16:59:57 -07:00
|
|
|
nextEq, nextAmp := strings.Index(qs, "="), strings.Index(qs, "&")
|
2020-01-11 11:40:03 -07:00
|
|
|
ampIsNext := nextAmp >= 0 && (nextAmp < nextEq || nextEq < 0)
|
|
|
|
end := len(qs) // assume no delimiter remains...
|
|
|
|
if ampIsNext {
|
|
|
|
end = nextAmp // ...unless ampersand is first...
|
|
|
|
} else if nextEq >= 0 && (nextEq < nextAmp || nextAmp < 0) {
|
|
|
|
end = nextEq // ...or unless equal is first.
|
2020-01-10 16:59:57 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// consume the component and write the result
|
|
|
|
comp := qs[:end]
|
2020-03-30 11:49:53 -06:00
|
|
|
comp, _ = repl.ReplaceFunc(comp, func(name string, val interface{}) (interface{}, error) {
|
2020-01-11 11:40:03 -07:00
|
|
|
if name == "http.request.uri.query" && wroteVal {
|
2020-01-10 16:59:57 -07:00
|
|
|
return val, nil // already escaped
|
|
|
|
}
|
2020-03-30 11:49:53 -06:00
|
|
|
var valStr string
|
|
|
|
switch v := val.(type) {
|
|
|
|
case string:
|
|
|
|
valStr = v
|
|
|
|
case fmt.Stringer:
|
|
|
|
valStr = v.String()
|
|
|
|
case int:
|
|
|
|
valStr = strconv.Itoa(v)
|
|
|
|
default:
|
|
|
|
valStr = fmt.Sprintf("%+v", v)
|
|
|
|
}
|
|
|
|
return url.QueryEscape(valStr), nil
|
2020-01-10 16:59:57 -07:00
|
|
|
})
|
|
|
|
if end < len(qs) {
|
|
|
|
end++ // consume delimiter
|
|
|
|
}
|
|
|
|
qs = qs[end:]
|
|
|
|
|
2020-01-11 11:40:03 -07:00
|
|
|
// if previous iteration wrote a value,
|
|
|
|
// that means we are writing a key
|
|
|
|
if wroteVal {
|
2020-01-15 11:44:21 -07:00
|
|
|
if sb.Len() > 0 && len(comp) > 0 {
|
2020-01-11 11:40:03 -07:00
|
|
|
sb.WriteRune('&')
|
|
|
|
}
|
|
|
|
} else {
|
2020-01-10 16:59:57 -07:00
|
|
|
sb.WriteRune('=')
|
|
|
|
}
|
|
|
|
sb.WriteString(comp)
|
2020-01-11 11:40:03 -07:00
|
|
|
|
|
|
|
// remember for the next iteration that we just wrote a value,
|
|
|
|
// which means the next iteration MUST write a key
|
|
|
|
wroteVal = ampIsNext
|
2020-01-10 16:59:57 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
return sb.String()
|
|
|
|
}
|
|
|
|
|
2021-03-01 18:27:59 -07:00
|
|
|
// substrReplacer describes a simple and fast substring replacement.
type substrReplacer struct {
	// A substring to find. Supports placeholders.
	Find string `json:"find,omitempty"`

	// The substring to replace with. Supports placeholders.
	Replace string `json:"replace,omitempty"`

	// Maximum number of replacements per string.
	// Set to <= 0 for no limit (default).
	Limit int `json:"limit,omitempty"`
}
|
|
|
|
|
2021-03-01 18:27:59 -07:00
|
|
|
// do performs the substring replacement on r.
|
|
|
|
func (rep substrReplacer) do(r *http.Request, repl *caddy.Replacer) {
|
|
|
|
if rep.Find == "" {
|
2021-01-11 17:18:53 +01:00
|
|
|
return
|
2019-12-12 14:32:35 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
lim := rep.Limit
|
|
|
|
if lim == 0 {
|
|
|
|
lim = -1
|
|
|
|
}
|
|
|
|
|
|
|
|
find := repl.ReplaceAll(rep.Find, "")
|
|
|
|
replace := repl.ReplaceAll(rep.Replace, "")
|
|
|
|
|
2021-03-01 18:27:59 -07:00
|
|
|
changePath(r, func(pathOrRawPath string) string {
|
|
|
|
return strings.Replace(pathOrRawPath, find, replace, lim)
|
|
|
|
})
|
2019-12-12 14:32:35 -07:00
|
|
|
|
2021-01-11 17:18:53 +01:00
|
|
|
r.URL.RawQuery = strings.Replace(r.URL.RawQuery, find, replace, lim)
|
2019-05-20 23:48:43 -06:00
|
|
|
}
|
|
|
|
|
2021-03-01 18:27:59 -07:00
|
|
|
// regexReplacer describes a replacement using a regular expression.
type regexReplacer struct {
	// The regular expression to find.
	Find string `json:"find,omitempty"`

	// The substring to replace with. Supports placeholders and
	// regular expression capture groups.
	Replace string `json:"replace,omitempty"`

	// re is the compiled form of Find; it is assigned by
	// Rewrite.Provision.
	re *regexp.Regexp
}
|
|
|
|
|
|
|
|
func (rep regexReplacer) do(r *http.Request, repl *caddy.Replacer) {
|
|
|
|
if rep.Find == "" || rep.re == nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
replace := repl.ReplaceAll(rep.Replace, "")
|
|
|
|
changePath(r, func(pathOrRawPath string) string {
|
|
|
|
return rep.re.ReplaceAllString(pathOrRawPath, replace)
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
// changePath rewrites the path of req.URL using newVal. newVal is
// applied to req.URL.RawPath first; if the result unescapes cleanly
// to a non-empty string, that unescaped string becomes req.URL.Path.
// Otherwise (RawPath is empty or not a valid escaping), newVal is
// applied directly to req.URL.Path instead.
func changePath(req *http.Request, newVal func(pathOrRawPath string) string) {
	u := req.URL
	u.RawPath = newVal(u.RawPath)

	unescaped, err := url.PathUnescape(u.RawPath)
	if err != nil || unescaped == "" {
		// no usable escaped form; transform the decoded path itself
		u.Path = newVal(u.Path)
		return
	}
	u.Path = unescaped
}
|
|
|
|
|
2019-05-20 23:48:43 -06:00
|
|
|
// Interface guard: compile-time assertion that *Rewrite
// satisfies caddyhttp.MiddlewareHandler.
var _ caddyhttp.MiddlewareHandler = (*Rewrite)(nil)
|