components-contrib/middleware/http/opa/middleware.go

269 lines
7.8 KiB
Go

/*
Copyright 2021 The Dapr Authors
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package opa
import (
"bytes"
"context"
"encoding/json"
"errors"
"fmt"
"io"
"math"
"net/http"
"net/textproto"
"reflect"
"slices"
"strconv"
"strings"
"time"
"github.com/open-policy-agent/opa/rego"
"github.com/dapr/components-contrib/common/httputils"
contribMetadata "github.com/dapr/components-contrib/metadata"
"github.com/dapr/components-contrib/middleware"
"github.com/dapr/kit/logger"
kitmd "github.com/dapr/kit/metadata"
kitstrings "github.com/dapr/kit/strings"
)
type Status int
type middlewareMetadata struct {
Rego string `json:"rego" mapstructure:"rego"`
DefaultStatus Status `json:"defaultStatus,omitempty" mapstructure:"defaultStatus"`
IncludedHeaders string `json:"includedHeaders,omitempty" mapstructure:"includedHeaders"`
ReadBody string `json:"readBody,omitempty" mapstructure:"readBody"`
internalIncludedHeadersParsed []string `json:"-" mapstructure:"-"`
}
// NewMiddleware returns a new Open Policy Agent middleware.
func NewMiddleware(logger logger.Logger) middleware.Middleware {
return &Middleware{logger: logger}
}
// Middleware is an OPA middleware.
type Middleware struct {
logger logger.Logger
}
// RegoResult is the expected result from rego policy.
type RegoResult struct {
Allow bool `json:"allow"`
AdditionalHeaders map[string]string `json:"additional_headers,omitempty"`
StatusCode int `json:"status_code,omitempty"`
}
const opaErrorHeaderKey = "x-dapr-opa-error"
var (
errOpaNoResult = errors.New("received no results back from rego policy. Are you setting data.http.allow?")
errOpaInvalidResultType = errors.New("got an invalid type back from repo policy. Only a boolean or map is valid")
)
func (s *Status) UnmarshalJSON(b []byte) error {
if len(b) == 0 {
return nil
}
var v interface{}
if err := json.Unmarshal(b, &v); err != nil {
return err
}
switch value := v.(type) {
case float64:
if value != math.Trunc(value) {
return fmt.Errorf("invalid float value %f parse to status(int)", value)
}
*s = Status(value)
case string:
intVal, err := strconv.Atoi(value)
if err != nil {
return err
}
*s = Status(intVal)
default:
return fmt.Errorf("invalid value %v parse to status(int)", value)
}
if !s.Valid() {
return fmt.Errorf("invalid status value %d expected in range [100-599]", *s)
}
return nil
}
// Check status is in the correct range for RFC 2616 status codes [100-599].
func (s *Status) Valid() bool {
return s != nil && *s >= 100 && *s < 600
}
// GetHandler returns the HTTP handler provided by the middleware.
func (m *Middleware) GetHandler(parentCtx context.Context, metadata middleware.Metadata) (func(next http.Handler) http.Handler, error) {
meta, err := m.getNativeMetadata(metadata)
if err != nil {
return nil, err
}
ctx, cancel := context.WithTimeout(parentCtx, time.Minute)
query, err := rego.New(
rego.Query("result = data.http.allow"),
rego.Module("inline.rego", meta.Rego),
).PrepareForEval(ctx)
cancel()
if err != nil {
return nil, err
}
return func(next http.Handler) http.Handler {
return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
if allow := m.evalRequest(w, r, meta, &query); !allow {
return
}
next.ServeHTTP(w, r)
})
}, nil
}
func (m *Middleware) evalRequest(w http.ResponseWriter, r *http.Request, meta *middlewareMetadata, query *rego.PreparedEvalQuery) bool {
headers := map[string]string{}
for key, value := range r.Header {
if len(value) > 0 && slices.Contains(meta.internalIncludedHeadersParsed, key) {
headers[key] = strings.Join(value, ", ")
}
}
var body string
if kitstrings.IsTruthy(meta.ReadBody) {
buf, _ := io.ReadAll(r.Body)
body = string(buf)
// Put the body back in the request
r.Body = io.NopCloser(bytes.NewBuffer(buf))
}
pathParts := strings.Split(strings.Trim(r.URL.Path, "/"), "/")
input := map[string]interface{}{
"request": map[string]interface{}{
"method": r.Method,
"path": r.URL.Path,
"path_parts": pathParts,
"raw_query": r.URL.RawQuery,
"query": map[string][]string(r.URL.Query()),
"headers": headers,
"scheme": r.URL.Scheme,
"body": body,
},
}
results, err := query.Eval(r.Context(), rego.EvalInput(input))
if err != nil {
m.opaError(w, meta, err)
return false
}
if len(results) == 0 {
m.opaError(w, meta, errOpaNoResult)
return false
}
return m.handleRegoResult(w, r, meta, results[0].Bindings["result"])
}
// handleRegoResult takes the in process request and open policy agent evaluation result
// and maps it the appropriate response or headers.
// It returns true if the request should continue, or false if a response should be immediately returned.
func (m *Middleware) handleRegoResult(w http.ResponseWriter, r *http.Request, meta *middlewareMetadata, result any) bool {
if allowed, ok := result.(bool); ok {
if !allowed {
httputils.RespondWithError(w, int(meta.DefaultStatus))
}
return allowed
}
if _, ok := result.(map[string]any); !ok {
m.opaError(w, meta, errOpaInvalidResultType)
return false
}
// Is it expensive to marshal back and forth? Should we just manually pull out properties?
marshaled, err := json.Marshal(result)
if err != nil {
m.opaError(w, meta, err)
return false
}
regoResult := RegoResult{
// By default, a non-allowed request with return a 403 response.
StatusCode: int(meta.DefaultStatus),
AdditionalHeaders: make(map[string]string),
}
if err = json.Unmarshal(marshaled, &regoResult); err != nil {
m.opaError(w, meta, err)
return false
}
// If the result isn't allowed, set the response status and
// apply the additional headers to the response.
// Otherwise, set the headers on the ongoing request (overriding as necessary).
if !regoResult.Allow {
for key, value := range regoResult.AdditionalHeaders {
w.Header().Set(key, value)
}
httputils.RespondWithError(w, regoResult.StatusCode)
} else {
for key, value := range regoResult.AdditionalHeaders {
r.Header.Set(key, value)
}
}
return regoResult.Allow
}
func (m *Middleware) opaError(w http.ResponseWriter, meta *middlewareMetadata, err error) {
w.Header().Set(opaErrorHeaderKey, "true")
httputils.RespondWithError(w, int(meta.DefaultStatus))
m.logger.Warnf("Error procesing rego policy: %v", err)
}
func (m *Middleware) getNativeMetadata(metadata middleware.Metadata) (*middlewareMetadata, error) {
meta := middlewareMetadata{
DefaultStatus: 403,
}
err := kitmd.DecodeMetadata(metadata.Properties, &meta)
if err != nil {
return nil, err
}
meta.internalIncludedHeadersParsed = strings.Split(meta.IncludedHeaders, ",")
n := 0
for i := range meta.internalIncludedHeadersParsed {
scrubbed := strings.ReplaceAll(meta.internalIncludedHeadersParsed[i], " ", "")
if scrubbed != "" {
meta.internalIncludedHeadersParsed[n] = textproto.CanonicalMIMEHeaderKey(scrubbed)
n++
}
}
meta.internalIncludedHeadersParsed = meta.internalIncludedHeadersParsed[:n]
return &meta, nil
}
func (m *Middleware) GetComponentMetadata() (metadataInfo contribMetadata.MetadataMap) {
metadataStruct := middlewareMetadata{}
contribMetadata.GetMetadataInfoFromStructType(reflect.TypeOf(metadataStruct), &metadataInfo, contribMetadata.MiddlewareType)
return
}