Skip to content

Commit

Permalink
Add Basic Auth to HTTP Connector (#569)
Browse files Browse the repository at this point in the history
* implemented initial processing of authentication variables in http connector endpoints
* restructuring endpoint config to use CredentialsFactory
* add check for credentials in decorator
* update changelog

---------

Co-authored-by: david <[email protected]>
Co-authored-by: djkhl <[email protected]>
Co-authored-by: djkhl <[email protected]>
Co-authored-by: ekneg54 <[email protected]>
  • Loading branch information
5 people authored Apr 23, 2024
1 parent f66b548 commit d93cd99
Show file tree
Hide file tree
Showing 12 changed files with 495 additions and 217 deletions.
2 changes: 2 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -22,3 +22,5 @@ sql_db_table.json
build/
dist/
error_file
experiments
**/_static/*.xlsx
12 changes: 10 additions & 2 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
@@ -1,14 +1,22 @@
## Upcoming Changes

## next release

### Breaking

### Features

### Improvements

### Bugfix

## 11.1.0

### Features

* new documentation part with security best practices which compiles to `user_manual/security/best_practices.html`
* also comes with excel export functionality of given best practices

### Improvements
* add basic auth to http_input

### Bugfix

Expand Down
2 changes: 1 addition & 1 deletion doc/source/conf.py
Original file line number Diff line number Diff line change
Expand Up @@ -118,7 +118,7 @@ def setup(app):
# documentation.
#
html_theme_options = {
"navigation_depth": 5,
"navigation_depth": 4,
}

# Add any paths that contain custom static files (such as style sheets) here,
Expand Down
139 changes: 116 additions & 23 deletions logprep/connector/http/input.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,8 +5,11 @@
A http input connector that spawns an uvicorn server and accepts http requests, parses them,
puts them to an internal queue and pops them via :code:`get_next` method.
Example
^^^^^^^
HTTP Connector Config Example
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
An example config file would look like:
.. code-block:: yaml
:linenos:
Expand All @@ -17,12 +20,61 @@
collect_meta: False
metafield_name: "@metadata"
uvicorn_config:
host: 0.0.0.0
port: 9000
host: 0.0.0.0
port: 9000
endpoints:
/firstendpoint: json
/seccondendpoint: plaintext
/thirdendpoint: jsonl
/firstendpoint: json
/second*: plaintext
/(third|fourth)/endpoint: jsonl
The endpoint config supports regex and wildcard patterns:
* :code:`/second*`: matches everything after asterisk
* :code:`/(third|fourth)/endpoint` matches either third or forth in the first part
Endpoint Credentials Config Example
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
By providing a credentials file in environment variable :code:`LOGPREP_CREDENTIALS_FILE` you can
add basic authentication for a specific endpoint. The format of this file would look like:
.. code-block:: yaml
:caption: Example for credentials file
:linenos:
input:
endpoints:
/firstendpoint:
username: user
password_file: quickstart/exampledata/config/user_password.txt
/second*:
username: user
password: secret_password
You can choose between a plain secret with the key :code:`password` or a filebased secret
with the key :code:`password_file`.
.. security-best-practice::
:title: Http Input Connector - Authentication
When using basic auth with the http input connector the following points should be taken into account:
- basic auth must only be used with strong passwords
- basic auth must only be used with TLS encryption
- avoid to reveal your plaintext secrets in public repositories
Behaviour of HTTP Requests
^^^^^^^^^^^^^^^^^^^^^^^^^^
* :code:`GET`:
* Responds always with 200 (ignores configured Basic Auth)
* When Messages Queue is full, it responds with 429
* :code:`POST`:
* Responds with 200 on non-Basic Auth Endpoints
* Responds with 401 on Basic Auth Endpoints (and 200 with appropriate credentials)
* When Messages Queue is full, it responds wiht 429
* :code:`ALL OTHER`:
* Responds with 405
"""

import inspect
Expand All @@ -32,6 +84,7 @@
import re
import threading
from abc import ABC
from base64 import b64encode
from logging import Logger
from typing import Callable, Mapping, Tuple, Union

Expand All @@ -40,27 +93,40 @@
import uvicorn
from attrs import define, field, validators
from falcon import ( # pylint: disable=no-name-in-module
HTTP_200,
HTTPMethodNotAllowed,
HTTPTooManyRequests,
HTTPUnauthorized,
)

from logprep.abc.input import FatalInputError, Input
from logprep.util import defaults
from logprep.util.credentials import CredentialsFactory

uvicorn_parameter_keys = inspect.signature(uvicorn.Config).parameters.keys()
UVICORN_CONFIG_KEYS = [
parameter for parameter in uvicorn_parameter_keys if parameter not in ["app", "log_level"]
]

# Config Parts that's checked for Config Change
HTTP_INPUT_CONFIG_KEYS = [
"preprocessing",
"uvicorn_config",
"endpoints",
"collect_meta",
"metafield_name",
"message_backlog_size",
]

def decorator_basic_auth(func: Callable):
"""Decorator to check basic authentication.
Will raise 401 on wrong credentials or missing Authorization-Header"""

async def func_wrapper(*args, **kwargs):
endpoint = args[0]
req = args[1]
if endpoint.credentials:
auth_request_header = req.get_header("Authorization")
if not auth_request_header:
raise HTTPUnauthorized
basic_string = req.auth
if endpoint.basicauth_b64 not in basic_string:
raise HTTPUnauthorized
func_wrapper = await func(*args, **kwargs)
return func_wrapper

return func_wrapper


def decorator_request_exceptions(func: Callable):
Expand All @@ -70,6 +136,13 @@ async def func_wrapper(*args, **kwargs):
try:
if args[1].method == "POST":
func_wrapper = await func(*args, **kwargs)
elif args[1].method == "GET":
endpoint = args[0]
resp = args[2]
resp.status = HTTP_200
if endpoint.messages.full():
raise HTTPTooManyRequests(description="Logprep Message Queue is full.")
return
else:
raise HTTPMethodNotAllowed(["POST"])
except queue.Full as exc:
Expand Down Expand Up @@ -125,12 +198,25 @@ class HttpEndpoint(ABC):
Collects Metadata on True (default)
metafield_name: str
Defines key name for metadata
credentials: dict
Includes authentication credentials, if unset auth is disabled
"""

def __init__(self, messages: mp.Queue, collect_meta: bool, metafield_name: str) -> None:
def __init__(
self,
messages: mp.Queue,
collect_meta: bool,
metafield_name: str,
credentials: dict,
) -> None:
self.messages = messages
self.collect_meta = collect_meta
self.metafield_name = metafield_name
self.credentials = credentials
if self.credentials:
self.basicauth_b64 = b64encode(
f"{self.credentials.username}:{self.credentials.password}".encode("utf-8")
).decode("utf-8")


class JSONHttpEndpoint(HttpEndpoint):
Expand All @@ -139,6 +225,7 @@ class JSONHttpEndpoint(HttpEndpoint):
_decoder = msgspec.json.Decoder()

@decorator_request_exceptions
@decorator_basic_auth
@decorator_add_metadata
async def __call__(self, req, resp, **kwargs): # pylint: disable=arguments-differ
"""json endpoint method"""
Expand All @@ -156,6 +243,7 @@ class JSONLHttpEndpoint(HttpEndpoint):
_decoder = msgspec.json.Decoder()

@decorator_request_exceptions
@decorator_basic_auth
@decorator_add_metadata
async def __call__(self, req, resp, **kwargs): # pylint: disable=arguments-differ
"""jsonl endpoint method"""
Expand All @@ -174,13 +262,13 @@ class PlaintextHttpEndpoint(HttpEndpoint):
and put it in :code:`message` field"""

@decorator_request_exceptions
@decorator_basic_auth
@decorator_add_metadata
async def __call__(self, req, resp, **kwargs): # pylint: disable=arguments-differ
"""plaintext endpoint method"""
data = await req.stream.read()
metadata = kwargs.get("metadata", {})
event = {"message": data.decode("utf8")}
print(event)
self.messages.put({**event, **metadata}, block=False)


Expand Down Expand Up @@ -322,8 +410,10 @@ class Config(Input.Config):
]
)
"""Configure endpoint routes with a Mapping of a path to an endpoint. Possible endpoints
are: :code:`json`, :code:`jsonl`, :code:`plaintext`.
are: :code:`json`, :code:`jsonl`, :code:`plaintext`. It's possible to use wildcards and
regexes for pattern matching.
.. autoclass:: logprep.connector.http.input.PlaintextHttpEndpoint
:noindex:
.. autoclass:: logprep.connector.http.input.JSONLHttpEndpoint
Expand Down Expand Up @@ -401,11 +491,14 @@ def setup(self):
endpoints_config = {}
collect_meta = self._config.collect_meta
metafield_name = self._config.metafield_name
cred_factory = CredentialsFactory()
# preparing dict with endpoint paths and initialized endpoints objects
for endpoint_path, endpoint_name in self._config.endpoints.items():
endpoint_class = self._endpoint_registry.get(endpoint_name)
# and add authentication if credentials are existing for path
for endpoint_path, endpoint_type in self._config.endpoints.items():
endpoint_class = self._endpoint_registry.get(endpoint_type)
credentials = cred_factory.from_endpoint(endpoint_path)
endpoints_config[endpoint_path] = endpoint_class(
self.messages, collect_meta, metafield_name
self.messages, collect_meta, metafield_name, credentials
)

self.http_server = ThreadingHTTPServer( # pylint: disable=attribute-defined-outside-init
Expand Down
Loading

0 comments on commit d93cd99

Please sign in to comment.