new version released: 1.0.3

GGontijo · GGontijo · commit 46d40323defd · 2024-05-13T13:46:41.000-04:00
diff --git a/build/lib/fastapi_elasticsearch_middleware/__init__.py b/build/lib/fastapi_elasticsearch_middleware/__init__.py
diff --git a/build/lib/fastapi_elasticsearch_middleware/elasticsearch_middleware.py b/build/lib/fastapi_elasticsearch_middleware/elasticsearch_middleware.py
@@ -0,0 +1,169 @@
+import json
+import logging
+import time
+from fastapi import Request
+from datetime import datetime, timezone
+from fastapi.datastructures import Headers
+from starlette.types import ASGIApp, Receive, Scope, Send
+from elasticsearch import Elasticsearch
+
+class LogLevelEnum:
+    level_mapping = {
+        2: "Info",
+        3: "Warning",
+        4: "Warning",
+        5: "Error"
+    }
+
+class ElasticsearchLoggerMiddleware:
+    def __init__(self, app: ASGIApp, config: dict) -> None:
+        """
+        Initializes an Elasticsearch Logger Middleware for FastAPI.
+
+        Args:
+            app (ASGIApp): The FastAPI ASGI application.
+            config (dict): Configuration settings for Elasticsearch logging.
+                {
+                    'url': str,          # Elasticsearch server URL
+                    'user': str,         # Elasticsearch API user
+                    'password': str      # Elasticsearch API password
+                    'index': str,        # Elasticsearch index name
+                    'environment': str,  # Environment identifier for logs
+                    'limit': bool,       # Limit Elasticsearch payload array and string lenght
+                    'debug': bool        # When True logs aren't sent to Elasticsearch
+                }
+        """
+        elastic_config = config
+        elastic_user = config.get('user')
+        elastic_password = config.get('password')
+        basic_auth = (elastic_user, elastic_password) if elastic_user and elastic_password else None
+        self.elasticsearch_client = Elasticsearch([elastic_config.get('url')], basic_auth=basic_auth)
+        self.index = elastic_config.get('index')
+        self.limit = elastic_config.get('limit', False)
+        self.environment = elastic_config.get('environment', 'Development')
+        self.debug = elastic_config.get('debug', False)
+        self.app = app
+
+    async def __call__(self, scope: Scope, receive: Receive, send: Send) -> None:
+
+        if scope.get('type') == 'http' and not self.debug:
+
+            request = Request(scope)
+
+            async def intercept_send(response):
+                nonlocal log_data
+                if response['type'] == 'http.response.body' and "response" not in log_data.keys(): # Streaming response, we don't want to log this
+                    await send(response)
+                    return 
+                if response['type'] == 'http.response.body' and "response" in log_data.keys(): # Response part
+                    
+                    # Finishes telemetry
+                    end_time = time.time()
+                    elapsed_time = end_time - start_time
+
+                    log_data["elapsed_time"] = elapsed_time
+
+                    if log_data["response"]["headers"].get('content-type') == 'application/json':
+                        response_body = json.loads(response.get('body'))
+                        response_body = self.limit_array_length(response_body)
+
+                        response_body = json.dumps(response_body, ensure_ascii=False) if 'body' in response.keys() else None
+                        log_data["response"]["body"] = response_body
+
+                    elif log_data["response"]["headers"].get('content-type') == 'application/octet-stream':
+                        log_data["response"]["body"] = str(response.get('body')) if 'body' in response.keys() else None
+
+                    self.log_to_elasticsearch(log_data)
+
+                if response['type'] == 'http.response.start': # Request part
+                    
+                    request_headers = dict(request.headers) if 'headers' in request.keys() else None
+                    request_query_parameters = dict(request.query_params) if len(request.query_params._list) > 0 else None
+
+                    response_headers = dict(Headers(raw=response.get('headers'))) if 'headers' in response.keys() else None
+
+                    log_data["status_code"] = response['status']
+                    log_data["level"] = LogLevelEnum.level_mapping.get(int(str(response['status'])[0]))
+                    log_data["request"]["headers"] = request_headers
+                    log_data["request"]["query_parameters"] = request_query_parameters
+                    log_data["response"]["headers"] = response_headers
+
+                await send(response)
+
+            start_time = time.time()
+            
+            log_data = {
+                "@timestamp": datetime.now().replace(tzinfo=timezone.utc).strftime("%Y-%m-%dT%H:%M:%S"),
+                "environment": self.environment, 
+                "method": request.method,
+                "path": request.url.path,
+                "request": {},
+                "response": {}
+            }
+ 
+            # Starts telemetry
+            start_time = time.time()
+
+            async def intercept_receive():
+                message = await receive()
+
+                more_body = message.get("more_body", False)
+                body = message.get("body", "")
+                while more_body:
+                    message = await receive()
+                    body += message.get("body", b"")
+                    more_body = message.get("more_body", False)
+
+                message["body"] = body
+                request_body = ''
+
+                if len(message["body"]) > 0:
+                    request_body = json.loads(body.decode('utf-8'))
+                    request_body = self.limit_string_length(request_body)
+                    request_body = json.dumps(request_body, ensure_ascii=False) if len(body.decode('utf-8')) > 0 else None
+                
+                log_data["request"]["body"] = request_body
+
+                return message
+        
+            await self.app(scope, intercept_receive, intercept_send)
+            
+        else:
+            await self.app(scope, receive, send)
+
+    def log_to_elasticsearch(self, log_data) -> None:
+        try:
+            self.elasticsearch_client.index(index=self.index, body=log_data)
+            log_data.clear()
+        except Exception as e:
+            logging.error(f"Failed to log to Elasticsearch: {str(e)}")
+
+    def limit_string_length(self, data, max_lines=50):
+        if not self.limit:
+            return data
+        if isinstance(data, dict):
+            for key, value in data.items():
+                data[key] = self.limit_string_length(value, max_lines)
+        elif isinstance(data, list):
+            for i in range(len(data)):
+                data[i] = self.limit_string_length(data[i], max_lines)          
+        elif isinstance(data, str) and len(data.split('\n')) > max_lines:
+            data_splitted = data.split('\n')[:max_lines]
+            data_splitted.append(f' [...] value limited in {max_lines} lines')
+            data = '\n'.join(data_splitted)
+        elif isinstance(data, str) and len(data.split('/')) > max_lines: # Base64 files
+            data_splitted = data.split('/')[:max_lines]
+            data_splitted.append(f' [...] value limited in {max_lines} lines')
+            data = '/'.join(data_splitted)
+        return data
+    
+    def limit_array_length(self, data, max_length=3):
+        if not self.limit:
+            return data
+        if isinstance(data, dict):
+            for key, value in data.items():
+                data[key] = self.limit_array_length(value, max_length)
+        elif isinstance(data, list) and len(data) > max_length:
+            data = data[:max_length]
+            data.append(f'[...] array limited in {max_length} objects')
+        return data
diff --git a/setup.py b/setup.py
@@ -2,16 +2,33 @@
   
 setup( 
     name='fastapi_elasticsearch_middleware', 
-    version='1.0.2', 
+    version='1.0.3', 
     url='https://github.com/GGontijo/fastapi-elasticsearch-middleware.git',
     description='Elasticsearch Logger Middleware for FastAPI',
     long_description_content_type='text/markdown',
     long_description=open('README.md').read(),
     author='Gabriel Gontijo', 
     author_email='gabrieldercilio08@gmail.com', 
     packages=find_packages(), 
+    keywords=['python', 'middleware', 'fastapi', 'elasticsearch', 'kibana', 'logstash', 'fastapi-middleware'],
     install_requires=[ 
         'fastapi', 
         'elasticsearch', 
-    ], 
+    ],
+    classifiers=[
+        "Programming Language :: Python :: 3",
+        "License :: OSI Approved :: MIT License",
+        "Operating System :: OS Independent",
+        "Development Status :: 4 - Beta",
+        "Intended Audience :: Developers",
+        "Topic :: Software Development :: Libraries :: Python Modules",
+        "Topic :: Internet :: WWW/HTTP :: HTTP Servers",
+        "Topic :: Internet :: WWW/HTTP :: ASGI",
+        "Topic :: Internet :: WWW/HTTP :: ASGI :: Middleware",
+        "Topic :: Internet :: WWW/HTTP :: ASGI :: Server",
+        "Topic :: Internet :: WWW/HTTP :: ASGI :: Application",
+        "Topic :: Internet :: WWW/HTTP :: ASGI :: Server",
+        "Topic :: Internet :: WWW/HTTP :: ASGI :: Middleware",
+        "Topic :: Internet :: WWW/HTTP :: ASGI :: Application",
+    ]
 )