fossasia · samay2504 · Dec 4, 2025 · Dec 4, 2025 · Dec 4, 2025 · Dec 4, 2025
diff --git a/app/api/auth.py b/app/api/auth.py
@@ -1,6 +1,7 @@
 import base64
 import logging
 import random
+import re
 import string
 from datetime import timedelta
 from functools import wraps
@@ -51,6 +52,27 @@
 auth_routes = Blueprint('auth', __name__, url_prefix='/v1/auth')
 
 
+def sanitize_for_logging(text):
+    r"""
+    Remove control characters from user input before logging to prevent log injection.
+
+    Security Issue #9120: User-provided data like emails can contain newlines, carriage
+    returns, or tabs that allow attackers to inject false log entries, corrupt log files,
+    bypass log analysis tools, or hide malicious activity.
+
+    Example Attack: email="user@test.com\nFAKE: Admin login successful from 1.2.3.4"
+
+    Args:
+        text (str): User-provided input to sanitize
+
+    Returns:
+        str: Text with control characters (\n, \r, \t) removed
+    """
+    if not text:
+        return text
+    return re.sub(r'[\n\r\t]', '', text)
-    if not text:
-        return text
-    return re.sub(r'[\n\r\t]', '', text)
+    return text if not text else re.sub(r'[\n\r\t]', '', text)
-    if not text:
-        return text
-    return re.sub(r'[\n\r\t]', '', text)
+    return text if not text else re.sub(r'[\n\r\t]', '', text)
+
+
 def authenticate(allow_refresh_token=False, existing_identity=None):
     data = request.get_json()
     username = data.get('email', data.get('username'))
@@ -81,14 +103,14 @@ def authenticate(allow_refresh_token=False, existing_identity=None):
     response_data = {'access_token': access_token}
 
     if add_refresh_token:
-        refresh_token = create_refresh_token(identity.id)
+        refresh_token_value = create_refresh_token(identity.id)
         if include_in_response:
-            response_data['refresh_token'] = refresh_token
+            response_data['refresh_token'] = refresh_token_value
 
     response = jsonify(response_data)
 
     if add_refresh_token and not include_in_response:
-        set_refresh_cookies(response, refresh_token)
+        set_refresh_cookies(response, refresh_token_value)
 
     return response
 
@@ -108,10 +130,10 @@ def fresh_login():
 @auth_routes.route('/token/refresh', methods=['POST'])
 @jwt_refresh_token_required
 def refresh_token():
-    current_user = get_jwt_identity()
+    user_identity = get_jwt_identity()
     expiry_time = timedelta(minutes=90)
     new_token = create_access_token(
-        identity=current_user, fresh=False, expires_delta=expiry_time
+        identity=user_identity, fresh=False, expires_delta=expiry_time
     )
     return jsonify({'access_token': new_token})
 
@@ -302,11 +324,11 @@ def verify_email():
     except Exception:
         logging.error('Invalid Token')
         raise BadRequestError({'source': ''}, 'Invalid Token')
-    else:
-        user.is_verified = True
-        save_to_db(user)
-        logging.info('Email Verified')
-        return make_response(jsonify(message="Email Verified"), 200)
+
+    user.is_verified = True
+    save_to_db(user)
+    logging.info('Email Verified')
+    return make_response(jsonify(message="Email Verified"), 200)
 
 
 @auth_routes.route('/resend-verification-email', methods=['POST'])
@@ -320,22 +342,24 @@ def resend_verification_email():
     try:
         user = User.query.filter_by(email=email).one()
     except NoResultFound:
-        logging.info('User with email: ' + email + ' not found.')
+        # Sanitize email to prevent log injection (Issue #9120)
+        safe_email = sanitize_for_logging(email)
+        logging.info('User with email: %s not found.', safe_email)
         raise UnprocessableEntityError(
             {'source': ''}, 'User with email: ' + email + ' not found.'
-            {'source': ''}, 'User with email: ' + email + ' not found.'
+            {'source': ''}, 'User with email: ' + safe_email + ' not found.'
-            {'source': ''}, 'User with email: ' + email + ' not found.'
+            {'source': ''}, 'User with email: ' + safe_email + ' not found.'
         )
-    else:
-        serializer = get_serializer()
-        hash_ = str(
-            base64.b64encode(
-                str(serializer.dumps([user.email, str_generator()])).encode()
-            ),
-            'utf-8',
-        )
-        link = make_frontend_url('/verify', {'token': hash_})
-        send_email_confirmation(user.email, link)
-        logging.info('Verification email resent')
-        return make_response(jsonify(message="Verification email resent"), 200)
+
+    serializer = get_serializer()
+    hash_ = str(
+        base64.b64encode(
+            str(serializer.dumps([user.email, str_generator()])).encode()
+        ),
+        'utf-8',
+    )
+    link = make_frontend_url('/verify', {'token': hash_})
+    send_email_confirmation(user.email, link)
+    logging.info('Verification email resent')
+    return make_response(jsonify(message="Verification email resent"), 200)
 
 
 @auth_routes.route('/reset-password', methods=['POST'])
@@ -378,11 +402,11 @@ def reset_password_patch():
     except NoResultFound:
         logging.info('User Not Found')
         raise NotFoundError({'source': ''}, 'User Not Found')
-    else:
-        user.password = password
-        if not user.is_verified:
-            user.is_verified = True
-        save_to_db(user)
+
+    user.password = password
+    if not user.is_verified:
+        user.is_verified = True
+    save_to_db(user)
 
     return jsonify(
         {
@@ -404,26 +428,26 @@ def change_password():
     except NoResultFound:
         logging.info('User Not Found')
         raise NotFoundError({'source': ''}, 'User Not Found')
-    else:
-        if user.is_correct_password(old_password):
-            if user.is_correct_password(new_password):
-                logging.error('Old and New passwords must be different')
-                raise BadRequestError(
-                    {'source': ''}, 'Old and New passwords must be different'
-                )
-            if len(new_password) < 8:
-                logging.error('Password should have minimum 8 characters')
-                raise BadRequestError(
-                    {'source': ''}, 'Password should have minimum 8 characters'
-                )
-            user.password = new_password
-            save_to_db(user)
-            send_password_change_email(user)
-        else:
-            logging.error('Wrong Password. Please enter correct current password.')
+
+    if user.is_correct_password(old_password):
+        if user.is_correct_password(new_password):
+            logging.error('Old and New passwords must be different')
+            raise BadRequestError(
+                {'source': ''}, 'Old and New passwords must be different'
+            )
+        if len(new_password) < 8:
+            logging.error('Password should have minimum 8 characters')
             raise BadRequestError(
-                {'source': ''}, 'Wrong Password. Please enter correct current password.'
+                {'source': ''}, 'Password should have minimum 8 characters'
             )
+        user.password = new_password
+        save_to_db(user)
+        send_password_change_email(user)
+    else:
+        logging.error('Wrong Password. Please enter correct current password.')
+        raise BadRequestError(
+            {'source': ''}, 'Wrong Password. Please enter correct current password.'
+        )
 
     return jsonify(
         {

diff --git a/tests/all/integration/api/test_auth_log_injection.py b/tests/all/integration/api/test_auth_log_injection.py
@@ -0,0 +1,68 @@
+"""
+Test for log injection vulnerability in auth.py (Issue #9120)
+Tests that user-provided email addresses cannot inject malicious content into logs
+"""
+import re
+
+
+def test_log_sanitization_for_email():
+    """
+    Unit test for log injection vulnerability (Issue #9120)
+
+    Tests that email addresses with injection characters are properly sanitized
+    before being logged to prevent log file corruption.
+
+    Security Impact: Without sanitization, attackers can:
+    - Inject false log entries (e.g., fake admin logins)
+    - Corrupt log file structure
+    - Bypass log analysis tools
+    - Hide malicious activity
+
+    Example attack: email="user@test.com\nFAKE: Admin login successful"
+    """
+    # Simulate the vulnerable code pattern from auth.py line 323
+    malicious_inputs = [
+        "test@example.com\nFAKE: Admin logged in from 1.2.3.4",
+        "test@example.com\rFAKE: Password reset",
+        "test@example.com\t\t\tFAKE_COLUMN",
+        "test@example.com\n\rMultiline\nInjection\rAttempt",
+    ]
+
+    for malicious_email in malicious_inputs:
+        # This represents the VULNERABLE code pattern:
+        # logging.info('User with email: ' + email + ' not found.')
+
+        # Vulnerability demonstration: raw concatenation allows injection
+        vulnerable_log_message = 'User with email: ' + malicious_email + ' not found.'
+
+        # Check 1: Vulnerable pattern contains control characters (SECURITY ISSUE)
+        has_injection = any(char in vulnerable_log_message for char in ['\n', '\r', '\t\t\t'])
-        has_injection = any(char in vulnerable_log_message for char in ['\n', '\r', '\t\t\t'])
+        has_injection = any(char in vulnerable_log_message for char in ['\n', '\r', '\t'])
-        has_injection = any(char in vulnerable_log_message for char in ['\n', '\r', '\t\t\t'])
+        has_injection = any(char in vulnerable_log_message for char in ['\n', '\r', '\t'])
+        assert has_injection, \
+            f"Test setup error: Expected injection characters in: {repr(vulnerable_log_message)}"
+
+        # Check 2: After sanitization, these characters should be removed/escaped
+        # This test will PASS after the fix is implemented in auth.py
+        sanitized_email = re.sub(r'[\n\r\t]', '', malicious_email)
+        safe_log_message = 'User with email: ' + sanitized_email + ' not found.'
+
+        # This assertion documents the expected fix:
+        # After fix, sanitized logs should not contain injection attempts
+        assert '\nFAKE:' not in safe_log_message, \
+            f"Sanitized message should not contain newline injection: {safe_log_message}"
+        assert '\rFAKE:' not in safe_log_message, \
+            f"Sanitized message should not contain CR injection: {safe_log_message}"
+
+
+def test_normal_email_unchanged_after_sanitization():
+    """Test that normal emails remain unchanged after sanitization"""
+    normal_emails = [
+        "user@example.com",
+        "test.user+tag@domain.co.uk",
+        "admin@localhost",
+    ]
+
+    for email in normal_emails:
+        # Sanitization should not affect legitimate emails
+        sanitized = re.sub(r'[\n\r\t]', '', email)
+        assert sanitized == email, \
+            f"Normal email should remain unchanged: {email} -> {sanitized}"