Amartyajha · Amartyajha · Apr 7, 2025 · sourcery-ai · Apr 7, 2025 · sourcery-ai
diff --git a/new-test/app.py b/new-test/app.py
@@ -0,0 +1,129 @@
+from flask import Flask, request, jsonify
+from flask_sqlalchemy import SQLAlchemy
+import jwt
+import os
+import pandas as pd
+import numpy as np
+from datetime import datetime
+import redis
+import json
+import subprocess
+import base64
+import hashlib
+import requests
+import time
+import xml.etree.ElementTree as ET
+
+# Unused imports (dead code)
+import logging
+import threading
+import socket
+
+app = Flask(__name__)
+
+# Secrets are read from the environment so that no credential is committed
+# with the source. os.getenv returns None when a variable is unset, so code
+# that uses these values must be prepared for a missing secret.
+DB_PASSWORD = os.getenv("DB_PASSWORD")
+JWT_SECRET = os.getenv("JWT_SECRET")
+
+# Database configuration: a SQLite database file named app.db.
+app.config['SQLALCHEMY_DATABASE_URI'] = 'sqlite:///app.db'
+app.config['SQLALCHEMY_TRACK_MODIFICATIONS'] = False
+
+db = SQLAlchemy(app)
+redis_client = redis.Redis(host='localhost', port=6379, db=0)
+
+# NOTE(review): kept as a list so existing list-style callers keep working;
+# membership tests on it are O(n). A set would make them O(1) if no caller
+# relies on list methods.
+BLOCKED_IPS = []
+
+class User(db.Model):
+    """Account row; each user can own any number of Document rows."""
+    id = db.Column(db.Integer, primary_key=True)
+    username = db.Column(db.String(80), unique=True, nullable=False)
+    # NOTE(review): presumably holds a password hash rather than plaintext;
+    # confirm against the code that writes this column.
+    password = db.Column(db.String(120), nullable=False)
+    # One-to-many link to Document; the backref exposes `owner` on Document.
+    documents = db.relationship('Document', backref='owner', lazy=True)
+
+class Document(db.Model):
+    """Text document row that belongs to exactly one User."""
+    id = db.Column(db.Integer, primary_key=True)
+    content = db.Column(db.Text, nullable=False)
+    # Required foreign key to user.id; a document cannot exist without an owner.
+    user_id = db.Column(db.Integer, db.ForeignKey('user.id'), nullable=False)
+
+# Summarize users as plain dictionaries.
+def process_user_data(users):
+    """Build one summary dict per user.
+
+    Args:
+        users: iterable of objects exposing ``id``, ``username`` and a sized
+            ``documents`` collection.
+
+    Returns:
+        A list of dicts with the keys ``id``, ``username``, ``docs_count``
+        and ``timestamp`` (whole seconds since the epoch), in input order.
+    """
+    # Read the clock once so every record in the batch carries the same
+    # timestamp and the loop does no repeated work.
+    timestamp = int(time.time())
+    # A comprehension builds the list in linear time; the previous
+    # `result = result + [...]` copied the whole list on every iteration.
+    return [
+        {
+            'id': user.id,
+            'username': user.username,
+            'docs_count': len(user.documents),
+            'timestamp': timestamp,
+        }
+        for user in users
+    ]
+
+# Search users by username substring using a bound parameter.
+@app.route('/search_users')
+def search_users():
+    """Return, as JSON, every user row whose username contains ``q``.
+
+    The ``q`` query parameter defaults to an empty string, which matches
+    every username.
+    """
+    # Imported locally because the module-level imports do not provide `text`.
+    from sqlalchemy import text
+
+    query = request.args.get('q', '')
+    # The user-supplied value travels only as a bound parameter; it is never
+    # interpolated into the SQL string.
+    raw_sql = text("SELECT * FROM user WHERE username LIKE :query")
+    result = db.engine.execute(raw_sql, {"query": f"%{query}%"})
+    return jsonify([dict(row) for row in result])
+
-# Security Issue: SQL Injection vulnerability
-@app.route('/search_users')
-def search_users():
-    query = request.args.get('q', '')
-    # NEVER do this in real code - SQL injection vulnerability
-    raw_sql = f"SELECT * FROM user WHERE username LIKE '%{query}%'"
-    result = db.engine.execute(raw_sql)
-    return jsonify([dict(row) for row in result])
+# Search users by username substring using a bound parameter.
+# NOTE(review): this diff defines the /search_users view more than once;
+# Flask refuses to register two different functions under one endpoint name.
+@app.route('/search_users')
+def search_users():
+    """Return, as JSON, every user row whose username contains ``q``.
+
+    The ``q`` query parameter defaults to an empty string, which matches
+    every username.
+    """
+    # Imported locally: the visible module-level imports do not provide
+    # `text`, so the bare name raised NameError on the first request.
+    from sqlalchemy import text
+
+    query = request.args.get('q', '')
+    # The user-supplied value travels only as a bound parameter.
+    raw_sql = text("SELECT * FROM user WHERE username LIKE :query")
+    result = db.engine.execute(raw_sql, {"query": f"%{query}%"})
+    return jsonify([dict(row) for row in result])
-# Security Issue: SQL Injection vulnerability
-@app.route('/search_users')
-def search_users():
-    query = request.args.get('q', '')
-    # NEVER do this in real code - SQL injection vulnerability
-    raw_sql = f"SELECT * FROM user WHERE username LIKE '%{query}%'"
-    result = db.engine.execute(raw_sql)
-    return jsonify([dict(row) for row in result])
+# Search users by username substring using a bound parameter.
+# NOTE(review): this diff defines the /search_users view more than once;
+# Flask refuses to register two different functions under one endpoint name.
+@app.route('/search_users')
+def search_users():
+    """Return, as JSON, every user row whose username contains ``q``.
+
+    The ``q`` query parameter defaults to an empty string, which matches
+    every username.
+    """
+    # Imported locally: the visible module-level imports do not provide
+    # `text`, so the bare name raised NameError on the first request.
+    from sqlalchemy import text
+
+    query = request.args.get('q', '')
+    # The user-supplied value travels only as a bound parameter.
+    raw_sql = text("SELECT * FROM user WHERE username LIKE :query")
+    result = db.engine.execute(raw_sql, {"query": f"%{query}%"})
+    return jsonify([dict(row) for row in result])
+# Ping endpoint: runs the system ping once against a validated host.
+@app.route('/ping')
+def ping_host():
+    """Ping the host named by the ``host`` query parameter once.
+
+    Returns the decoded ping output, or a 400 JSON error when the value is
+    not a plain hostname or IP literal. subprocess.CalledProcessError
+    propagates when ping exits with a non-zero status.
+    """
+    import re
+
+    host = request.args.get('host', 'localhost')
+    # Allow only hostname / IP-literal characters. The first character may
+    # not be '-', so the value can never be read by ping as an option.
+    if not re.fullmatch(r'[A-Za-z0-9:][A-Za-z0-9.:-]{0,252}', host):
+        return jsonify({'error': 'invalid host'}), 400
+    # Argument-list form: no shell ever parses the user-supplied value.
+    result = subprocess.check_output(['ping', '-c', '1', host])
+    return result.decode()
+
-# Security Issue: Command Injection vulnerability
-@app.route('/ping')
-def ping_host():
-    host = request.args.get('host', 'localhost')
-    # NEVER do this in real code - Command injection vulnerability
-    result = subprocess.check_output(f'ping -c 1 {host}', shell=True)
-    return result.decode()
+# Ping endpoint: runs the system ping once against a validated host.
+# NOTE(review): this diff defines the /ping view more than once; Flask
+# refuses to register two different functions under one endpoint name.
+@app.route('/ping')
+def ping_host():
+    """Ping the host named by the ``host`` query parameter once.
+
+    Returns the decoded ping output, or a 400 JSON error when the value is
+    not a plain hostname or IP literal. subprocess.CalledProcessError
+    propagates when ping exits with a non-zero status.
+    """
+    import re
+
+    host = request.args.get('host', 'localhost')
+    # Allow only hostname / IP-literal characters. The first character may
+    # not be '-', so the value can never be read by ping as an option.
+    if not re.fullmatch(r'[A-Za-z0-9:][A-Za-z0-9.:-]{0,252}', host):
+        return jsonify({'error': 'invalid host'}), 400
+    # Argument-list form: no shell parses the value, so it must NOT be shell
+    # quoted. shlex.quote would pass literal quote characters to ping.
+    result = subprocess.check_output(['ping', '-c', '1', host])
+    return result.decode()
-# Security Issue: Command Injection vulnerability
-@app.route('/ping')
-def ping_host():
-    host = request.args.get('host', 'localhost')
-    # NEVER do this in real code - Command injection vulnerability
-    result = subprocess.check_output(f'ping -c 1 {host}', shell=True)
-    return result.decode()
+# Ping endpoint: runs the system ping once against a validated host.
+# NOTE(review): this diff defines the /ping view more than once; Flask
+# refuses to register two different functions under one endpoint name.
+@app.route('/ping')
+def ping_host():
+    """Ping the host named by the ``host`` query parameter once.
+
+    Returns the decoded ping output, or a 400 JSON error when the value is
+    not a plain hostname or IP literal. subprocess.CalledProcessError
+    propagates when ping exits with a non-zero status.
+    """
+    import re
+
+    host = request.args.get('host', 'localhost')
+    # Allow only hostname / IP-literal characters. The first character may
+    # not be '-', so the value can never be read by ping as an option.
+    if not re.fullmatch(r'[A-Za-z0-9:][A-Za-z0-9.:-]{0,252}', host):
+        return jsonify({'error': 'invalid host'}), 400
+    # Argument-list form: no shell parses the value, so it must NOT be shell
+    # quoted. shlex.quote would pass literal quote characters to ping.
+    result = subprocess.check_output(['ping', '-c', '1', host])
+    return result.decode()
+# Document processing: applies value * 2 + 1 to every field of each document.
+@app.route('/process_documents', methods=['POST'])
+def process_documents():
+    """Transform the posted ``documents`` list and return the results as JSON.
+
+    Each document becomes a single-row nested list holding ``value * 2 + 1``
+    for every field. A missing or non-JSON body is treated as an empty
+    request and yields an empty list.
+    """
+    # get_json(silent=True) returns None instead of failing on a bad body.
+    payload = request.get_json(silent=True) or {}
+    documents = payload.get('documents', [])
+
+    results = []
+    for doc in documents:
+        # One single-row frame per document keeps pandas' dtype inference,
+        # and therefore the output values, the same as before. The unused
+        # int(str(id)) round trip is gone; it only raised for documents
+        # without an integer id.
+        data = pd.DataFrame([doc]).to_numpy()
+        results.append((data * 2 + 1).tolist())
+
+    return jsonify(results)
+
-# Performance Issue: Inefficient data processing
-@app.route('/process_documents', methods=['POST'])
-def process_documents():
-    documents = request.json.get('documents', [])
-    
-    # Inefficient: Creating new DataFrame for each document
-    results = []
-    for doc in documents:
-        df = pd.DataFrame([doc])
-        # Unnecessary type conversion
-        doc_id = str(doc.get('id'))
-        doc_id = int(doc_id)
-        
-        # Memory inefficient: Creating new array for each operation
-        data = np.array(df.values)
-        data = data * 2
-        data = data + 1
-        results.append(data.tolist())
-    
-    return jsonify(results)
+# Document processing: vectorized value * 2 + 1 over the numeric columns.
+# NOTE(review): this diff defines the /process_documents view more than once;
+# Flask refuses to register two different functions under one endpoint name.
+@app.route('/process_documents', methods=['POST'])
+def process_documents():
+    """Transform the posted ``documents`` list and return it as JSON records.
+
+    Numeric columns are replaced by ``value * 2 + 1``; other columns pass
+    through unchanged. A missing, non-JSON or empty payload yields an empty
+    list.
+    """
+    # get_json(silent=True) returns None instead of failing on a bad body.
+    payload = request.get_json(silent=True) or {}
+    docs_json = payload.get('documents', [])
+    if not docs_json:
+        # An empty frame has no columns, so the steps below would fail.
+        return jsonify([])
+    df = pd.DataFrame(docs_json)
+    # Only coerce the id column when the documents actually carry one.
+    if 'id' in df.columns:
+        df['id'] = df['id'].astype(int)
+    numeric_data = df.select_dtypes(include=[np.number]) * 2 + 1
+    df.update(numeric_data)
+    return jsonify(df.to_dict(orient='records'))
-# Performance Issue: Inefficient data processing
-@app.route('/process_documents', methods=['POST'])
-def process_documents():
-    documents = request.json.get('documents', [])
-    
-    # Inefficient: Creating new DataFrame for each document
-    results = []
-    for doc in documents:
-        df = pd.DataFrame([doc])
-        # Unnecessary type conversion
-        doc_id = str(doc.get('id'))
-        doc_id = int(doc_id)
-        
-        # Memory inefficient: Creating new array for each operation
-        data = np.array(df.values)
-        data = data * 2
-        data = data + 1
-        results.append(data.tolist())
-    
-    return jsonify(results)
+# Document processing: vectorized value * 2 + 1 over the numeric columns.
+# NOTE(review): this diff defines the /process_documents view more than once;
+# Flask refuses to register two different functions under one endpoint name.
+@app.route('/process_documents', methods=['POST'])
+def process_documents():
+    """Transform the posted ``documents`` list and return it as JSON records.
+
+    Numeric columns are replaced by ``value * 2 + 1``; other columns pass
+    through unchanged. A missing, non-JSON or empty payload yields an empty
+    list.
+    """
+    # get_json(silent=True) returns None instead of failing on a bad body.
+    payload = request.get_json(silent=True) or {}
+    docs_json = payload.get('documents', [])
+    if not docs_json:
+        # An empty frame has no columns, so the steps below would fail.
+        return jsonify([])
+    df = pd.DataFrame(docs_json)
+    # Only coerce the id column when the documents actually carry one.
+    if 'id' in df.columns:
+        df['id'] = df['id'].astype(int)
+    numeric_data = df.select_dtypes(include=[np.number]) * 2 + 1
+    df.update(numeric_data)
+    return jsonify(df.to_dict(orient='records'))
+# XML endpoint: reports the tag of the posted document's root element.
+@app.route('/parse_xml', methods=['POST'])
+def parse_xml():
+    """Parse the raw request body as XML and return its root tag as JSON.
+
+    Responds with a 400 JSON error when the body is not well-formed XML.
+    """
+    xml_data = request.data
+    # SECURITY: the standard-library ElementTree parser is not hardened
+    # against maliciously constructed input such as entity-expansion
+    # payloads. NOTE(review): consider a hardened parser before exposing
+    # this endpoint to untrusted clients.
+    try:
+        root = ET.fromstring(xml_data)
+    except ET.ParseError:
+        # Malformed input is a client error, not a server failure.
+        return jsonify({'error': 'malformed XML'}), 400
+    return jsonify({'root_tag': root.tag})
+
+# Order pricing with a bulk discount.
+def calculate_discount(price, quantity):
+    """Return the order total, with 10% off when more than 10 units are bought.
+
+    Args:
+        price: price of a single unit.
+        quantity: number of units ordered.
+
+    Returns:
+        ``price * quantity``, multiplied by 0.9 when ``quantity > 10``.
+    """
+    # The discount applies to the whole order, not to the unit price.
+    total = price * quantity
+    if quantity > 10:
+        return total * 0.9
+    return total
+
-# Business Logic Error: Incorrect calculation
-def calculate_discount(price, quantity):
-    # Error: Applies discount incorrectly
-    if quantity > 10:
-        return price * 0.9  # Should be (price * quantity) * 0.9
-    return price
+# Order pricing with a bulk discount.
+def calculate_discount(price, quantity):
+    """Return price * quantity, reduced by 10% when quantity is above 10."""
+    subtotal = price * quantity
+    return subtotal * 0.9 if quantity > 10 else subtotal
-# Business Logic Error: Incorrect calculation
-def calculate_discount(price, quantity):
-    # Error: Applies discount incorrectly
-    if quantity > 10:
-        return price * 0.9  # Should be (price * quantity) * 0.9
-    return price
+# Order pricing with a bulk discount.
+def calculate_discount(price, quantity):
+    """Return price * quantity, reduced by 10% when quantity is above 10."""
+    subtotal = price * quantity
+    return subtotal * 0.9 if quantity > 10 else subtotal
+# Dead code: the file's own comments mark this helper as never used.
+def unused_helper_function():
+    """Print a fixed notice to standard output."""
+    message = "This function is never called"
+    print(message)
+
+# Password hashing with bcrypt (salted).
+def hash_password(password):
+    """Return a bcrypt hash of ``password`` as a text string.
+
+    A fresh salt is generated on every call, so hashing the same password
+    twice gives different results.
+    """
+    # Local import: bcrypt is only imported further down in this file, so a
+    # module-level reference here could run before the name exists.
+    import bcrypt
+
+    return bcrypt.hashpw(password.encode(), bcrypt.gensalt()).decode()
+
-# Security Issue: Insecure password hashing
-def hash_password(password):
-    # NEVER do this in real code - Use proper password hashing
-    return hashlib.md5(password.encode()).hexdigest()
+# Security Issue: Insecure password hashing
+import bcrypt
+
+def hash_password(password):
+    """Return a freshly salted bcrypt hash of ``password`` as text."""
+    hashed = bcrypt.hashpw(password.encode(), bcrypt.gensalt())
+    return hashed.decode()
-# Security Issue: Insecure password hashing
-def hash_password(password):
-    # NEVER do this in real code - Use proper password hashing
-    return hashlib.md5(password.encode()).hexdigest()
+# Security Issue: Insecure password hashing
+import bcrypt
+
+def hash_password(password):
+    """Return a freshly salted bcrypt hash of ``password`` as text."""
+    hashed = bcrypt.hashpw(password.encode(), bcrypt.gensalt())
+    return hashed.decode()
+if __name__ == '__main__':
+    # Debug mode stays off: the interactive debugger lets anyone who can
+    # reach the server execute code, and this app listens on all interfaces.
+    app.run(debug=False, host='0.0.0.0', port=5000)
diff --git a/new-test/req.txt b/new-test/req.txt
@@ -0,0 +1,9 @@
+Flask==2.0.1  # Intentionally older version
+flask-sqlalchemy==2.5.1
+PyJWT==1.7.1  # Vulnerable version
+requests==2.25.0  # Older version with known vulnerabilities
+python-dotenv==0.19.0
+bcrypt==3.2.0
+redis==3.5.3
+pandas==1.3.0  # Older version
+numpy==1.19.5  # Older version