Spaces:

jarif
/

FraudNet-Real-Time-Detection-with-GNNs

Sleeping

App Files Files Community

FraudNet-Real-Time-Detection-with-GNNs / src /streamlit_app.py

jarif

Update src/streamlit_app.py

69b6195 verified about 1 month ago

raw

history blame contribute delete

15 kB

	import streamlit as st
	import pandas as pd
	import numpy as np
	import torch
	import torch.nn as nn
	import torch.nn.functional as F
	from torch_geometric.nn import GATConv
	from torch_geometric.data import Data
	import os

	# Graph attention network used to score transactions for fraud.
	class FraudGNN(nn.Module):
	    """Two GATConv layers followed by a linear head with a sigmoid output.

	    Args:
	        input_dim: Number of features per node.
	        hidden_dim: Per-head output width of each attention layer.
	        output_dim: Width of the final linear layer.
	        heads: Number of attention heads in the first layer (default 4,
	            the value that was previously hard-coded).
	        dropout: Dropout probability used inside both attention layers and
	            between them (default 0.3, the value that was previously
	            hard-coded).
	    """

	    def __init__(self, input_dim, hidden_dim, output_dim, heads=4, dropout=0.3):
	        super().__init__()
	        # Plain float attribute: not a parameter/buffer, so the state dict
	        # keys (conv1, conv2, fc) are unchanged.
	        self.dropout = dropout
	        self.conv1 = GATConv(input_dim, hidden_dim, heads=heads, dropout=dropout)
	        # The first layer's heads are fed to the second layer as one
	        # vector of width hidden_dim * heads.
	        self.conv2 = GATConv(hidden_dim * heads, hidden_dim, heads=1, dropout=dropout)
	        self.fc = nn.Linear(hidden_dim, output_dim)

	    def forward(self, data):
	        """Return sigmoid scores for every node in ``data``.

	        ``data`` must expose ``x`` (node features) and ``edge_index``.
	        Only the trailing axis is squeezed, so with ``output_dim == 1`` the
	        result keeps one entry per node even when the graph has a single
	        node (a bare ``squeeze()`` would return a 0-d tensor in that case).
	        """
	        x, edge_index = data.x, data.edge_index
	        x = F.relu(self.conv1(x, edge_index))
	        x = F.dropout(x, p=self.dropout, training=self.training)
	        x = F.relu(self.conv2(x, edge_index))
	        x = self.fc(x)
	        return torch.sigmoid(x).squeeze(-1)

	# Run on the GPU when torch can see one, otherwise on the CPU.
	device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

	# Load the trained weights and the decision threshold. Any failure is shown
	# in the UI and the script run is halted with st.stop(), so code further
	# down can rely on `model` and `threshold` being defined.
	try:
	    # Look in the current working directory first.
	    model_path = 'fraud_gnn_model.pth'
	    threshold_path = 'optimal_threshold.txt'

	    # Fallback: look next to this script.
	    # NOTE: if the artifacts live in a sibling 'models/' folder instead,
	    # point both paths at os.path.join(os.path.dirname(__file__), '..', 'models', <name>).
	    if not os.path.exists(model_path):
	        model_path = os.path.join(os.path.dirname(__file__), 'fraud_gnn_model.pth')
	    if not os.path.exists(threshold_path):
	        threshold_path = os.path.join(os.path.dirname(__file__), 'optimal_threshold.txt')

	    if not os.path.exists(model_path):
	        raise FileNotFoundError(f"Model file not found at {model_path}. Please upload fraud_gnn_model.pth to the repository root.")
	    if not os.path.exists(threshold_path):
	        raise FileNotFoundError(f"Threshold file not found at {threshold_path}. Please upload optimal_threshold.txt to the repository root.")

	    model = FraudGNN(input_dim=7, hidden_dim=16, output_dim=1).to(device)
	    # weights_only=True restricts unpickling to tensors and plain
	    # containers, which is all a state dict needs; it prevents a tampered
	    # checkpoint from executing arbitrary code during load.
	    state_dict = torch.load(model_path, map_location=device, weights_only=True)
	    model.load_state_dict(state_dict)
	    model.eval()

	    with open(threshold_path, 'r', encoding='utf-8') as f:
	        threshold = float(f.read().strip())
	except FileNotFoundError as e:
	    st.error(f"Error: {e}")
	    st.stop()
	except Exception as e:
	    # Top-level boundary: corrupt checkpoint, shape mismatch, unparsable
	    # threshold, etc. Report and stop rather than continue half-loaded.
	    st.error(f"Error loading model or threshold: {e}")
	    st.stop()

	# Merchant city name -> integer code. Codes are assigned by position in the
	# listing below (0 for the first entry), so the order must not change.
	city_mapping = {
	    city_name: city_code
	    for city_code, city_name in enumerate((
	        'Atlanta', 'Bronx', 'Brooklyn', 'Chicago', 'Dallas', 'Houston',
	        'Indianapolis', 'Las Vegas', 'Los Angeles', 'Louisville', 'Miami',
	        'Minneapolis', 'New York', 'ONLINE', 'Orlando', 'Philadelphia',
	        'San Antonio', 'San Diego', 'San Francisco', 'Tucson', 'other',
	    ))
	}
	# Merchant state / country name -> integer code. Codes are assigned by
	# position in the listing below (0 for the first entry), so the order must
	# not change.
	state_mapping = {
	    region_name: region_code
	    for region_code, region_name in enumerate((
	        'AK', 'AL', 'AR', 'AZ', 'Algeria', 'Antigua and Barbuda', 'Argentina',
	        'Aruba', 'Australia', 'Austria', 'Azerbaijan', 'Bahrain', 'Bangladesh',
	        'Barbados', 'Belarus', 'Belgium', 'Belize', 'Bosnia and Herzegovina',
	        'Brazil', 'CA', 'CO', 'CT', 'Cabo Verde', 'Cambodia', 'Canada',
	        'Central African Republic', 'Chile', 'China', 'Colombia', 'Costa Rica',
	        "Cote d'Ivoire", 'Croatia', 'Czech Republic', 'DC', 'DE', 'Denmark',
	        'Dominica', 'Dominican Republic', 'East Timor (Timor-Leste)', 'Ecuador',
	        'Egypt', 'Eritrea', 'Estonia', 'FL', 'Fiji', 'Finland', 'France',
	        'GA', 'Georgia', 'Germany', 'Ghana', 'Greece', 'Guatemala',
	        'Guyana', 'HI', 'Haiti', 'Honduras', 'Hong Kong', 'Hungary',
	        'IA', 'ID', 'IL', 'IN', 'Iceland', 'India', 'Indonesia',
	        'Ireland', 'Israel', 'Italy', 'Jamaica', 'Japan', 'Jordan',
	        'KS', 'KY', 'Kenya', 'Kosovo', 'Kuwait', 'LA', 'Latvia',
	        'Lebanon', 'Liberia', 'Lithuania', 'Luxembourg', 'MA', 'MD',
	        'ME', 'MI', 'MN', 'MO', 'MS', 'MT', 'Macedonia',
	        'Malaysia', 'Malta', 'Mexico', 'Moldova', 'Monaco', 'Morocco',
	        'Mozambique', 'Myanmar (Burma)', 'NC', 'ND', 'NE', 'NH',
	        'NJ', 'NM', 'NV', 'NY', 'Nauru', 'Netherlands',
	        'New Zealand', 'Nicaragua', 'Niger', 'Nigeria', 'Norway',
	        'OH', 'OK', 'OR', 'Oman', 'PA', 'Pakistan', 'Panama',
	        'Peru', 'Philippines', 'Poland', 'Portugal', 'RI', 'Romania',
	        'Russia', 'SC', 'SD', 'Saudi Arabia', 'Senegal', 'Serbia',
	        'Seychelles', 'Singapore', 'Slovakia', 'Slovenia', 'Somalia',
	        'South Africa', 'South Korea', 'Spain', 'Sri Lanka', 'Sudan',
	        'Suriname', 'Sweden', 'Switzerland', 'Syria', 'TN', 'TX',
	        'Taiwan', 'Thailand', 'The Bahamas', 'Tunisia', 'Turkey',
	        'Tuvalu', 'UT', 'Uganda', 'Ukraine', 'United Arab Emirates',
	        'United Kingdom', 'Uruguay', 'Uzbekistan', 'VA', 'VT',
	        'Vatican City', 'Vietnam', 'WA', 'WI', 'WV', 'WY',
	        'Yemen', 'Zimbabwe',
	    ))
	}

	def _zipcode_edges(zipcodes, zipcode_threshold):
	    """Return a (2, E) integer array of edges between rows with close zipcodes.

	    Every unordered pair (i, j), i < j, whose zipcodes differ by strictly
	    less than ``zipcode_threshold`` contributes the two directed edges
	    i -> j and j -> i, emitted in that order and with pairs visited in
	    row-major order. Considers all n * (n - 1) / 2 pairs at once.
	    """
	    src, dst = np.triu_indices(len(zipcodes), k=1)
	    close = np.abs(zipcodes[src] - zipcodes[dst]) < zipcode_threshold
	    src, dst = src[close], dst[close]
	    forward = np.stack([src, dst], axis=1)
	    backward = np.stack([dst, src], axis=1)
	    # Interleave forward/backward rows, then transpose to the (2, E) layout.
	    return np.stack([forward, backward], axis=1).reshape(-1, 2).T


	def predict_fraud(transactions, zipcode_threshold=1000):
	    """Score a batch of transactions with the module-level ``model``.

	    Args:
	        transactions: Sequence of rows, each holding the seven features in
	            this order: Zipcode, Merchant_State_Code,
	            User_Frequency_Per_Day, Time_Difference_Hours,
	            Merchant_Category_Code, Merchant_City_Code, Transaction_Amount.
	        zipcode_threshold: Two transactions are connected in the graph when
	            their zipcodes differ by less than this value (default 1000).

	    Returns:
	        ``(pred_binary, pred_proba)``: two 1-d numpy arrays. ``pred_proba``
	        is the model output and ``pred_binary`` is 1.0 where that output
	        exceeds the module-level ``threshold``, else 0.0. On any failure the
	        error is shown with ``st.error``, logged, and ``(None, None)`` is
	        returned instead of raising.
	    """
	    import logging

	    try:
	        df = pd.DataFrame(transactions, columns=[
	            'Zipcode', 'Merchant_State_Code', 'User_Frequency_Per_Day',
	            'Time_Difference_Hours', 'Merchant_Category_Code',
	            'Merchant_City_Code', 'Transaction_Amount'
	        ])
	        if df.empty:
	            # Fail with a clear message instead of a dtype conversion error.
	            raise ValueError("No transactions provided.")
	        node_features = torch.tensor(df.values, dtype=torch.float).to(device)

	        # Compare zipcodes in float32, the same precision the node features
	        # are stored in.
	        zipcodes = df['Zipcode'].to_numpy(dtype=np.float32)
	        edges = _zipcode_edges(zipcodes, zipcode_threshold)
	        # A single transaction (or no close pairs) yields an empty (2, 0)
	        # edge index.
	        edge_index = torch.tensor(np.ascontiguousarray(edges), dtype=torch.long).to(device)

	        graph_data = Data(x=node_features, edge_index=edge_index).to(device)

	        if model is None:
	            raise ValueError("Model not loaded. Check if fraud_gnn_model.pth exists.")

	        with torch.no_grad():
	            # atleast_1d guards against a 0-d output for a one-node graph.
	            out = torch.atleast_1d(model(graph_data))
	        pred_binary = (out > threshold).float().cpu().numpy()
	        pred_proba = out.cpu().numpy()

	        return pred_binary, pred_proba
	    except Exception as e:
	        # Boundary of the prediction path: keep the app alive, tell the
	        # user, and leave a traceback in the server log.
	        logging.getLogger(__name__).exception("predict_fraud failed")
	        st.error(f"Error in predict_fraud: {e}")
	        return None, None

	# Inject the page stylesheet as a raw <style> element (hence
	# unsafe_allow_html=True). The stylesheet:
	#   - imports the Poppins font and the Font Awesome 6.4.0 icon CSS,
	#   - defines the `glow` and `icon-pulse` keyframe animations,
	#   - caps `.stApp` at 400px wide and gives it the glowing border,
	#   - restyles text/number/select inputs and buttons,
	#   - defines `.result-box` and `.form-label`, which the HTML snippets
	#     emitted further down this script reference by class name.
	# The block between /* ... */ is an inactive alternative `.stApp` rule with
	# a pastel gradient background.
	st.markdown("""
	<style>
	@import url('https://fonts.googleapis.com/css2?family=Poppins:wght@400;600&display=swap');
	@import url('https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.0/css/all.min.css');

	@keyframes glow {
	0% { box-shadow: 0 0 5px rgba(52, 152, 219, 0.5); }
	50% { box-shadow: 0 0 15px rgba(52, 152, 219, 0.8); }
	100% { box-shadow: 0 0 5px rgba(52, 152, 219, 0.5); }
	}
	@keyframes icon-pulse {
	0% { transform: scale(1); }
	50% { transform: scale(1.1); }
	100% { transform: scale(1); }
	}

	.stApp {
	background: #ffffff;
	max-width: 400px;
	margin: 10px auto;
	padding: 10px;
	font-family: 'Poppins', sans-serif;
	border-radius: 10px;
	box-shadow: 0 6px 20px rgba(0, 0, 0, 0.1);
	border: 2px solid transparent;
	animation: glow 3s infinite;
	}
	/* Alternative Pastel Gradient Design (uncomment to use) */
	/*
	.stApp {
	background: linear-gradient(135deg, #e6f0fa, #f3e5f5);
	max-width: 400px;
	margin: 10px auto;
	padding: 10px;
	font-family: 'Poppins', sans-serif;
	border-radius: 10px;
	box-shadow: 0 6px 20px rgba(0, 0, 0, 0.1);
	border: 2px solid transparent;
	animation: glow 3s infinite;
	}
	*/
	.stTextInput > div > div > input, .stNumberInput > div > div > input, .stSelectbox > div > div > select {
	padding: 5px;
	border: 1px solid #ddd;
	border-radius: 5px;
	font-size: 0.8rem;
	background: #f9f9f9;
	transition: border-color 0.3s, box-shadow 0.3s;
	}
	.stTextInput > div > div > input:focus, .stNumberInput > div > div > input:focus, .stSelectbox > div > div > select:focus {
	outline: none;
	border-color: #3498db;
	box-shadow: 0 0 6px rgba(52, 152, 219, 0.7);
	}
	.stSelectbox > div > div > select {
	appearance: none;
	background: #f9f9f9 url('data:image/svg+xml;utf8,<svg xmlns="http://www.w3.org/2000/svg" width="10" height="10" viewBox="0 0 24 24"><path fill="%23333" d="M7 10l5 5 5-5z"/></svg>') no-repeat right 8px center;
	}
	.stButton > button {
	padding: 6px;
	background: linear-gradient(45deg, #3498db, #ff6f61);
	color: white;
	border: none;
	border-radius: 5px;
	font-size: 0.85rem;
	font-weight: 600;
	width: 100%;
	transition: transform 0.2s, box-shadow 0.3s;
	}
	.stButton > button:hover {
	transform: translateY(-2px);
	box-shadow: 0 4px 12px rgba(255, 111, 97, 0.5);
	}
	.stButton > button:active {
	transform: translateY(0);
	}
	.result-box {
	background: #f1f3f5;
	padding: 8px;
	border-radius: 6px;
	text-align: center;
	margin-top: 8px;
	border: 1px solid #ddd;
	animation: glow 3s infinite;
	}
	.result-box h2 {
	font-size: 1rem;
	color: #2c3e50;
	margin-bottom: 4px;
	}
	.result-box p {
	font-size: 0.8rem;
	color: #7f8c8d;
	}
	.fa-shield-alt {
	animation: icon-pulse 2s infinite;
	}
	.form-label {
	font-weight: 600;
	font-size: 0.75rem;
	color: #2c3e50;
	margin-bottom: 3px;
	display: flex;
	align-items: center;
	}
	.form-label i {
	color: #ff6f61;
	margin-right: 5px;
	transition: color 0.3s;
	}
	.form-label i:hover {
	color: #3498db;
	}
	.stForm {
	display: flex;
	flex-direction: column;
	gap: 6px;
	}
	</style>
	""", unsafe_allow_html=True)

	# Streamlit UI: page title ("FraudShield" with a Font Awesome shield icon)
	# and a one-line usage hint, emitted as raw HTML so the inline styles and
	# the <i> icon element are rendered rather than escaped.
	st.markdown("""
	<h1 style='text-align: center; color: #2c3e50; font-size: 1.5rem; margin-bottom: 8px;'>
	<i class='fas fa-shield-alt' style='color: #ff6f61; margin-right: 8px;'></i>
	FraudShield
	</h1>
	<p style='text-align: center; font-size: 0.8rem; color: #555; margin-bottom: 8px; line-height: 1.4;'>
	Enter transaction details to detect fraud. Provide accurate zip code, merchant details, and amount.
	</p>
	""", unsafe_allow_html=True)

	# Input form. Each widget is preceded by a custom HTML label (icon + text),
	# so the widget's own label is collapsed; it is still given real text
	# rather than "" because Streamlit discourages empty labels for
	# accessibility reasons.
	with st.form(key="fraud_form"):
	    # Sort once; the same list supplies both the options and the default index.
	    state_options = sorted(state_mapping)
	    city_options = sorted(city_mapping)

	    st.markdown("<div class='form-label'><i class='fas fa-map-marker-alt'></i>Zipcode</div>", unsafe_allow_html=True)
	    zipcode = st.number_input("Zipcode", value=91750.0, step=0.01, format="%.2f", key="zipcode", label_visibility="collapsed")

	    st.markdown("<div class='form-label'><i class='fas fa-globe'></i>Merchant State</div>", unsafe_allow_html=True)
	    merchant_state = st.selectbox("Merchant State", state_options, index=state_options.index("TX"), key="state", label_visibility="collapsed")

	    st.markdown("<div class='form-label'><i class='fas fa-user-clock'></i>User Frequency Per Day</div>", unsafe_allow_html=True)
	    user_freq = st.number_input("User Frequency Per Day", value=1.0, step=0.01, format="%.2f", key="freq", label_visibility="collapsed")

	    st.markdown("<div class='form-label'><i class='fas fa-hourglass-half'></i>Time Difference (Hours)</div>", unsafe_allow_html=True)
	    time_diff = st.number_input("Time Difference (Hours)", value=16601.95, step=0.01, format="%.2f", key="time", label_visibility="collapsed")

	    st.markdown("<div class='form-label'><i class='fas fa-store'></i>Merchant Category Code</div>", unsafe_allow_html=True)
	    merchant_category = st.number_input("Merchant Category Code", value=5912.0, step=0.01, format="%.2f", key="category", label_visibility="collapsed")

	    st.markdown("<div class='form-label'><i class='fas fa-city'></i>Merchant City</div>", unsafe_allow_html=True)
	    merchant_city = st.selectbox("Merchant City", city_options, index=city_options.index("Houston"), key="city", label_visibility="collapsed")

	    st.markdown("<div class='form-label'><i class='fas fa-dollar-sign'></i>Transaction Amount</div>", unsafe_allow_html=True)
	    transaction_amount = st.number_input("Transaction Amount", value=128.35, step=0.01, format="%.2f", key="amount", label_visibility="collapsed")

	    submit_button = st.form_submit_button("Predict Fraud", use_container_width=True)

	# On submit: validate the form values, encode state/city to their integer
	# codes, score the single transaction and render the verdict.
	if submit_button:
	    try:
	        numeric_inputs = (zipcode, user_freq, time_diff, merchant_category, transaction_amount)
	        # Test for None rather than truthiness: 0.0 is a legitimate value
	        # (e.g. a zero time difference) and must not be reported as missing.
	        if any(value is None for value in numeric_inputs):
	            st.error("All fields are required.")
	        elif merchant_state not in state_mapping:
	            st.error(f"Invalid Merchant State: {merchant_state}")
	        elif merchant_city not in city_mapping:
	            st.error(f"Invalid Merchant City: {merchant_city}")
	        else:
	            # Key order here is the feature order predict_fraud expects.
	            transaction = {
	                'Zipcode': float(zipcode),
	                'Merchant_State_Code': int(state_mapping[merchant_state]),
	                'User_Frequency_Per_Day': float(user_freq),
	                'Time_Difference_Hours': float(time_diff),
	                'Merchant_Category_Code': float(merchant_category),
	                'Merchant_City_Code': int(city_mapping[merchant_city]),
	                'Transaction_Amount': float(transaction_amount)
	            }
	            transactions = [list(transaction.values())]
	            predictions, probabilities = predict_fraud(transactions)

	            # predict_fraud signals failure by returning (None, None).
	            if predictions is None or probabilities is None:
	                st.error("Prediction failed. Check server logs for details.")
	            else:
	                result = 'Fraud' if predictions[0] == 1 else 'Not Fraud'
	                st.markdown(f"""
	<div class='result-box'>
	<h2>Transaction: {result}</h2>
	<p>Probability of Fraud: {probabilities[0]:.4f}</p>
	</div>
	""", unsafe_allow_html=True)
	    except Exception as e:
	        # UI boundary: surface anything unexpected instead of crashing the run.
	        st.error(f"Error: Invalid input - {str(e)}")