import streamlit as st
import matplotlib.pyplot as plt
import numpy as np
import plotly.graph_objects as go
import plotly.express as px
import cv2
import dlib
from scipy.spatial import distance as dist  # For EAR calculation
import time  # For progress-bar simulation and, potentially, the camera loop

# Constants for detection (from eye_eyebrow_detector.py)
EYEBROW_TO_EYE_VERTICAL_DISTANCE_INCREASE_FACTOR = 0.15
CALIBRATION_FRAMES = 30  # Reduced for faster demo calibration
EAR_THRESHOLD = 0.20
DLIB_SHAPE_PREDICTOR_PATH = "shape_predictor_68_face_landmarks.dat"
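# How these constants are used by the live demo below (added note):
# - EYEBROW_TO_EYE_VERTICAL_DISTANCE_INCREASE_FACTOR: an eyebrow raise is registered when the
#   eyebrow-to-upper-eyelid distance exceeds the calibrated baseline by this fraction (15%).
# - CALIBRATION_FRAMES: number of frames averaged to establish that baseline.
# - EAR_THRESHOLD: eye aspect ratio below which the eyes are treated as closed (a blink).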
# Display states (from eye_eyebrow_detector.py)
STATE_YES = "Yes"
STATE_NO = "No"
STATE_NORMAL = "Normal"
STATE_CALIBRATING = "Calibrating..."

# Landmark indices (from eye_eyebrow_detector.py)
(user_L_eye_indices_start, user_L_eye_indices_end) = (42, 48)
(user_R_eye_indices_start, user_R_eye_indices_end) = (36, 42)
user_L_eye_top_indices = [43, 44]
user_R_eye_top_indices = [37, 38]
user_L_eyebrow_y_calc_indices = range(23, 26)
user_R_eyebrow_y_calc_indices = range(18, 21)
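# Reference (added note): in dlib's 68-point model, indices 0-16 outline the jaw,
# 17-21 the right eyebrow, 22-26 the left eyebrow, 27-35 the nose, 36-41 the right eye,
# 42-47 the left eye, and 48-67 the mouth. The indices above therefore select both eyes,
# their upper eyelids, and the central points of each eyebrow.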
# Initialize dlib's face detector and facial landmark predictor.
# We'll initialize this inside the function or manage its state
# to avoid issues with Streamlit's rerun behavior.

# Stock photo URLs provided
FACIAL_RECOGNITION_IMAGES = [
    "https://pixabay.com/get/g12854d8ea8c029d2435717f123bb6b3afe5f218d14e94f3f1bd28aedaf46900b3c663fdca24e3e5ff97ed203a4ac97bdd34215b14df2f288e76f20602a81cb7d_1280.jpg",
    "https://pixabay.com/get/gf7f1fe0deb60c9c2217635915c6efdd85c3a35b943185d9d7c1b08ead1ec8f6d082af4bfe7a16759a66c38872d828da9c7d28f9ccd6ed4c243f50471537c072d_1280.jpg",
    "https://pixabay.com/get/g5226c742de43d538d1d4dd7e927224fb5be1b7f0f197f568dedc10336530b516cf9b2b3acc3128a4ea78a43ca348c8ce101234788ff131ed802e296e799ddc00_1280.jpg",
    "https://pixabay.com/get/g95d27127dde404c64753341780b8d8871f128bda7dfd5cc3ef287e4e838a1719fc91bc6c4bb24c52ef7cf27dad266a50d474142afe73e25f207ef9ef375c268e_1280.jpg"
]

AI_DATA_VIZ_IMAGES = [
    "https://pixabay.com/get/g155188879e1e171fb82c63d79b2963561b3a77f46ecb38053344fb6a1e236c2f406d66b1c3ae23260573869a9458daee7bfc00f37ef6840fce3a379da3d608e4_1280.jpg",
    "https://pixabay.com/get/g2620d81b6747dcda89657292ec3627897d7e61e906e76de11ecf6babedfcbe40aa0d0608950e1474795bc3a2abc67660ebc08977ba37da526834bec3cf342ba1_1280.jpg",
    "https://pixabay.com/get/ge8f809c48922d0dd956c8896157bd3ea8f606948d2ff72e507bad98b42b823e6409cc2923100bc91b15a499f72263fd8ca0f0949ac5ad2bbbb176f16e3dd0043_1280.jpg",
    "https://pixabay.com/get/g20331e7a18a7b2759056b7a9a73d20c34ff4f863ec4660535f9e5a1b15d3ad4b5b72bb07c385dd3ce154dc23b72fedd5c1eb9e2a4f2b335dfb17534d2b11d8e0_1280.jpg"
]

PRESENTATION_SLIDE_IMAGES = [
    "https://pixabay.com/get/gb57703b075295316bc1711f9701b18b84cfb89f469bb77f415392cc8986f922927cabc9afd50638f77ed51f53bcc62f423b96fbeb5f008abd1017db5b33e9e96_1280.jpg",
    "https://pixabay.com/get/gf4116a5ec8333a8a6bb33dcfe0baecc03580e6f7af95f2895880c9ec051479f3af002ecde96686e5fb6d3a860cf794fef532f27d373318317330932475a8b46c_1280.jpg"
]

def section_header(title):
    """Generate a section header with consistent styling"""
    st.markdown(f'<p class="section-header">{title}</p>', unsafe_allow_html=True)


def render_intro_section():
    """Render the introduction section of the presentation"""
    section_header("Introduction")
    col1, col2 = st.columns([3, 2])

    with col1:
        st.markdown("""
        # Facial Gesture Recognition

        Facial gesture recognition is an exciting field at the intersection of computer vision and artificial intelligence that focuses on identifying and interpreting human facial expressions and movements.

        This presentation explores a system that can:

        - Detect facial landmarks in real-time video
        - Track specific facial movements (eyes, eyebrows)
        - Classify gestures into meaningful actions
        - Respond to gestures with appropriate system actions

        Using a combination of **Convolutional Neural Networks (CNN)** and **Long Short-Term Memory (LSTM)** architecture, this system achieves high accuracy in real-time environments.
        """)

    with col2:
        st.image(FACIAL_RECOGNITION_IMAGES[0], use_container_width=True)
        st.caption("Facial recognition technology")

    st.markdown("---")
    st.markdown("""
    ### Why Facial Gesture Recognition Matters

    Facial gestures provide a natural, intuitive way for humans to communicate with computers:

    - **Accessibility**: Enables computer control for people with mobility limitations
    - **Hands-free Interaction**: Useful in environments where hands are occupied or contaminated
    - **Enhanced User Experience**: Creates more natural human-computer interactions
    - **Safety Applications**: Driver drowsiness detection, attention monitoring
    """)

def render_objective_section():
    """Render the project objectives section"""
    section_header("Project Objective")
    col1, col2 = st.columns([1, 1])

    with col1:
        st.markdown("""
        ## Primary Goal

        Create an intelligent system that automatically recognizes facial gestures from a video stream in real-time.

        ### Key Objectives

        1. **Real-time Processing**: Analyze video frames with minimal latency
        2. **Accurate Detection**: Precisely identify facial landmarks
        3. **Gesture Classification**: Correctly interpret facial movements
        4. **Responsive Output**: Provide immediate feedback based on detected gestures
        """)
        st.markdown("""
        ### Target Gestures

        The system focuses on recognizing the following facial gestures:

        - Eye movements (blinks, winks)
        - Eyebrow movements (raising, furrowing)
        - Normal/neutral state
        """)

    with col2:
        # Add an interactive element - demo selector
        st.markdown("### Interactive Demo")
        gesture_type = st.selectbox(
            "Select a gesture type to learn more",
            ["Eye Movements", "Eyebrow Movements", "Neutral State"]
        )
        if gesture_type == "Eye Movements":
            st.info("Eye movements like blinks and winks can be used for selection or confirmation actions.")
        elif gesture_type == "Eyebrow Movements":
            st.info("Eyebrow raising can indicate interest or be used as a trigger for specific actions.")
        elif gesture_type == "Neutral State":
            st.info("The neutral state serves as the baseline for detecting deviations that signal intentional gestures.")

def render_architecture_section():
    """Render the architecture and methodology section"""
    section_header("Architecture & Methodology")
    st.markdown("""
    ## CNN-LSTM Architecture

    The system employs a hybrid deep learning architecture combining:

    - **Convolutional Neural Networks (CNN)**: Extract spatial features from facial images
    - **Long Short-Term Memory (LSTM)**: Capture temporal patterns in sequential frames
    """)

    # CNN-LSTM architecture diagram (caption only; no diagram image is bundled with the app)
    st.caption("Visual representation of CNN-LSTM architecture")

    col1, col2 = st.columns([1, 1])

    with col1:
        st.markdown("""
        ### CNN Component

        The CNN portion of the architecture:

        - Processes individual video frames
        - Extracts spatial features from facial regions
        - Identifies key patterns in facial structure
        - Uses multiple convolutional layers with pooling
        """)

        # Interactive CNN visualization: a 3x3 grid of mock feature maps for the selected layer
        st.markdown("#### CNN Layer Visualization")
        layer_slider = st.slider("Explore CNN layers", 1, 5, 1)

        fig, axes = plt.subplots(3, 3, figsize=(6, 4))
        fig.suptitle(f"CNN Layer {layer_slider} Feature Maps")
        grid_size = 4
        feature_maps = np.random.rand(grid_size, grid_size, 9)
        for i, ax in enumerate(axes.flat):
            ax.imshow(feature_maps[:, :, i], cmap='viridis')
            ax.axis('off')
        fig.tight_layout()
        st.pyplot(fig)
    with col2:
        st.markdown("""
        ### LSTM Component

        The LSTM network:

        - Processes sequences of CNN-extracted features
        - Captures temporal dependencies between frames
        - Maintains memory of previous facial states
        - Enables detection of dynamic gestures over time
        """)

        # Add interactive LSTM cell visualization
        st.markdown("#### LSTM Cell Structure")
        st.image(
            "https://upload.wikimedia.org/wikipedia/commons/9/93/LSTM_Cell.svg",
            caption="LSTM Cell Structure",
            use_container_width=True
        )

    st.markdown("""
    ### Combined Model Benefits

    This hybrid architecture provides several advantages:

    1. **Spatial-Temporal Processing**: Captures both spatial features and temporal patterns
    2. **Sequence Understanding**: Recognizes gestures that develop over multiple frames
    3. **Contextual Awareness**: Considers the progression of facial movements
    4. **Robust Classification**: Higher accuracy for dynamic gestures
    """)
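    # Added illustrative sketch (not from the original deck): a minimal Keras CNN-LSTM of the
    # kind described above, displayed to the reader with st.code. Layer counts, filter sizes,
    # input shape, and the 3-class output are assumptions chosen purely for demonstration.
    st.markdown("#### Minimal CNN-LSTM Sketch (Keras)")
    st.code(
        '''
from tensorflow.keras import layers, models

def build_cnn_lstm(seq_len=16, height=64, width=64, channels=1, n_classes=3):
    """CNN layers extract per-frame spatial features; the LSTM models the frame sequence."""
    model = models.Sequential([
        layers.Input(shape=(seq_len, height, width, channels)),
        layers.TimeDistributed(layers.Conv2D(32, (3, 3), activation="relu")),
        layers.TimeDistributed(layers.MaxPooling2D((2, 2))),
        layers.TimeDistributed(layers.Conv2D(64, (3, 3), activation="relu")),
        layers.TimeDistributed(layers.MaxPooling2D((2, 2))),
        layers.TimeDistributed(layers.Flatten()),
        layers.LSTM(64),
        layers.Dense(n_classes, activation="softmax"),
    ])
    model.compile(optimizer="adam", loss="categorical_crossentropy", metrics=["accuracy"])
    return model
''',
        language="python",
    )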

def render_process_section():
    """Render the process flow section"""
    section_header("Process Flow")
    st.markdown("""
    ## System Workflow

    The facial gesture recognition process follows these key steps:
    """)

    # Create tabs for the different stages of the process
    tab1, tab2, tab3 = st.tabs(["Data Collection", "Image Processing", "Model Training"])

    with tab1:
        col1, col2 = st.columns([3, 2])
        with col1:
            st.markdown("""
            ### Data Collection

            The system requires a comprehensive dataset of facial gestures:

            - **Video Capture**: Short video clips recorded using a webcam
            - **Gesture Performance**: Subjects perform predefined facial gestures
            - **Labeling**: Each video is labeled with the corresponding gesture
            - **Dataset Diversity**: Multiple subjects, lighting conditions, and angles

            A balanced dataset with varied examples of each gesture is crucial for model generalization.
            """)
        with col2:
            # No image is bundled for this column; the caption is left as a placeholder.
            st.caption("")
    with tab2:
        col1, col2 = st.columns([2, 3])
        with col1:
            st.image(AI_DATA_VIZ_IMAGES[0], use_container_width=True)
            st.caption("Image processing visualization")
        with col2:
            st.markdown("""
            ### Image Processing

            Raw video frames undergo several preprocessing steps:

            1. **Facial Detection**: Locating the face in each frame
            2. **Landmark Extraction**: Identifying 68 key facial points
            3. **Region Isolation**: Extracting regions of interest (eyes, eyebrows)
            4. **Normalization**: Converting to grayscale and normalizing pixel values
            5. **Augmentation**: Generating additional training samples through transformations

            These steps ensure the input data is optimized for the neural network.
            """)

        # Interactive element - landmark detection demo
        show_landmarks = st.checkbox("Show facial landmarks example (eyes and eyebrows)")
        if show_landmarks:
            landmark_cols = st.columns(2)
            with landmark_cols[0]:
                # Mock landmark visualization using matplotlib - focusing on eyes and eyebrows
                fig, ax = plt.subplots(figsize=(4, 4))

                # Create a simple face outline
                circle = plt.Circle((0.5, 0.5), 0.4, fill=False, color='blue')
                ax.add_patch(circle)

                # Add eye landmarks with extra detail (6 points per eye)
                # Left eye
                left_eye_x = [0.30, 0.33, 0.37, 0.41, 0.38, 0.34]
                left_eye_y = [0.60, 0.58, 0.58, 0.60, 0.62, 0.62]
                ax.plot(left_eye_x, left_eye_y, 'g-', linewidth=2)
                for x, y in zip(left_eye_x, left_eye_y):
                    ax.plot(x, y, 'go', markersize=4)

                # Right eye
                right_eye_x = [0.59, 0.62, 0.66, 0.70, 0.67, 0.63]
                right_eye_y = [0.60, 0.58, 0.58, 0.60, 0.62, 0.62]
                ax.plot(right_eye_x, right_eye_y, 'g-', linewidth=2)
                for x, y in zip(right_eye_x, right_eye_y):
                    ax.plot(x, y, 'go', markersize=4)

                # Add detailed eyebrow landmarks (5 points per eyebrow)
                # Left eyebrow
                left_brow_x = [0.25, 0.30, 0.35, 0.40, 0.45]
                left_brow_y = [0.70, 0.72, 0.73, 0.72, 0.70]
                ax.plot(left_brow_x, left_brow_y, 'r-', linewidth=2)
                for x, y in zip(left_brow_x, left_brow_y):
                    ax.plot(x, y, 'ro', markersize=4)

                # Right eyebrow
                right_brow_x = [0.55, 0.60, 0.65, 0.70, 0.75]
                right_brow_y = [0.70, 0.72, 0.73, 0.72, 0.70]
                ax.plot(right_brow_x, right_brow_y, 'r-', linewidth=2)
                for x, y in zip(right_brow_x, right_brow_y):
                    ax.plot(x, y, 'ro', markersize=4)

                # Add labels
                ax.text(0.36, 0.67, "Left Eye", fontsize=9, ha='center')
                ax.text(0.64, 0.67, "Right Eye", fontsize=9, ha='center')
                ax.text(0.35, 0.76, "Left Eyebrow", fontsize=9, ha='center')
                ax.text(0.65, 0.76, "Right Eyebrow", fontsize=9, ha='center')

                ax.set_xlim(0, 1)
                ax.set_ylim(0, 1)
                ax.set_title("Eye and Eyebrow Landmarks")
                ax.axis('off')
                st.pyplot(fig)
            with landmark_cols[1]:
                st.markdown("""
                **Focused Facial Landmarks Analysis:**

                This system specifically analyzes:

                - **Eyes (6 points each)**: Tracks eye openness, blinks, and winking
                - **Eyebrows (5 points each)**: Detects eyebrow raising, furrowing, and expressions

                The shape_predictor_68_face_landmarks model identifies 68 facial landmarks in total, including:

                - 9 points for the nose
                - 20 points for the mouth
                - 17 points for the face contour

                This implementation, however, focuses exclusively on eye and eyebrow movements for gesture recognition.
                """)
    with tab3:
        st.markdown("""
        ### Model Training

        The CNN-LSTM model is trained using the processed dataset:

        1. **Data Splitting**: Division into training, validation, and test sets
        2. **CNN Training**: Learning spatial feature extraction
        3. **LSTM Training**: Learning temporal patterns
        4. **Hyperparameter Tuning**: Optimizing model architecture and parameters
        5. **Validation**: Evaluating performance on the validation set
        6. **Testing**: Final evaluation on the test set
        """)
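        # Added illustrative sketch (not from the original deck): one common way to perform
        # step 1 (data splitting) with scikit-learn. The dummy shapes, split ratios, and
        # variable names are assumptions for demonstration only.
        st.code(
            '''
import numpy as np
from sklearn.model_selection import train_test_split

X = np.random.rand(200, 16, 64, 64, 1)   # 200 dummy clips of 16 frames each
y = np.random.randint(0, 3, size=200)    # 3 gesture classes

# 70% train, 15% validation, 15% test, stratified by gesture label
X_train, X_tmp, y_train, y_tmp = train_test_split(X, y, test_size=0.30, stratify=y, random_state=42)
X_val, X_test, y_val, y_test = train_test_split(X_tmp, y_tmp, test_size=0.50, stratify=y_tmp, random_state=42)
''',
            language="python",
        )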
        # Interactive training visualization
        st.markdown("#### Training Visualization")

        # Mock training metrics
        epochs = 50
        train_loss = 1.5 * np.exp(-0.05 * np.arange(epochs)) + 0.1 * np.random.rand(epochs)
        val_loss = 1.7 * np.exp(-0.04 * np.arange(epochs)) + 0.15 * np.random.rand(epochs)
        train_acc = 1 - train_loss * 0.5
        val_acc = 1 - val_loss * 0.5

        # Create interactive plot
        metric = st.radio("Select metric to visualize", ["Loss", "Accuracy"])
        if metric == "Loss":
            fig = px.line(
                x=list(range(1, epochs + 1)),
                y=[train_loss, val_loss],
                labels={"x": "Epoch", "y": "Loss"},
                title="Training and Validation Loss",
                line_shape="spline"
            )
            fig.update_layout(legend_title_text="Legend")
            fig.add_scatter(x=list(range(1, epochs + 1)), y=train_loss, name="Training Loss", line=dict(color="blue"))
            fig.add_scatter(x=list(range(1, epochs + 1)), y=val_loss, name="Validation Loss", line=dict(color="red"))
        else:
            fig = px.line(
                x=list(range(1, epochs + 1)),
                y=[train_acc, val_acc],
                labels={"x": "Epoch", "y": "Accuracy"},
                title="Training and Validation Accuracy",
                line_shape="spline"
            )
            fig.update_layout(legend_title_text="Legend")
            fig.add_scatter(x=list(range(1, epochs + 1)), y=train_acc, name="Training Accuracy", line=dict(color="green"))
            fig.add_scatter(x=list(range(1, epochs + 1)), y=val_acc, name="Validation Accuracy", line=dict(color="orange"))
        st.plotly_chart(fig)

def render_technology_section():
    """Render the technologies section"""
    section_header("Technologies")
    st.markdown("""
    ## Core Technologies

    The facial gesture recognition system relies on several key technologies:
    """)

    col1, col2, col3 = st.columns(3)

    with col1:
        st.markdown("""
        ### Python Ecosystem

        - **Python**: Core programming language
        - **NumPy**: Numerical operations
        - **Pandas**: Data management
        - **Matplotlib/Plotly**: Visualization
        """)
        st.image(AI_DATA_VIZ_IMAGES[2], use_container_width=True)
        st.caption("Python data analysis visualization")

    with col2:
        st.markdown("""
        ### Deep Learning

        - **TensorFlow/Keras**: Neural network framework
        - **CNN**: Spatial feature extraction
        - **LSTM**: Temporal sequence processing
        - **Transfer Learning**: Leveraging pre-trained models
        """)

        # Create an interactive visualization of the model architecture
        st.markdown("#### Model Architecture")
        fig = go.Figure()

        # Rectangles representing the layers of the CNN-LSTM stack
        layers = [
            {"name": "Input", "width": 0.8, "height": 0.15, "x": 0.5, "y": 0.9, "color": "lightblue"},
            {"name": "Conv2D", "width": 0.8, "height": 0.1, "x": 0.5, "y": 0.75, "color": "lightgreen"},
            {"name": "MaxPooling", "width": 0.7, "height": 0.1, "x": 0.5, "y": 0.63, "color": "lightgreen"},
            {"name": "Conv2D", "width": 0.6, "height": 0.1, "x": 0.5, "y": 0.51, "color": "lightgreen"},
            {"name": "MaxPooling", "width": 0.5, "height": 0.1, "x": 0.5, "y": 0.39, "color": "lightgreen"},
            {"name": "LSTM", "width": 0.8, "height": 0.1, "x": 0.5, "y": 0.27, "color": "lightpink"},
            {"name": "Dense", "width": 0.6, "height": 0.1, "x": 0.5, "y": 0.15, "color": "lightyellow"},
            {"name": "Output", "width": 0.4, "height": 0.1, "x": 0.5, "y": 0.05, "color": "lightblue"}
        ]

        for idx, layer in enumerate(layers):
            # Add layer rectangle
            fig.add_shape(
                type="rect",
                x0=layer["x"] - layer["width"] / 2,
                y0=layer["y"] - layer["height"] / 2,
                x1=layer["x"] + layer["width"] / 2,
                y1=layer["y"] + layer["height"] / 2,
                line=dict(color="black"),
                fillcolor=layer["color"]
            )
            # Add layer name
            fig.add_annotation(
                x=layer["x"],
                y=layer["y"],
                text=layer["name"],
                showarrow=False
            )
            # Add connection lines between layers (except after the last layer)
            if idx < len(layers) - 1:
                next_layer = layers[idx + 1]
                fig.add_shape(
                    type="line",
                    x0=layer["x"],
                    y0=layer["y"] - layer["height"] / 2,
                    x1=next_layer["x"],
                    y1=next_layer["y"] + next_layer["height"] / 2,
                    line=dict(color="gray", width=1)
                )

        fig.update_layout(
            showlegend=False,
            width=300,
            height=500,
            xaxis=dict(showgrid=False, zeroline=False, showticklabels=False, range=[0, 1]),
            yaxis=dict(showgrid=False, zeroline=False, showticklabels=False, range=[0, 1])
        )
        st.plotly_chart(fig)

    with col3:
        st.markdown("""
        ### Computer Vision

        - **OpenCV**: Image and video processing
        - **Dlib**: Facial landmark detection
        - **MediaPipe**: Real-time face mesh tracking
        - **Image augmentation**: Diverse training samples
        """)
        st.image(AI_DATA_VIZ_IMAGES[3], use_container_width=True)
        st.caption("Computer vision analysis")

    st.markdown("---")

    # Technology performance comparison
    st.markdown("### Performance Comparison")

    # Create a mock performance comparison chart
    performance_data = {
        'Method': ['Traditional CV', 'CNN Only', 'LSTM Only', 'CNN-LSTM'],
        'Accuracy': [65, 82, 78, 93],
        'Speed (FPS)': [45, 28, 32, 25],
        'Memory (MB)': [120, 350, 280, 420]
    }
    metric_to_show = st.selectbox("Select performance metric", ["Accuracy", "Speed (FPS)", "Memory (MB)"])
    fig = px.bar(
        performance_data,
        x='Method',
        y=metric_to_show,
        color='Method',
        text=performance_data[metric_to_show],
        title=f"Performance Comparison - {metric_to_show}"
    )
    # Customize the chart appearance
    fig.update_traces(texttemplate='%{text}', textposition='outside')
    fig.update_layout(uniformtext_minsize=8, uniformtext_mode='hide')
    st.plotly_chart(fig)

def render_applications_section():
    """Render the applications section"""
    section_header("Applications")
    st.markdown("""
    ## Potential Applications

    Facial gesture recognition technology has numerous practical applications across various domains:
    """)

    col1, col2 = st.columns([1, 1])

    with col1:
        st.markdown("""
        ### Human-Computer Interaction

        - **Hands-free Computing**: Control computers without physical input devices
        - **Accessible Technology**: Enable computer usage for people with mobility limitations
        - **Interactive Presentations**: Control slides and demonstrations with facial gestures
        - **Gaming**: Enhanced immersion through facial expression controls
        """)
        st.markdown("""
        ### Healthcare

        - **Patient Monitoring**: Track patient attentiveness or consciousness
        - **Rehabilitation**: Provide feedback for facial exercises
        - **Pain Assessment**: Detect discomfort through facial expressions
        - **Mental Health**: Analyze emotional responses during therapy
        """)

    with col2:
        st.markdown("""
        ### Automotive Applications

        - **Driver Monitoring**: Detect drowsiness or distraction
        - **In-car Controls**: Adjust settings with facial gestures
        - **Personalized Experience**: Recognize driver identity and preferences
        - **Security**: Additional authentication layer
        """)
        st.markdown("""
        ### Accessibility

        - **Assistive Technology**: Enable computer control for users with mobility impairments
        - **Communication Aids**: Help non-verbal individuals express themselves
        - **Smart Home Control**: Manage home automation with facial gestures
        - **Public Kiosks**: Enable gesture-based interaction with public information systems
        """)

    # Interactive application explorer
    st.markdown("### Application Explorer")
    application_area = st.selectbox(
        "Select an application area to explore",
        ["Human-Computer Interaction", "Healthcare", "Automotive", "Accessibility", "Education"]
    )

    if application_area == "Human-Computer Interaction":
        st.info("""
        **Featured Application: Gesture-Controlled Presentation System**

        A system that allows presenters to control slideshows using facial gestures:

        - Eye blinks to advance slides
        - Eyebrow raises to go back
        - Head nods/shakes to confirm/cancel actions

        This enables hands-free presentations, allowing speakers to maintain natural gestures while speaking.
        """)
    elif application_area == "Healthcare":
        st.info("""
        **Featured Application: Pain Assessment Tool**

        A system that monitors patient facial expressions to detect signs of pain:

        - Real-time monitoring without requiring verbal communication
        - Particularly useful for non-verbal patients or those with cognitive impairments
        - Alerts medical staff when pain indicators are detected
        - Maintains a log of pain expression events for medical review
        """)
    elif application_area == "Automotive":
        st.info("""
        **Featured Application: Driver Alertness Monitoring**

        A system that detects signs of driver fatigue or distraction:

        - Monitors eye closure duration and blink rate
        - Detects head nodding indicative of drowsiness
        - Provides audio alerts when fatigue signs are detected
        - Suggests breaks when sustained fatigue patterns are observed
        """)
    elif application_area == "Accessibility":
        st.info("""
        **Featured Application: Facial Gesture Computer Control**

        A complete computer control system for people with limited mobility:

        - Cursor movement through slight head movements
        - Selection through eye blinks or eyebrow raises
        - Scrolling through specific eye movements
        - Text input through an on-screen keyboard navigated by facial gestures
        """)
    elif application_area == "Education":
        st.info("""
        **Featured Application: Student Engagement Analytics**

        A system that monitors student facial expressions during online learning:

        - Tracks attentiveness and engagement through eye movements
        - Identifies confusion through facial expressions
        - Provides analytics to instructors about student engagement
        - Helps identify content that may need additional explanation
        """)

    # Conclusion
    st.markdown("---")
    st.markdown("""
    ## Conclusion

    Facial gesture recognition using AI represents a significant advancement in human-computer interaction. By combining CNN and LSTM architectures, we've created a system that can:

    - Accurately recognize facial gestures in real-time
    - Process video streams with minimal latency
    - Adapt to different users and environments
    - Enable new possibilities for accessibility and interaction

    This technology continues to evolve, with ongoing improvements in accuracy, speed, and adaptability.
    """)
    st.success("Thank you for exploring this presentation on Facial Gesture Recognition using AI!")

    # Using the SVG file from assets instead of embedding it directly
    st.image("assets/workflow_diagram.svg")

def get_landmark_point_from_detector(landmarks, index):
    """Helper function from eye_eyebrow_detector.py"""
    return (landmarks.part(index).x, landmarks.part(index).y)


def eye_aspect_ratio_from_detector(eye_pts):
    """Helper function from eye_eyebrow_detector.py"""
    A = dist.euclidean(eye_pts[1], eye_pts[5])
    B = dist.euclidean(eye_pts[2], eye_pts[4])
    C = dist.euclidean(eye_pts[0], eye_pts[3])
    ear_val = (A + B) / (2.0 * C)
    return ear_val
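# Background note (added): for eye landmarks p1..p6 in dlib's ordering, the function above
# computes EAR = (||p2 - p6|| + ||p3 - p5||) / (2 * ||p1 - p4||). The ratio stays roughly
# constant while the eye is open and drops toward zero during a blink, which is why the
# fixed EAR_THRESHOLD defined earlier is sufficient to detect eye closure.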

def initialize_dlib_components():
    """Initializes dlib detector and predictor."""
    try:
        detector = dlib.get_frontal_face_detector()
        predictor = dlib.shape_predictor(DLIB_SHAPE_PREDICTOR_PATH)
        return detector, predictor
    except RuntimeError as e:
        st.error(f"Failed to load dlib model: {e}. Please ensure '{DLIB_SHAPE_PREDICTOR_PATH}' is in the correct path.")
        return None, None
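# Optional alternative (added note, not in the original): because the landmark predictor file is
# large, loading could also be wrapped in st.cache_resource so it happens once per process, e.g.:
#
#     @st.cache_resource
#     def load_dlib_components():
#         return dlib.get_frontal_face_detector(), dlib.shape_predictor(DLIB_SHAPE_PREDICTOR_PATH)
#
# The session_state approach used below achieves a similar effect for each browser session.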

def render_live_demo_section():
    """Render the live facial gesture recognition demo section"""
    section_header("Live Facial Gesture Demo")
    st.write("This demo uses your webcam to perform real-time eye and eyebrow gesture detection.")
    st.warning("Ensure you have a webcam connected and have granted permission if prompted by your browser. Also, make sure `shape_predictor_68_face_landmarks.dat` is in the application's root directory.")

    if 'detector' not in st.session_state or 'predictor' not in st.session_state:
        st.session_state.detector, st.session_state.predictor = initialize_dlib_components()
    if st.session_state.detector is None or st.session_state.predictor is None:
        st.error("Dlib components could not be initialized. The demo cannot run.")
        return

    # Initialize session state variables for the demo
    if 'run_demo' not in st.session_state:
        st.session_state.run_demo = False
    if 'calibration_counter' not in st.session_state:
        st.session_state.calibration_counter = 0
    if 'calibration_data_user_L_eyebrow_y' not in st.session_state:
        st.session_state.calibration_data_user_L_eyebrow_y = []
    if 'calibration_data_user_R_eyebrow_y' not in st.session_state:
        st.session_state.calibration_data_user_R_eyebrow_y = []
    if 'calibration_data_user_L_eye_top_y' not in st.session_state:
        st.session_state.calibration_data_user_L_eye_top_y = []
    if 'calibration_data_user_R_eye_top_y' not in st.session_state:
        st.session_state.calibration_data_user_R_eye_top_y = []
    if 'normal_user_L_eyebrow_y_avg' not in st.session_state:
        st.session_state.normal_user_L_eyebrow_y_avg = 0
    if 'normal_user_R_eyebrow_y_avg' not in st.session_state:
        st.session_state.normal_user_R_eyebrow_y_avg = 0
    if 'normal_user_L_eye_top_y_avg' not in st.session_state:
        st.session_state.normal_user_L_eye_top_y_avg = 0
    if 'normal_user_R_eye_top_y_avg' not in st.session_state:
        st.session_state.normal_user_R_eye_top_y_avg = 0
    if 'normal_dist_L_eyebrow_to_eye' not in st.session_state:
        st.session_state.normal_dist_L_eyebrow_to_eye = 0
    if 'normal_dist_R_eyebrow_to_eye' not in st.session_state:
        st.session_state.normal_dist_R_eyebrow_to_eye = 0
    if 'current_state_demo' not in st.session_state:
        st.session_state.current_state_demo = STATE_CALIBRATING
    if 'camera_active' not in st.session_state:
        st.session_state.camera_active = False

    col1, col2 = st.columns(2)
    with col1:
        if st.button("Start/Restart Demo"):
            st.session_state.run_demo = True
            st.session_state.camera_active = True
            # Reset calibration
            st.session_state.calibration_counter = 0
            st.session_state.calibration_data_user_L_eyebrow_y = []
            st.session_state.calibration_data_user_R_eyebrow_y = []
            st.session_state.calibration_data_user_L_eye_top_y = []
            st.session_state.calibration_data_user_R_eye_top_y = []
            st.session_state.current_state_demo = STATE_CALIBRATING
            st.info("Calibration started. Look at the camera with a normal expression.")
    with col2:
        if st.button("Stop Demo"):
            st.session_state.run_demo = False
            st.session_state.camera_active = False
    if st.session_state.run_demo and st.session_state.camera_active:
        # Placeholder for the video feed
        frame_placeholder = st.empty()

        # Attempt to open the webcam. The capture object is kept in session_state so it
        # persists across Streamlit reruns; it is released when the demo stops.
        if 'cap' not in st.session_state or not st.session_state.cap.isOpened():
            st.session_state.cap = cv2.VideoCapture(0)

        if not st.session_state.cap.isOpened():
            st.error("Cannot open webcam.")
            st.session_state.run_demo = False  # Stop the demo if the camera fails
            return

        detector = st.session_state.detector
        predictor = st.session_state.predictor

        while st.session_state.run_demo and st.session_state.cap.isOpened():
            ret, frame = st.session_state.cap.read()
            if not ret:
                st.error("Failed to grab frame from webcam.")
                break

            gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
            faces = detector(gray)
            display_text = st.session_state.current_state_demo

            if st.session_state.calibration_counter < CALIBRATION_FRAMES:
                st.session_state.current_state_demo = STATE_CALIBRATING
                display_text = f"{STATE_CALIBRATING} ({st.session_state.calibration_counter}/{CALIBRATION_FRAMES})"

            for face in faces:
                landmarks = predictor(gray, face)

                # Average vertical (y) positions of the eyebrow and upper-eyelid landmarks
                user_L_eyebrow_current_y_pts = [landmarks.part(i).y for i in user_L_eyebrow_y_calc_indices]
                current_user_L_eyebrow_y_avg = np.mean(user_L_eyebrow_current_y_pts) if user_L_eyebrow_current_y_pts else 0
                user_R_eyebrow_current_y_pts = [landmarks.part(i).y for i in user_R_eyebrow_y_calc_indices]
                current_user_R_eyebrow_y_avg = np.mean(user_R_eyebrow_current_y_pts) if user_R_eyebrow_current_y_pts else 0
                user_L_eye_top_current_y_pts = [landmarks.part(i).y for i in user_L_eye_top_indices]
                current_user_L_eye_top_y_avg = np.mean(user_L_eye_top_current_y_pts) if user_L_eye_top_current_y_pts else 0
                user_R_eye_top_current_y_pts = [landmarks.part(i).y for i in user_R_eye_top_indices]
                current_user_R_eye_top_y_avg = np.mean(user_R_eye_top_current_y_pts) if user_R_eye_top_current_y_pts else 0

                # Eye aspect ratio (EAR) for blink detection
                user_L_eye_all_pts = np.array([get_landmark_point_from_detector(landmarks, i) for i in range(user_L_eye_indices_start, user_L_eye_indices_end)], dtype="int")
                user_R_eye_all_pts = np.array([get_landmark_point_from_detector(landmarks, i) for i in range(user_R_eye_indices_start, user_R_eye_indices_end)], dtype="int")
                left_ear = eye_aspect_ratio_from_detector(user_L_eye_all_pts)
                right_ear = eye_aspect_ratio_from_detector(user_R_eye_all_pts)
                avg_ear = (left_ear + right_ear) / 2.0

                if st.session_state.calibration_counter < CALIBRATION_FRAMES:
                    # Calibration phase: accumulate baseline measurements
                    st.session_state.calibration_data_user_L_eyebrow_y.append(current_user_L_eyebrow_y_avg)
                    st.session_state.calibration_data_user_R_eyebrow_y.append(current_user_R_eyebrow_y_avg)
                    st.session_state.calibration_data_user_L_eye_top_y.append(current_user_L_eye_top_y_avg)
                    st.session_state.calibration_data_user_R_eye_top_y.append(current_user_R_eye_top_y_avg)
                    st.session_state.calibration_counter += 1
                    display_text = f"{STATE_CALIBRATING} ({st.session_state.calibration_counter}/{CALIBRATION_FRAMES})"

                    if st.session_state.calibration_counter == CALIBRATION_FRAMES:
                        # Calibration complete: compute the "normal" baselines
                        st.session_state.normal_user_L_eyebrow_y_avg = np.mean(st.session_state.calibration_data_user_L_eyebrow_y) if st.session_state.calibration_data_user_L_eyebrow_y else 0
                        st.session_state.normal_user_R_eyebrow_y_avg = np.mean(st.session_state.calibration_data_user_R_eyebrow_y) if st.session_state.calibration_data_user_R_eyebrow_y else 0
                        st.session_state.normal_user_L_eye_top_y_avg = np.mean(st.session_state.calibration_data_user_L_eye_top_y) if st.session_state.calibration_data_user_L_eye_top_y else 0
                        st.session_state.normal_user_R_eye_top_y_avg = np.mean(st.session_state.calibration_data_user_R_eye_top_y) if st.session_state.calibration_data_user_R_eye_top_y else 0
                        st.session_state.normal_dist_L_eyebrow_to_eye = st.session_state.normal_user_L_eye_top_y_avg - st.session_state.normal_user_L_eyebrow_y_avg
                        st.session_state.normal_dist_R_eyebrow_to_eye = st.session_state.normal_user_R_eye_top_y_avg - st.session_state.normal_user_R_eyebrow_y_avg
                        st.session_state.current_state_demo = STATE_NORMAL
                        display_text = STATE_NORMAL
                        st.success("Calibration finished.")
                else:  # Detection phase
                    st.session_state.current_state_demo = STATE_NORMAL  # Default to normal after calibration
                    display_text = STATE_NORMAL
                    if st.session_state.normal_dist_L_eyebrow_to_eye != 0 and st.session_state.normal_dist_R_eyebrow_to_eye != 0:
                        if avg_ear < EAR_THRESHOLD:
                            # Eyes closed (blink) -> "Yes"
                            st.session_state.current_state_demo = STATE_YES
                            display_text = STATE_YES
                        else:
                            # Eyebrow raise -> "No" when both eyebrow-to-eyelid distances exceed
                            # the calibrated baseline by the configured factor
                            current_dist_L = current_user_L_eye_top_y_avg - current_user_L_eyebrow_y_avg
                            current_dist_R = current_user_R_eye_top_y_avg - current_user_R_eyebrow_y_avg
                            threshold_dist_L = st.session_state.normal_dist_L_eyebrow_to_eye * (1 + EYEBROW_TO_EYE_VERTICAL_DISTANCE_INCREASE_FACTOR)
                            threshold_dist_R = st.session_state.normal_dist_R_eyebrow_to_eye * (1 + EYEBROW_TO_EYE_VERTICAL_DISTANCE_INCREASE_FACTOR)
                            # Guard against non-positive baselines (can happen with unusual landmark geometry)
                            if st.session_state.normal_dist_L_eyebrow_to_eye <= 0:
                                threshold_dist_L = st.session_state.normal_dist_L_eyebrow_to_eye + abs(st.session_state.normal_dist_L_eyebrow_to_eye * EYEBROW_TO_EYE_VERTICAL_DISTANCE_INCREASE_FACTOR) + 5
                            if st.session_state.normal_dist_R_eyebrow_to_eye <= 0:
                                threshold_dist_R = st.session_state.normal_dist_R_eyebrow_to_eye + abs(st.session_state.normal_dist_R_eyebrow_to_eye * EYEBROW_TO_EYE_VERTICAL_DISTANCE_INCREASE_FACTOR) + 5
                            if current_dist_L > threshold_dist_L and current_dist_R > threshold_dist_R:
                                st.session_state.current_state_demo = STATE_NO
                                display_text = STATE_NO

            # Display the detected state on the frame
            color = (255, 255, 0)  # Default for Normal/Calibrating
            if st.session_state.current_state_demo == STATE_YES:
                color = (0, 255, 0)
            elif st.session_state.current_state_demo == STATE_NO:
                color = (0, 0, 255)
            # Make the text larger and position it near the top of the frame
            cv2.putText(frame, display_text, (frame.shape[1] // 2 - 100, 50), cv2.FONT_HERSHEY_SIMPLEX, 1.5, color, 3, cv2.LINE_AA)

            # Convert the frame to RGB for Streamlit
            frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            frame_placeholder.image(frame_rgb, channels="RGB")
            # A small time.sleep() here would smooth the video; omitted for faster processing.

        # Release the camera when the demo stops or an error occurs
        if 'cap' in st.session_state and st.session_state.cap.isOpened():
            st.session_state.cap.release()
        if st.session_state.camera_active is False and 'cap' in st.session_state:  # explicitly stopped
            del st.session_state.cap
    elif not st.session_state.run_demo and st.session_state.camera_active:
        # This case handles when Stop Demo is clicked, ensuring the camera is released.
        if 'cap' in st.session_state and st.session_state.cap.isOpened():
            st.session_state.cap.release()
            del st.session_state.cap  # Ensure it is re-initialized if started again
        st.session_state.camera_active = False
        st.info("Live demo stopped.")
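# Gesture mapping used by the live demo above (added summary): "Yes" is signalled by eye
# closure (average EAR dropping below EAR_THRESHOLD); "No" by raising both eyebrows far enough
# that the eyebrow-to-upper-eyelid distance exceeds the calibrated baseline by
# EYEBROW_TO_EYE_VERTICAL_DISTANCE_INCREASE_FACTOR; anything else is reported as "Normal".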
# Example of how to call this new section in a main app structure:
#
# if __name__ == "__main__":
#     st.set_page_config(layout="wide")
#     # Apply custom CSS (optional)
#     # st.markdown(CUSTOM_CSS, unsafe_allow_html=True)
#
#     st.sidebar.title("Navigation")
#     page = st.sidebar.radio(
#         "Go to",
#         ["Introduction", "Objective", "Architecture", "Process Flow",
#          "Technologies", "Applications", "Live Demo"],
#     )
#
#     if page == "Introduction":
#         render_intro_section()
#     elif page == "Objective":
#         render_objective_section()
#     elif page == "Architecture":
#         render_architecture_section()
#     elif page == "Process Flow":
#         render_process_section()
#     elif page == "Technologies":
#         render_technology_section()
#     elif page == "Applications":
#         render_applications_section()
#     elif page == "Live Demo":
#         render_live_demo_section()  # New section wired into the navigation
#
# This is just one way to structure the main app; the key point is that
# render_live_demo_section() can now be called like any other section.