Spaces:
Sleeping
Sleeping
File size: 6,868 Bytes
c7f34f1 5252e41 de96b0e 04eb0d0 fa7427c 365e773 5252e41 c7f34f1 5252e41 de96b0e 5252e41 de96b0e ee3ddaf 04eb0d0 86b7527 04eb0d0 de96b0e 86b7527 de96b0e 365e773 04eb0d0 de96b0e 365e773 de96b0e 365e773 de96b0e 365e773 96faedc 365e773 fa7427c 365e773 5252e41 365e773 44db7f1 7359cdc c7f34f1 7359cdc ee3ddaf de96b0e ee3ddaf 86b7527 7359cdc 86b7527 365e773 86b7527 7359cdc 86b7527 365e773 86b7527 ee3ddaf 7359cdc ee3ddaf 365e773 7359cdc 365e773 7359cdc 365e773 86b7527 7359cdc 86b7527 365e773 86b7527 365e773 7359cdc 04eb0d0 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 |
import streamlit as st
import cv2
import numpy as np
import mediapipe as mp
import joblib
import pandas as pd
from numpy.linalg import norm
import matplotlib.pyplot as plt
import os
st.set_page_config(layout="wide")
# Define the alphabets
all_alphabets = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
excluded_alphabets = 'DMNPTUVXZ'
working_alphabets = ''.join(set(all_alphabets) - set(excluded_alphabets))
# Function to load the Random Forest model
@st.cache_resource
def load_model():
try:
return joblib.load('best_random_forest_model.pkl')
except Exception as e:
st.error(f"Error loading model: {e}")
return None
# Load the model using the cached function
model = load_model()
# Ensure the model is loaded before proceeding
if model is None:
st.stop()
# Function to normalize landmarks
def normalize_landmarks(landmarks):
center = np.mean(landmarks, axis=0)
landmarks_centered = landmarks - center
std_dev = np.std(landmarks_centered, axis=0)
landmarks_normalized = landmarks_centered / std_dev
return np.nan_to_num(landmarks_normalized)
# Function to calculate angles between landmarks
def calculate_angles(landmarks):
angles = []
for i in range(20):
for j in range(i + 1, 21):
vector = landmarks[j] - landmarks[i]
angle_x = np.arccos(np.clip(vector[0] / norm(vector), -1.0, 1.0))
angle_y = np.arccos(np.clip(vector[1] / norm(vector), -1.0, 1.0))
angles.extend([angle_x, angle_y])
return angles
# Function to process image and predict alphabet
def process_and_predict(image):
mp_hands = mp.solutions.hands
with mp_hands.Hands(static_image_mode=True, max_num_hands=1, min_detection_confidence=0.5) as hands:
image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
results = hands.process(image_rgb)
if results.multi_hand_landmarks:
landmarks = np.array([[lm.x, lm.y] for lm in results.multi_hand_landmarks[0].landmark])
landmarks_normalized = normalize_landmarks(landmarks)
angles = calculate_angles(landmarks_normalized)
angle_columns = [f'angle_{i}' for i in range(len(angles))]
angles_df = pd.DataFrame([angles], columns=angle_columns)
probabilities = model.predict_proba(angles_df)[0]
return probabilities, landmarks
return None, None
# Function to plot hand landmarks
def plot_hand_landmarks(landmarks, title):
fig, ax = plt.subplots(figsize=(5, 5))
ax.scatter(landmarks[:, 0], landmarks[:, 1], c='blue', s=20)
mp_hands = mp.solutions.hands
for connection in mp_hands.HAND_CONNECTIONS:
start_idx = connection[0]
end_idx = connection[1]
ax.plot([landmarks[start_idx, 0], landmarks[end_idx, 0]],
[landmarks[start_idx, 1], landmarks[end_idx, 1]], 'r-', linewidth=1)
ax.invert_yaxis()
ax.set_title(title, fontsize=12)
ax.axis('off')
return fig
# README content
readme_content = f"""
## How it works
This ASL Recognition App uses image processing and machine learning to recognize American Sign Language (ASL) hand signs.
1. **Image Upload**: Users can upload an image of an ASL hand sign.
2. **Hand Detection**: The app uses MediaPipe to detect hand landmarks in the image.
3. **Feature Extraction**: Angles between hand landmarks are calculated and normalized.
4. **Prediction**: A Random Forest model predicts the ASL sign based on the extracted features.
5. **Visualization**: The app displays the detected hand landmarks and top predictions.
### Supported Alphabets
The app currently works for the following ASL alphabets:
{', '.join(working_alphabets)}
The app does not support or may not work correctly for:
{', '.join(excluded_alphabets)}
Note: The model's performance may vary and is subject to improvement.
The "View Hand Landmarks" tab allows users to see hand landmarks for pre-loaded ASL signs.
"""
# Streamlit app
st.title("ASL Recognition App")
# Display README content
st.sidebar.markdown(readme_content)
# Create tabs for different functionalities
tab1, tab2 = st.tabs(["Predict ASL Sign", "View Hand Landmarks"])
with tab1:
st.header("Predict ASL Sign")
uploaded_file = st.file_uploader("Upload an image of an ASL sign", type=["jpg", "jpeg", "png"])
if uploaded_file is not None:
try:
image = cv2.imdecode(np.frombuffer(uploaded_file.read(), np.uint8), 1)
if image is not None:
col1, col2 = st.columns(2)
with col1:
st.image(image, caption="Uploaded Image", use_column_width=True)
probabilities, landmarks = process_and_predict(image)
if probabilities is not None and landmarks is not None:
with col2:
st.subheader("Top 5 Predictions:")
top_indices = np.argsort(probabilities)[::-1][:5]
for i in top_indices:
st.write(f"{model.classes_[i]}: {probabilities[i]:.2f}")
fig = plot_hand_landmarks(landmarks, "Detected Hand Landmarks")
st.pyplot(fig)
else:
st.write("No hand detected in the image.")
else:
st.error("Failed to load the image. The file might be corrupted.")
except Exception as e:
st.error(f"An error occurred while processing the image: {str(e)}")
with tab2:
st.header("View Hand Landmarks")
selected_alphabets = st.multiselect("Select alphabets to view landmarks:", list(working_alphabets))
if selected_alphabets:
cols = st.columns(4) # 4 columns for smaller images
for idx, alphabet in enumerate(selected_alphabets):
with cols[idx % 4]:
image_path = os.path.join('asl test set', f'{alphabet.lower()}.jpeg')
if os.path.exists(image_path):
try:
image = cv2.imread(image_path)
if image is not None:
probabilities, landmarks = process_and_predict(image)
if landmarks is not None:
fig = plot_hand_landmarks(landmarks, f"Hand Landmarks for {alphabet}")
st.pyplot(fig)
else:
st.error(f"No hand detected for {alphabet}")
else:
st.error(f"Failed to load image for {alphabet}")
except Exception as e:
st.error(f"Error processing image for {alphabet}")
else:
st.error(f"Image not found for {alphabet}") |