File size: 6,868 Bytes
c7f34f1
 
 
 
5252e41
 
 
de96b0e
 
04eb0d0
fa7427c
365e773
 
 
 
 
 
5252e41
 
 
 
 
 
 
 
 
 
 
 
 
 
 
c7f34f1
5252e41
 
 
 
 
 
de96b0e
5252e41
 
 
 
 
 
 
 
 
 
 
 
de96b0e
ee3ddaf
04eb0d0
 
 
 
86b7527
04eb0d0
 
 
 
 
 
 
 
 
 
de96b0e
86b7527
de96b0e
 
 
365e773
 
04eb0d0
 
de96b0e
 
 
365e773
de96b0e
365e773
de96b0e
 
 
365e773
 
 
96faedc
365e773
 
 
 
 
 
 
 
 
 
 
 
fa7427c
365e773
 
 
 
 
 
 
 
 
5252e41
 
365e773
 
44db7f1
7359cdc
 
c7f34f1
7359cdc
ee3ddaf
 
de96b0e
ee3ddaf
86b7527
7359cdc
86b7527
365e773
 
 
 
86b7527
7359cdc
86b7527
365e773
 
 
 
 
86b7527
 
 
 
 
 
 
 
 
ee3ddaf
7359cdc
 
ee3ddaf
365e773
7359cdc
 
365e773
7359cdc
365e773
86b7527
7359cdc
86b7527
 
 
 
 
 
 
 
 
 
365e773
86b7527
365e773
7359cdc
04eb0d0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
import streamlit as st
import cv2
import numpy as np
import mediapipe as mp
import joblib
import pandas as pd
from numpy.linalg import norm
import matplotlib.pyplot as plt
import os

st.set_page_config(layout="wide")

# Define the alphabets
all_alphabets = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
excluded_alphabets = 'DMNPTUVXZ'
working_alphabets = ''.join(set(all_alphabets) - set(excluded_alphabets))

# Function to load the Random Forest model
@st.cache_resource
def load_model():
    try:
        return joblib.load('best_random_forest_model.pkl')
    except Exception as e:
        st.error(f"Error loading model: {e}")
        return None

# Load the model using the cached function
model = load_model()

# Ensure the model is loaded before proceeding
if model is None:
    st.stop()

# Function to normalize landmarks
def normalize_landmarks(landmarks):
    center = np.mean(landmarks, axis=0)
    landmarks_centered = landmarks - center
    std_dev = np.std(landmarks_centered, axis=0)
    landmarks_normalized = landmarks_centered / std_dev
    return np.nan_to_num(landmarks_normalized)

# Function to calculate angles between landmarks
def calculate_angles(landmarks):
    angles = []
    for i in range(20):
        for j in range(i + 1, 21):
            vector = landmarks[j] - landmarks[i]
            angle_x = np.arccos(np.clip(vector[0] / norm(vector), -1.0, 1.0))
            angle_y = np.arccos(np.clip(vector[1] / norm(vector), -1.0, 1.0))
            angles.extend([angle_x, angle_y])
    return angles

# Function to process image and predict alphabet
def process_and_predict(image):
    mp_hands = mp.solutions.hands
    with mp_hands.Hands(static_image_mode=True, max_num_hands=1, min_detection_confidence=0.5) as hands:
        image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        results = hands.process(image_rgb)
        
        if results.multi_hand_landmarks:
            landmarks = np.array([[lm.x, lm.y] for lm in results.multi_hand_landmarks[0].landmark])
            landmarks_normalized = normalize_landmarks(landmarks)
            angles = calculate_angles(landmarks_normalized)
            
            angle_columns = [f'angle_{i}' for i in range(len(angles))]
            angles_df = pd.DataFrame([angles], columns=angle_columns)
            
            probabilities = model.predict_proba(angles_df)[0]
            return probabilities, landmarks
    
    return None, None

# Function to plot hand landmarks
def plot_hand_landmarks(landmarks, title):
    fig, ax = plt.subplots(figsize=(5, 5))
    ax.scatter(landmarks[:, 0], landmarks[:, 1], c='blue', s=20)
    mp_hands = mp.solutions.hands
    for connection in mp_hands.HAND_CONNECTIONS:
        start_idx = connection[0]
        end_idx = connection[1]
        ax.plot([landmarks[start_idx, 0], landmarks[end_idx, 0]],
                [landmarks[start_idx, 1], landmarks[end_idx, 1]], 'r-', linewidth=1)
    ax.invert_yaxis()
    ax.set_title(title, fontsize=12)
    ax.axis('off')
    return fig

# README content
readme_content = f"""
## How it works

This ASL Recognition App uses image processing and machine learning to recognize American Sign Language (ASL) hand signs.

1. **Image Upload**: Users can upload an image of an ASL hand sign.
2. **Hand Detection**: The app uses MediaPipe to detect hand landmarks in the image.
3. **Feature Extraction**: Angles between hand landmarks are calculated and normalized.
4. **Prediction**: A Random Forest model predicts the ASL sign based on the extracted features.
5. **Visualization**: The app displays the detected hand landmarks and top predictions.

### Supported Alphabets

The app currently works for the following ASL alphabets:
{', '.join(working_alphabets)}

The app does not support or may not work correctly for:
{', '.join(excluded_alphabets)}

Note: The model's performance may vary and is subject to improvement.

The "View Hand Landmarks" tab allows users to see hand landmarks for pre-loaded ASL signs.
"""

# Streamlit app
st.title("ASL Recognition App")

# Display README content
st.sidebar.markdown(readme_content)

# Create tabs for different functionalities
tab1, tab2 = st.tabs(["Predict ASL Sign", "View Hand Landmarks"])

with tab1:
    st.header("Predict ASL Sign")
    uploaded_file = st.file_uploader("Upload an image of an ASL sign", type=["jpg", "jpeg", "png"])

    if uploaded_file is not None:
        try:
            image = cv2.imdecode(np.frombuffer(uploaded_file.read(), np.uint8), 1)
            if image is not None:
                col1, col2 = st.columns(2)
                with col1:
                    st.image(image, caption="Uploaded Image", use_column_width=True)
                
                probabilities, landmarks = process_and_predict(image)
                
                if probabilities is not None and landmarks is not None:
                    with col2:
                        st.subheader("Top 5 Predictions:")
                        top_indices = np.argsort(probabilities)[::-1][:5]
                        for i in top_indices:
                            st.write(f"{model.classes_[i]}: {probabilities[i]:.2f}")
                    
                    fig = plot_hand_landmarks(landmarks, "Detected Hand Landmarks")
                    st.pyplot(fig)
                else:
                    st.write("No hand detected in the image.")
            else:
                st.error("Failed to load the image. The file might be corrupted.")
        except Exception as e:
            st.error(f"An error occurred while processing the image: {str(e)}")

with tab2:
    st.header("View Hand Landmarks")
    
    selected_alphabets = st.multiselect("Select alphabets to view landmarks:", list(working_alphabets))

    if selected_alphabets:
        cols = st.columns(4)  # 4 columns for smaller images
        for idx, alphabet in enumerate(selected_alphabets):
            with cols[idx % 4]:
                image_path = os.path.join('asl test set', f'{alphabet.lower()}.jpeg')
                if os.path.exists(image_path):
                    try:
                        image = cv2.imread(image_path)
                        if image is not None:
                            probabilities, landmarks = process_and_predict(image)
                            if landmarks is not None:
                                fig = plot_hand_landmarks(landmarks, f"Hand Landmarks for {alphabet}")
                                st.pyplot(fig)
                            else:
                                st.error(f"No hand detected for {alphabet}")
                        else:
                            st.error(f"Failed to load image for {alphabet}")
                    except Exception as e:
                        st.error(f"Error processing image for {alphabet}")
                else:
                    st.error(f"Image not found for {alphabet}")