Spaces:

Niharmahesh
/

slr-easz

Sleeping

App Files Files Community

Niharmahesh committed on Oct 19, 2024

Commit

5252e41

verified ·

1 Parent(s): 313ea3a

Update app.py

Browse files

Files changed (1) hide show

app.py +99 -102

app.py CHANGED Viewed

@@ -2,109 +2,106 @@ import streamlit as st
 import cv2
 import numpy as np
 import mediapipe as mp
-import pickle
-# Load models directly
-with open('random_forest_model.pkl', 'rb') as file:
-    random_forest_model = pickle.load(file)
-with open('svm_model.pkl', 'rb') as file:
-    svm_model = pickle.load(file)
-with open('hard_voting_classifier.pkl', 'rb') as file:
-    hard_voting_model = pickle.load(file)
-with open('soft_voting_classifier.pkl', 'rb') as file:
-    soft_voting_model = pickle.load(file)
-label_classes = np.load('label_classes.npy', allow_pickle=True)
-models = {
-    'Random Forest': random_forest_model,
-    'SVM': svm_model,
-    'Hard Voting': hard_voting_model,
-    'Soft Voting': soft_voting_model
-}
 # Initialize MediaPipe Hands
-mp_hands = mp.solutions.hands
-hands = mp_hands.Hands(static_image_mode=True, max_num_hands=1, min_detection_confidence=0.5)
-def process_landmarks(hand_landmarks):
-    x_ = [landmark.x for landmark in hand_landmarks.landmark]
-    y_ = [landmark.y for landmark in hand_landmarks.landmark]
-    min_x, min_y = min(x_), min(y_)
-    return [coord - min_val for landmark in hand_landmarks.landmark for coord, min_val in zip((landmark.x, landmark.y), (min_x, min_y))]
-def get_model_predictions(data_aux, model):
-    if hasattr(model, 'predict_proba'):
-        probabilities = model.predict_proba([data_aux])[0]
-    elif hasattr(model, 'decision_function'):
-        scores = model.decision_function([data_aux])[0]
-        probabilities = (scores - scores.min()) / (scores.max() - scores.min())
-    else:
-        class_pred = model.predict([data_aux])[0]
-        probabilities = np.zeros(len(label_classes))
-        probabilities[class_pred] = 1
-    # Add this check
-    if not hasattr(model, 'monotonic_cst'):
-        model.monotonic_cst = None
-    top_index = np.argmax(probabilities)
-    return label_classes[top_index], probabilities[top_index]
-def predict_alphabet(image):
-    image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
-    results = hands.process(image_rgb)
-    if not results.multi_hand_landmarks:
-        return None, None
-    data_aux = process_landmarks(results.multi_hand_landmarks[0])
-    predictions = {}
-    for model_name, model in models.items():
-        prediction, probability = get_model_predictions(data_aux, model)
-        predictions[model_name] = (prediction, probability)
-    return predictions, results.multi_hand_landmarks[0]
-def draw_hand_landmarks(image, hand_landmarks):
-    for landmark in hand_landmarks.landmark:
-        h, w, _ = image.shape
-        cx, cy = int(landmark.x * w), int(landmark.y * h)
-        cv2.circle(image, (cx, cy), 5, (0, 255, 0), -1)
-    return image
-# Streamlit App
-st.title("ASL Hand Shape Recognition App")
-uploaded_file = st.file_uploader("Choose a hand image...", type=["jpg", "jpeg", "png"])
 if uploaded_file is not None:
-    image = cv2.imdecode(np.frombuffer(uploaded_file.read(), np.uint8), 1)
-    st.image(image, channels="BGR", caption="Uploaded Hand Image")
-    predictions, hand_landmarks = predict_alphabet(image)
-    if predictions and hand_landmarks:
-        st.subheader("Predictions:")
-        for model_name, (prediction, probability) in predictions.items():
-            st.write(f"{model_name}: {prediction} (Probability: {probability:.2f})")
-        st.subheader("Hand Landmarks:")
-        landmark_image = draw_hand_landmarks(image.copy(), hand_landmarks)
-        st.image(landmark_image, channels="BGR", caption="Hand Landmarks")
-    else:
-        st.write("No hand detected in the image.")
-# User input to draw hand sign (placeholder)
-user_input = st.text_input("Enter alphabet to draw hand sign:")
-if user_input:
-    if len(user_input) == 1 and user_input.isalpha():
-        st.write(f"Drawing hand sign for alphabet: {user_input.upper()}")
-        # Placeholder for drawing hand sign
-        st.write("(Hand sign drawing functionality not implemented)")
-    else:
-        st.error("Please enter a single alphabet.")
-# Release MediaPipe resources
-hands.close()

 import cv2
 import numpy as np
 import mediapipe as mp
+import joblib
+import pandas as pd
+from numpy.linalg import norm
+# Random Forest model loader, wrapped in st.cache_resource
+@st.cache_resource
+def load_model():
+    """Load the classifier stored in 'best_random_forest_model.pkl'.
+
+    Returns:
+        The object returned by ``joblib.load``, or ``None`` when loading
+        raises; in that case the error is reported through ``st.error``.
+    """
+    try:
+        loaded_model = joblib.load('best_random_forest_model.pkl')
+    except Exception as e:
+        # NOTE(review): st.cache_resource presumably caches this None result
+        # as well, so a failed load may persist until the cache is cleared
+        # or the app restarts - confirm against the Streamlit docs.
+        st.error(f"Error loading model: {e}")
+        loaded_model = None
+    return loaded_model
+# Obtain the model through the cached loader
+model = load_model()
+# Nothing below can run without a model, so halt the script when loading failed
+if model is None:
+    st.stop()
 # Initialize MediaPipe Hands
+@st.cache_resource
+def load_mediapipe_model():
+    """Build the MediaPipe ``Hands`` detector used by the app.
+
+    The detector is configured for still images (``static_image_mode=True``),
+    at most one hand, and a minimum detection confidence of 0.5.
+    """
+    return mp.solutions.hands.Hands(
+        static_image_mode=True,
+        max_num_hands=1,
+        min_detection_confidence=0.5,
+    )
+# Detector instance obtained through the cached factory above
+hands = load_mediapipe_model()
+# Drawing helpers used to overlay detected landmarks on the image
+mp_drawing = mp.solutions.drawing_utils
+# Function to normalize landmarks
+def normalize_landmarks(landmarks):
+    """Center landmarks on their mean and scale each axis to unit variance.
+
+    Args:
+        landmarks: 2-D array-like with one row per landmark and one column
+            per coordinate (the app passes ``(x, y)`` pairs).
+
+    Returns:
+        A float ``numpy.ndarray`` of the same shape. An axis whose standard
+        deviation is zero (all points share that coordinate) is returned as
+        zeros, and any remaining NaN values are replaced with 0.
+    """
+    points = np.asarray(landmarks, dtype=float)
+    if points.size == 0:
+        # Nothing to normalize; avoid mean/std warnings on empty input
+        return points
+    # Center the landmarks
+    centered = points - points.mean(axis=0)
+    # Scale the landmarks to unit variance
+    spread = centered.std(axis=0)
+    # Divide only where the spread is non-zero so a degenerate axis yields
+    # zeros directly instead of a 0/0 RuntimeWarning cleaned up afterwards
+    scaled = np.divide(centered, spread, out=np.zeros_like(centered), where=spread != 0)
+    # Replace NaN values with 0 (e.g. NaN coordinates in the input)
+    return np.nan_to_num(scaled)
+# Function to calculate angles between landmarks
+def calculate_angles(landmarks):
+    """Return direction angles for every pair of landmarks.
+
+    For each pair ``(i, j)`` with ``i < j`` the vector
+    ``landmarks[j] - landmarks[i]`` contributes two values: the arccos of its
+    x component divided by its length, and the arccos of its y component
+    divided by its length (radians).
+
+    Args:
+        landmarks: 2-D array-like with one row per landmark; the first two
+            columns are used as x and y. 21 landmarks produce 420 angles.
+
+    Returns:
+        A flat list ``[angle_x, angle_y, ...]`` ordered by ``i``, then ``j``.
+        A pair of coincident landmarks (zero-length vector) has no defined
+        direction and contributes ``0.0, 0.0`` rather than NaN, matching the
+        "undefined becomes 0" convention of ``normalize_landmarks``.
+    """
+    points = np.asarray(landmarks, dtype=float)
+    count = len(points)
+    angles = []
+    for i in range(count - 1):
+        for j in range(i + 1, count):
+            vector = points[j] - points[i]
+            length = norm(vector)
+            if length == 0:
+                # 0/0 would yield NaN angles and poison the feature vector
+                angles.extend([0.0, 0.0])
+                continue
+            # clip guards arccos against values just outside [-1, 1]
+            angle_x = np.arccos(np.clip(vector[0] / length, -1.0, 1.0))
+            angle_y = np.arccos(np.clip(vector[1] / length, -1.0, 1.0))
+            angles.extend([angle_x, angle_y])
+    return angles
+# Streamlit app
+st.title("ASL Recognition App")
+# Upload image using Streamlit's file uploader
+uploaded_file = st.file_uploader("Upload an image of an ASL sign", type=["jpg", "jpeg", "png"])
 if uploaded_file is not None:
+    try:
+        # Read the image (OpenCV decodes to BGR channel order)
+        image = cv2.imdecode(np.frombuffer(uploaded_file.read(), np.uint8), cv2.IMREAD_COLOR)
+        if image is None:
+            # imdecode signals an undecodable buffer by returning None;
+            # raise here so the user sees a clear message from the handler below
+            raise ValueError("the uploaded file could not be decoded as an image")
+        image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+        # Process the image and find hand landmarks
+        results = hands.process(image_rgb)
+        if results.multi_hand_landmarks:
+            for hand_landmarks in results.multi_hand_landmarks:
+                # Draw landmarks on the (BGR) image
+                mp_drawing.draw_landmarks(image, hand_landmarks, mp.solutions.hands.HAND_CONNECTIONS)
+                # Extract and normalize landmarks
+                landmarks = np.array([[lm.x, lm.y] for lm in hand_landmarks.landmark])
+                landmarks_normalized = normalize_landmarks(landmarks)
+                # Calculate angles using normalized landmarks
+                angles = calculate_angles(landmarks_normalized)
+                # Prepare input with feature names
+                angle_columns = [f'angle_{i}' for i in range(len(angles))]
+                angles_df = pd.DataFrame([angles], columns=angle_columns)
+                # Predict the alphabet
+                probabilities = model.predict_proba(angles_df)[0]
+                top_indices = np.argsort(probabilities)[::-1][:5]
+                top_probabilities = probabilities[top_indices]
+                top_classes = model.classes_[top_indices]
+                # Display the top predictions; zip stops early if the model
+                # exposes fewer than 5 classes instead of raising IndexError
+                st.write("Top 5 Predicted Alphabets:")
+                for class_label, probability in zip(top_classes, top_probabilities):
+                    st.write(f"{class_label}: {probability:.2f}")
+            # Display the image with landmarks; it is still in BGR order, so
+            # tell Streamlit, otherwise red and blue are swapped on screen
+            st.image(image, caption="Processed Image with Landmarks", use_column_width=True, channels="BGR")
+        else:
+            st.write("No hands detected. Please try another image.")
+    except Exception as e:
+        # Top-level boundary of the app: surface any failure to the user
+        st.error(f"Error processing image: {e}")