SignTranslateProject/functions.py at main · kjs1019/SignTranslateProject

90 lines (76 loc) · 5.03 KB
from packages import *
def mediapipe_detection(image, model):
    """Run ``model`` on a BGR frame and return its detection results.

    Args:
        image: Frame in BGR channel order; it is converted with
            ``cv2.COLOR_BGR2RGB`` before being handed to the model. The
            caller's array is not modified.
        model: Object exposing ``process(rgb_image)``.

    Returns:
        Whatever ``model.process`` returns for the RGB copy of ``image``.
    """
    rgb_frame = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)  # Model is fed RGB input
    # Read-only during inference; NOTE(review): the MediaPipe examples do this
    # as a performance hint (pass by reference) -- confirm it still applies.
    rgb_frame.flags.writeable = False
    # Only the results are returned, so the local RGB copy is simply dropped:
    # converting it back to BGR or making it writeable again would be
    # wasted per-frame work.
    return model.process(rgb_frame)
def mediapipe_detection_draw_landmarks(image, results):
    """Draw the face, pose and both hand landmark sets of ``results`` on ``image``.

    Args:
        image: Frame handed to ``draw_landmarks`` as the drawing target.
        results: Detection results exposing ``face_landmarks``,
            ``pose_landmarks``, ``left_hand_landmarks`` and
            ``right_hand_landmarks``.

    Returns:
        None.
    """
    def marker_styles(thickness, dot_radius, line_radius):
        # Builds the (landmark dot, connection line) style pair for one call.
        dot_style = mediapipe_drawing.DrawingSpec(
            color=(255, 0, 0), thickness=thickness, circle_radius=dot_radius)
        line_style = mediapipe_drawing.DrawingSpec(
            color=(0, 255, 0), thickness=thickness, circle_radius=line_radius)
        return dot_style, line_style

    # Face mesh: thin strokes and small dots.
    mediapipe_drawing.draw_landmarks(
        image,
        results.face_landmarks,
        mediapipe_holistic.FACEMESH_TESSELATION,
        *marker_styles(1, 1, 1))

    # Body pose: thicker strokes.
    mediapipe_drawing.draw_landmarks(
        image,
        results.pose_landmarks,
        mediapipe_holistic.POSE_CONNECTIONS,
        *marker_styles(2, 3, 2))

    # Left hand, then right hand, with the same styling as the pose.
    mediapipe.solutions.drawing_utils.draw_landmarks(
        image,
        results.left_hand_landmarks,
        mediapipe_holistic.HAND_CONNECTIONS,
        *marker_styles(2, 3, 2))
    mediapipe.solutions.drawing_utils.draw_landmarks(
        image,
        results.right_hand_landmarks,
        mediapipe_holistic.HAND_CONNECTIONS,
        *marker_styles(2, 3, 2))
def _flatten_landmarks(landmark_list, count, with_visibility=False):
    """Return one part's landmarks as a 1-D array, or zeros when it is missing."""
    width = 4 if with_visibility else 3
    if not landmark_list:
        # Part not detected: zero-fill so the output length never changes.
        return np.zeros(count * width)
    if with_visibility:
        rows = [[lm.x, lm.y, lm.z, lm.visibility] for lm in landmark_list.landmark]
    else:
        rows = [[lm.x, lm.y, lm.z] for lm in landmark_list.landmark]
    return np.array(rows).flatten()


def keypoint_value_extraction(results):
    """Flatten the landmarks in ``results`` into a single 1-D keypoint vector.

    The vector is laid out as face, pose, left hand, right hand. A part whose
    landmarks are missing (falsy) contributes a zero block of its nominal
    size instead: 468 * 3 for the face, 33 * 4 for the pose (x, y, z,
    visibility) and 21 * 3 for each hand.

    Args:
        results: Object exposing ``face_landmarks``, ``pose_landmarks``,
            ``left_hand_landmarks`` and ``right_hand_landmarks``; each is
            either falsy or has a ``landmark`` iterable of points.

    Returns:
        1-D ``numpy.ndarray`` with the four parts concatenated.
    """
    face = _flatten_landmarks(results.face_landmarks, 468)
    pose = _flatten_landmarks(results.pose_landmarks, 33, with_visibility=True)
    left_hand = _flatten_landmarks(results.left_hand_landmarks, 21)
    right_hand = _flatten_landmarks(results.right_hand_landmarks, 21)
    return np.concatenate([face, pose, left_hand, right_hand])
def myPutText(src, text, pos, font_size, font_color) :
    """Draw ``text`` on an image using the TrueType font at 'fonts/gulim.ttc'.

    Args:
        src: Array accepted by ``Image.fromarray``.
        text: String to render.
        pos: Position forwarded to ``ImageDraw.text``.
        font_size: Size passed to ``ImageFont.truetype``.
        font_color: Fill colour forwarded to ``ImageDraw.text``.

    Returns:
        ``numpy.ndarray`` built from the PIL image after drawing.
    """
    canvas = Image.fromarray(src)
    pen = ImageDraw.Draw(canvas)
    typeface = ImageFont.truetype('fonts/gulim.ttc', font_size)
    pen.text(pos, text, font=typeface, fill=font_color)
    rendered = np.array(canvas)
    return rendered
def interpolate_keypoints(keypoints1, keypoints2, num_transition_frames):
    """Linearly blend from ``keypoints1`` towards ``keypoints2``.

    Produces ``num_transition_frames`` intermediate frames. Frame ``t``
    (1-based) uses the weight ``t / (num_transition_frames + 1)``, so
    neither endpoint itself appears in the output.

    Args:
        keypoints1: Starting keypoints.
        keypoints2: Target keypoints.
        num_transition_frames: Number of in-between frames to generate.

    Returns:
        List of blended keypoints, ordered from closest-to-``keypoints1``
        to closest-to-``keypoints2``.
    """
    denominator = num_transition_frames + 1
    weights = (step / denominator for step in range(1, denominator))
    return [keypoints1 * (1 - weight) + keypoints2 * weight for weight in weights]
def _sorted_by_number(names, number_of):
    """Return ``names`` sorted by ``number_of(name)``, skipping unparsable names."""
    numbered = []
    for name in names:
        try:
            numbered.append((number_of(name), name))
        except ValueError:
            # Stray entries such as '.DS_Store' or 'Thumbs.db' carry no number.
            continue
    numbered.sort(key=lambda pair: pair[0])
    return [name for _, name in numbered]


def load_word_data(word_path):
    """Load every frame of every sequence stored for one word.

    ``word_path`` is expected to contain sequence directories with integer
    names; each holds frame files whose name starts with an integer before
    the first '.'. Sequences and frames are visited in numeric order.
    Entries that are not directories, or whose number cannot be parsed, are
    skipped rather than aborting the whole load.

    Args:
        word_path: Directory holding the numbered sequence directories.

    Returns:
        Flat list with the result of ``np.load`` for each frame file.
    """
    all_frames = []
    for sequence in _sorted_by_number(os.listdir(word_path), int):
        sequence_path = os.path.join(word_path, sequence)
        if not os.path.isdir(sequence_path):
            continue
        frame_files = _sorted_by_number(
            os.listdir(sequence_path),
            lambda name: int(name.split('.')[0]),
        )
        all_frames.extend(
            np.load(os.path.join(sequence_path, frame_file))
            for frame_file in frame_files
        )
    return all_frames
def extract_words_from_output_textfile(file_path):
    """Collect the value part of every ``key = "value"`` line in a text file.

    Lines without '=' are ignored. Each remaining line is split at its FIRST
    '=' only, so a value that itself contains '=' is kept whole instead of
    raising ``ValueError``. Surrounding whitespace and double quotes are
    stripped from the value.

    Args:
        file_path: Path of the UTF-8 encoded text file to read.

    Returns:
        List of extracted words in file order.
    """
    words = []
    with open(file_path, 'r', encoding='utf-8') as file:
        for line in file:
            _, separator, word = line.partition('=')
            if separator:
                words.append(word.strip().strip('"'))
    return words
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

functions.py

Latest commit

History

functions.py

File metadata and controls