# a_voiceless_voice / classifier.py
# Mackenzie Eng
# Upload app
import pandas as pd #dependncies
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from tqdm.notebook import tqdm
import pyarrow.parquet as pq
import tensorflow as tf
import os
def classifier(model_path="model.tflite", pq_path="landmarks.parquet",
               base_dir="data/asl-signs/"):
    """Predict the sign shown in a landmark parquet file.

    Loads the label vocabulary from ``train.csv`` under *base_dir*, reads the
    landmark frames from *pq_path*, runs the TensorFlow Lite model at
    *model_path* on them and maps the winning class index back to its label.

    Args:
        model_path: Path to the ``.tflite`` model file.
        pq_path: Path to the parquet file with ``x``, ``y``, ``z`` landmark
            columns; this is the recording whose sign is predicted.
        base_dir: Directory containing ``train.csv`` (must have a ``sign``
            column).

    Returns:
        The predicted sign label taken from the ``sign`` column of
        ``train.csv``.

    Raises:
        Exception: If the model does not expose a ``serving_default``
            signature.
        ValueError: If the parquet row count is not a whole number of frames.
    """
    # Rows (landmarks) per frame. The original code referenced this name
    # without defining it; 543 is the value given in the Kaggle asl-signs
    # data description -- NOTE(review): confirm it matches how
    # landmarks.parquet is produced.
    ROWS_PER_FRAME = 543
    REQUIRED_SIGNATURE = "serving_default"

    def run_model(model_path, frames):
        """Run the TFLite model on *frames* and return the argmax class index."""
        interpreter = tf.lite.Interpreter(model_path=model_path)

        # The model must expose the signature we are about to call.
        found_signatures = list(interpreter.get_signature_list().keys())
        if REQUIRED_SIGNATURE not in found_signatures:
            raise Exception('Required input signature not found.')

        prediction_fn = interpreter.get_signature_runner(REQUIRED_SIGNATURE)
        output = prediction_fn(inputs=frames)
        # Plain int so the result is a well-behaved dict key.
        return int(np.argmax(output["outputs"]))

    def load_relevant_data_subset(pq_path):
        """Load x/y/z landmarks as a float32 array of shape (frames, rows, 3)."""
        data_columns = ['x', 'y', 'z']
        data = pd.read_parquet(pq_path, columns=data_columns)
        n_frames, leftover = divmod(len(data), ROWS_PER_FRAME)
        if leftover:
            raise ValueError(
                f"{pq_path} has {len(data)} rows, which is not a multiple of "
                f"{ROWS_PER_FRAME} rows per frame."
            )
        data = data.values.reshape(n_frames, ROWS_PER_FRAME, len(data_columns))
        return data.astype(np.float32)

    train = pd.read_csv(os.path.join(base_dir, 'train.csv'))

    # Ordinal -> label lookup. Category codes index into the category list,
    # so enumerating the categories reproduces the code -> sign mapping
    # without adding a helper column to `train`.
    ORD2SIGN = dict(enumerate(train['sign'].astype('category').cat.categories))

    frames = load_relevant_data_subset(pq_path)
    sign = ORD2SIGN[run_model(model_path, frames)]
    return sign
if __name__ == "__main__":