| import gradio as gr |
| import joblib |
| from gensim.models import Word2Vec |
| import numpy as np |
|
|
| |
| classifier = joblib.load("random_forest_model.pkl") |
| word2vec_model = Word2Vec.load("word2vec_model.bin") |
| label_encoder = joblib.load("label_encoder.pkl") |
|
|
| def predict_comment(comment): |
| tokenized_comment = comment.split() |
| comment_vector = get_average_word2vec(tokenized_comment, word2vec_model, 100) |
| comment_vector = comment_vector.reshape(1, -1) |
| prediction = classifier.predict(comment_vector) |
| return "Based on Experience" if label_encoder.inverse_transform(prediction)[0] == 1 else "Not Based on Experience" |
|
|
| def get_average_word2vec(comment, model, num_features): |
| feature_vec = np.zeros((num_features,), dtype="float32") |
| n_words = 0 |
| for word in comment: |
| if word in model.wv.key_to_index: |
| n_words += 1 |
| feature_vec = np.add(feature_vec, model.wv[word]) |
| if n_words > 0: |
| feature_vec = np.divide(feature_vec, n_words) |
| return feature_vec |
|
|
| |
| iface = gr.Interface(fn=predict_comment, inputs="text", outputs="text") |
| iface.launch() |
|
|