TheBridgeMachineLearningPythonLibrary
diff --git a/‎requeriments.txt‎
Lines changed: 3 additions & 1 deletion b/‎requeriments.txt‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎toolkit/machine_learning.py‎
Lines changed: 29 additions & 1 deletion b/‎toolkit/machine_learning.py‎
Lines changed: 29 additions & 1 deletion
diff --git a/‎toolkit/plot.py‎
Lines changed: 27 additions & 0 deletions b/‎toolkit/plot.py‎
Lines changed: 27 additions & 0 deletions
diff --git a/‎toolkit/quickregression.py‎
Lines changed: 0 additions & 34 deletions b/‎toolkit/quickregression.py‎
Lines changed: 0 additions & 34 deletions
diff --git a/‎toolkit/wordcloudviz.py‎
Lines changed: 0 additions & 26 deletions b/‎toolkit/wordcloudviz.py‎
Lines changed: 0 additions & 26 deletions
@@ -55,4 +55,6 @@ missingno==0.5.1
 
 zipfile36==0.1.3
 
-imblearn==0.0
+imblearn==0.0
+
+wordcloud==1.7.0
@@ -140,4 +140,32 @@ def create_multiclass_prediction_df(model, class_names: List[str], X_test: Union
     if only_wrong:
         model_predictions_df = model_predictions_df[model_predictions_df['Top Prediction'] != model_predictions_df['Label']]
     # return the dataframe
-    return model_predictions_df
+    return model_predictions_df
+
+def quickregression(name):
+    """
+    Fit a default-constructed model and print its error metrics on the test split.
+    Reads X_train, y_train, X_test, y_test and np from the enclosing module scope.
+
+    Parameters
+    ----------
+    name = Class (not an instance) of the ML model; it is called with no arguments.
+           Input Example = LinearRegression
+
+    Returns
+    ----------
+    model.score(X_train, y_train), i.e. the TRAINING score; MAE, MAPE, MSE and RMSE are only printed.
+    """
+    from sklearn.metrics import mean_absolute_error, mean_squared_error, mean_absolute_percentage_error
+
+    # Fit of the model in the previously split X_train, y_train
+    model = name()
+    model.fit(X_train, y_train)
+    # Predict once with X_test and reuse the predictions for every metric below
+    modpred = model.predict(X_test)
+    mse = mean_squared_error(y_test, modpred)  # computed once, reused for RMSE
+    print("MAE test:", mean_absolute_error(y_test, modpred))
+    print("MAPE test:", mean_absolute_percentage_error(y_test, modpred))
+    print("MSE test:", mse)
+    print("RMSE test:", np.sqrt(mse))
+    return model.score(X_train, y_train)
@@ -138,3 +138,30 @@ def sunburst(df, interior:str, exterior:str, col_num:str, title:str):
     fig = px.sunburst(df, path=[interior, exterior], values=col_num, template = 'plotly_dark')
     fig.update_layout(width=800, height=600, title = title)
     fig.show()
+
+def wordcloudviz(column):
+    """
+    Function to show a quick wordcloud visualization of the text held in a column.
+
+    Parameters
+    ----------
+    column = iterable of strings, typically a text column of a dataframe.
+             Input example: df['column_name']
+
+    Return
+    ---------
+        None. The wordcloud figure is displayed with plt.show().
+    """
+    import matplotlib.pyplot as plt
+    from wordcloud import WordCloud
+    # First, it concatenates every entry of the column into a single text.
+    text = " ".join(column)
+
+    # Creates a wordcloud visualization
+    cloud = WordCloud(width=800, height=800, background_color='white').generate(text)
+
+    plt.figure(figsize=(8, 8), facecolor=None)
+    plt.imshow(cloud)
+    plt.axis("off")
+    plt.tight_layout(pad=0)
+    plt.show()