mhamoody committed on
Commit
6fd8aeb
·
1 Parent(s): a758cb5

report edit

Browse files
notebooks/07_support_vector_machine.ipynb CHANGED
@@ -767,7 +767,7 @@
767
  "print(f\" - Max Iterations: {svm_classifier.max_iter}\")\n",
768
  "print(f\"\\nFeature Engineering:\")\n",
769
  "print(f\" - Vectorizer: TF-IDF\")\n",
770
- "print(f\" - Max Features: 5000\")\n",
771
  "print(f\" - N-gram Range: (1, 2)\")\n",
772
  "print(f\" - Min Document Frequency: 5\")\n",
773
  "print(f\" - Max Document Frequency: 0.8\")\n",
 
767
  "print(f\" - Max Iterations: {svm_classifier.max_iter}\")\n",
768
  "print(f\"\\nFeature Engineering:\")\n",
769
  "print(f\" - Vectorizer: TF-IDF\")\n",
770
+ "print(f\" - Max Features: 100000\")\n",
771
  "print(f\" - N-gram Range: (1, 2)\")\n",
772
  "print(f\" - Min Document Frequency: 5\")\n",
773
  "print(f\" - Max Document Frequency: 0.8\")\n",
notebooks/08_k_nearest_neighbors.ipynb CHANGED
@@ -580,7 +580,7 @@
580
  "print(f\" - Best CV F1-Score: {random_search.best_score_:.4f}\")\n",
581
  "print(f\"\\nFeature Engineering:\")\n",
582
  "print(f\" - Vectorizer: TF-IDF\")\n",
583
- "print(f\" - Max Features: 5000\")\n",
584
  "print(f\" - N-gram Range: (1, 2)\")\n",
585
  "print(f\" - Min Document Frequency: 5\")\n",
586
  "print(f\" - Max Document Frequency: 0.8\")\n",
 
580
  "print(f\" - Best CV F1-Score: {random_search.best_score_:.4f}\")\n",
581
  "print(f\"\\nFeature Engineering:\")\n",
582
  "print(f\" - Vectorizer: TF-IDF\")\n",
583
+ "print(f\" - Max Features: 100000\")\n",
584
  "print(f\" - N-gram Range: (1, 2)\")\n",
585
  "print(f\" - Min Document Frequency: 5\")\n",
586
  "print(f\" - Max Document Frequency: 0.8\")\n",
notebooks/09_decision_trees.ipynb CHANGED
@@ -701,7 +701,7 @@
701
  "print(f\" - Min Samples Leaf: {dt_classifier.min_samples_leaf}\")\n",
702
  "print(f\"\\nFeature Engineering:\")\n",
703
  "print(f\" - Vectorizer: TF-IDF\")\n",
704
- "print(f\" - Max Features: 5000\")\n",
705
  "print(f\" - N-gram Range: (1, 2)\")\n",
706
  "print(f\" - Min Document Frequency: 5\")\n",
707
  "print(f\" - Max Document Frequency: 0.8\")\n",
 
701
  "print(f\" - Min Samples Leaf: {dt_classifier.min_samples_leaf}\")\n",
702
  "print(f\"\\nFeature Engineering:\")\n",
703
  "print(f\" - Vectorizer: TF-IDF\")\n",
704
+ "print(f\" - Max Features: 100000\")\n",
705
  "print(f\" - N-gram Range: (1, 2)\")\n",
706
  "print(f\" - Min Document Frequency: 5\")\n",
707
  "print(f\" - Max Document Frequency: 0.8\")\n",
notebooks/10_random_forest.ipynb CHANGED
@@ -712,7 +712,7 @@
712
  "print(f\" - Max Features: {rf_classifier.max_features}\")\n",
713
  "print(f\"\\nFeature Engineering:\")\n",
714
  "print(f\" - Vectorizer: TF-IDF\")\n",
715
- "print(f\" - Max Features: 5000\")\n",
716
  "print(f\" - N-gram Range: (1, 2)\")\n",
717
  "print(f\" - Min Document Frequency: 5\")\n",
718
  "print(f\" - Max Document Frequency: 0.8\")\n",
 
712
  "print(f\" - Max Features: {rf_classifier.max_features}\")\n",
713
  "print(f\"\\nFeature Engineering:\")\n",
714
  "print(f\" - Vectorizer: TF-IDF\")\n",
715
+ "print(f\" - Max Features: 100000\")\n",
716
  "print(f\" - N-gram Range: (1, 2)\")\n",
717
  "print(f\" - Min Document Frequency: 5\")\n",
718
  "print(f\" - Max Document Frequency: 0.8\")\n",
notebooks/11_stochastic_gradient_descent.ipynb CHANGED
@@ -768,7 +768,7 @@
768
  "print(f\" - Early Stopping: {sgd_classifier.early_stopping}\")\n",
769
  "print(f\"\\nFeature Engineering:\")\n",
770
  "print(f\" - Vectorizer: TF-IDF\")\n",
771
- "print(f\" - Max Features: 5000\")\n",
772
  "print(f\" - N-gram Range: (1, 2)\")\n",
773
  "print(f\" - Min Document Frequency: 5\")\n",
774
  "print(f\" - Max Document Frequency: 0.8\")\n",
 
768
  "print(f\" - Early Stopping: {sgd_classifier.early_stopping}\")\n",
769
  "print(f\"\\nFeature Engineering:\")\n",
770
  "print(f\" - Vectorizer: TF-IDF\")\n",
771
+ "print(f\" - Max Features: 100000\")\n",
772
  "print(f\" - N-gram Range: (1, 2)\")\n",
773
  "print(f\" - Min Document Frequency: 5\")\n",
774
  "print(f\" - Max Document Frequency: 0.8\")\n",
notebooks/12_xgboost.ipynb CHANGED
@@ -735,7 +735,7 @@
735
  },
736
  {
737
  "cell_type": "code",
738
- "execution_count": 19,
739
  "id": "24",
740
  "metadata": {
741
  "colab": {
@@ -793,7 +793,7 @@
793
  "print(f\" - Min Child Weight: {xgb_classifier.min_child_weight}\")\n",
794
  "print(f\"\\nFeature Engineering:\")\n",
795
  "print(f\" - Vectorizer: TF-IDF\")\n",
796
- "print(f\" - Max Features: 5000\")\n",
797
  "print(f\" - N-gram Range: (1, 2)\")\n",
798
  "print(f\" - Min Document Frequency: 5\")\n",
799
  "print(f\" - Max Document Frequency: 0.8\")\n",
 
735
  },
736
  {
737
  "cell_type": "code",
738
+ "execution_count": null,
739
  "id": "24",
740
  "metadata": {
741
  "colab": {
 
793
  "print(f\" - Min Child Weight: {xgb_classifier.min_child_weight}\")\n",
794
  "print(f\"\\nFeature Engineering:\")\n",
795
  "print(f\" - Vectorizer: TF-IDF\")\n",
796
+ "print(f\" - Max Features: 100000\")\n",
797
  "print(f\" - N-gram Range: (1, 2)\")\n",
798
  "print(f\" - Min Document Frequency: 5\")\n",
799
  "print(f\" - Max Document Frequency: 0.8\")\n",
notebooks/13_lightgbm.ipynb CHANGED
@@ -739,7 +739,7 @@
739
  },
740
  {
741
  "cell_type": "code",
742
- "execution_count": 17,
743
  "id": "24",
744
  "metadata": {
745
  "colab": {
@@ -798,7 +798,7 @@
798
  "print(f\" - Colsample by Tree: {lgb_classifier.colsample_bytree}\")\n",
799
  "print(f\"\\nFeature Engineering:\")\n",
800
  "print(f\" - Vectorizer: TF-IDF\")\n",
801
- "print(f\" - Max Features: 5000\")\n",
802
  "print(f\" - N-gram Range: (1, 2)\")\n",
803
  "print(f\" - Min Document Frequency: 5\")\n",
804
  "print(f\" - Max Document Frequency: 0.8\")\n",
 
739
  },
740
  {
741
  "cell_type": "code",
742
+ "execution_count": null,
743
  "id": "24",
744
  "metadata": {
745
  "colab": {
 
798
  "print(f\" - Colsample by Tree: {lgb_classifier.colsample_bytree}\")\n",
799
  "print(f\"\\nFeature Engineering:\")\n",
800
  "print(f\" - Vectorizer: TF-IDF\")\n",
801
+ "print(f\" - Max Features: 100000\")\n",
802
  "print(f\" - N-gram Range: (1, 2)\")\n",
803
  "print(f\" - Min Document Frequency: 5\")\n",
804
  "print(f\" - Max Document Frequency: 0.8\")\n",