Spaces:
Sleeping
Sleeping
report edit
Browse files
notebooks/07_support_vector_machine.ipynb
CHANGED
|
@@ -767,7 +767,7 @@
|
|
| 767 |
"print(f\" - Max Iterations: {svm_classifier.max_iter}\")\n",
|
| 768 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 769 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 770 |
-
"print(f\" - Max Features:
|
| 771 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 772 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 773 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
|
|
|
| 767 |
"print(f\" - Max Iterations: {svm_classifier.max_iter}\")\n",
|
| 768 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 769 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 770 |
+
"print(f\" - Max Features: 100000\")\n",
|
| 771 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 772 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 773 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
notebooks/08_k_nearest_neighbors.ipynb
CHANGED
|
@@ -580,7 +580,7 @@
|
|
| 580 |
"print(f\" - Best CV F1-Score: {random_search.best_score_:.4f}\")\n",
|
| 581 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 582 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 583 |
-
"print(f\" - Max Features:
|
| 584 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 585 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 586 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
|
|
|
| 580 |
"print(f\" - Best CV F1-Score: {random_search.best_score_:.4f}\")\n",
|
| 581 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 582 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 583 |
+
"print(f\" - Max Features: 100000\")\n",
|
| 584 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 585 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 586 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
notebooks/09_decision_trees.ipynb
CHANGED
|
@@ -701,7 +701,7 @@
|
|
| 701 |
"print(f\" - Min Samples Leaf: {dt_classifier.min_samples_leaf}\")\n",
|
| 702 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 703 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 704 |
-
"print(f\" - Max Features:
|
| 705 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 706 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 707 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
|
|
|
| 701 |
"print(f\" - Min Samples Leaf: {dt_classifier.min_samples_leaf}\")\n",
|
| 702 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 703 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 704 |
+
"print(f\" - Max Features: 100000\")\n",
|
| 705 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 706 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 707 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
notebooks/10_random_forest.ipynb
CHANGED
|
@@ -712,7 +712,7 @@
|
|
| 712 |
"print(f\" - Max Features: {rf_classifier.max_features}\")\n",
|
| 713 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 714 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 715 |
-
"print(f\" - Max Features:
|
| 716 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 717 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 718 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
|
|
|
| 712 |
"print(f\" - Max Features: {rf_classifier.max_features}\")\n",
|
| 713 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 714 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 715 |
+
"print(f\" - Max Features: 100000\")\n",
|
| 716 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 717 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 718 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
notebooks/11_stochastic_gradient_descent.ipynb
CHANGED
|
@@ -768,7 +768,7 @@
|
|
| 768 |
"print(f\" - Early Stopping: {sgd_classifier.early_stopping}\")\n",
|
| 769 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 770 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 771 |
-
"print(f\" - Max Features:
|
| 772 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 773 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 774 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
|
|
|
| 768 |
"print(f\" - Early Stopping: {sgd_classifier.early_stopping}\")\n",
|
| 769 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 770 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 771 |
+
"print(f\" - Max Features: 100000\")\n",
|
| 772 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 773 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 774 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
notebooks/12_xgboost.ipynb
CHANGED
|
@@ -735,7 +735,7 @@
|
|
| 735 |
},
|
| 736 |
{
|
| 737 |
"cell_type": "code",
|
| 738 |
-
"execution_count":
|
| 739 |
"id": "24",
|
| 740 |
"metadata": {
|
| 741 |
"colab": {
|
|
@@ -793,7 +793,7 @@
|
|
| 793 |
"print(f\" - Min Child Weight: {xgb_classifier.min_child_weight}\")\n",
|
| 794 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 795 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 796 |
-
"print(f\" - Max Features:
|
| 797 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 798 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 799 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
|
|
|
| 735 |
},
|
| 736 |
{
|
| 737 |
"cell_type": "code",
|
| 738 |
+
"execution_count": null,
|
| 739 |
"id": "24",
|
| 740 |
"metadata": {
|
| 741 |
"colab": {
|
|
|
|
| 793 |
"print(f\" - Min Child Weight: {xgb_classifier.min_child_weight}\")\n",
|
| 794 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 795 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 796 |
+
"print(f\" - Max Features: 100000\")\n",
|
| 797 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 798 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 799 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
notebooks/13_lightgbm.ipynb
CHANGED
|
@@ -739,7 +739,7 @@
|
|
| 739 |
},
|
| 740 |
{
|
| 741 |
"cell_type": "code",
|
| 742 |
-
"execution_count":
|
| 743 |
"id": "24",
|
| 744 |
"metadata": {
|
| 745 |
"colab": {
|
|
@@ -798,7 +798,7 @@
|
|
| 798 |
"print(f\" - Colsample by Tree: {lgb_classifier.colsample_bytree}\")\n",
|
| 799 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 800 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 801 |
-
"print(f\" - Max Features:
|
| 802 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 803 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 804 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|
|
|
|
| 739 |
},
|
| 740 |
{
|
| 741 |
"cell_type": "code",
|
| 742 |
+
"execution_count": null,
|
| 743 |
"id": "24",
|
| 744 |
"metadata": {
|
| 745 |
"colab": {
|
|
|
|
| 798 |
"print(f\" - Colsample by Tree: {lgb_classifier.colsample_bytree}\")\n",
|
| 799 |
"print(f\"\\nFeature Engineering:\")\n",
|
| 800 |
"print(f\" - Vectorizer: TF-IDF\")\n",
|
| 801 |
+
"print(f\" - Max Features: 100000\")\n",
|
| 802 |
"print(f\" - N-gram Range: (1, 2)\")\n",
|
| 803 |
"print(f\" - Min Document Frequency: 5\")\n",
|
| 804 |
"print(f\" - Max Document Frequency: 0.8\")\n",
|