[ { "cell": null, "code": "I001", "end_location": { "column": 2, "row": 39 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "from datetime import datetime\nimport json\nfrom pathlib import Path\nfrom typing import Dict, Tuple\n\nimport numpy as np\nimport pandas as pd\nfrom sklearn.model_selection import train_test_split\n\nfrom hopcroft_skill_classification_tool_competition.config import PROCESSED_DATA_DIR\nfrom hopcroft_skill_classification_tool_competition.features import (\n create_feature_dataset,\n extract_tfidf_features,\n get_label_columns,\n load_data_from_db,\n prepare_labels,\n)\n\n\n", "end_location": { "column": 1, "row": 42 }, "location": { "column": 1, "row": 24 } } ], "message": "Organize imports" }, "location": { "column": 1, "row": 24 }, "message": "Import block is un-sorted or un-formatted", "noqa_row": 24, "url": "https://docs.astral.sh/ruff/rules/unsorted-imports" }, { "cell": null, "code": "F401", "end_location": { "column": 27, "row": 34 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "", "end_location": { "column": 1, "row": 40 }, "location": { "column": 1, "row": 33 } } ], "message": "Remove unused import" }, "location": { "column": 5, "row": 34 }, "message": "`hopcroft_skill_classification_tool_competition.features.create_feature_dataset` imported but unused", "noqa_row": 34, "url": "https://docs.astral.sh/ruff/rules/unused-import" }, { "cell": null, "code": "F401", "end_location": { "column": 22, "row": 35 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "", "end_location": { "column": 1, "row": 40 }, "location": { "column": 1, "row": 33 } } ], "message": "Remove unused import" }, "location": { "column": 5, "row": 35 }, "message": "`hopcroft_skill_classification_tool_competition.features.load_data_from_db` imported but unused", "noqa_row": 35, "url": "https://docs.astral.sh/ruff/rules/unused-import" }, { "cell": null, "code": "F401", "end_location": { "column": 22, "row": 36 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "", "end_location": { "column": 1, "row": 40 }, "location": { "column": 1, "row": 33 } } ], "message": "Remove unused import" }, "location": { "column": 5, "row": 36 }, "message": "`hopcroft_skill_classification_tool_competition.features.get_label_columns` imported but unused", "noqa_row": 36, "url": "https://docs.astral.sh/ruff/rules/unused-import" }, { "cell": null, "code": "F401", "end_location": { "column": 27, "row": 37 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "", "end_location": { "column": 1, "row": 40 }, "location": { "column": 1, "row": 33 } } ], "message": "Remove unused import" }, "location": { "column": 5, "row": 37 }, "message": "`hopcroft_skill_classification_tool_competition.features.extract_tfidf_features` imported but unused", "noqa_row": 37, "url": "https://docs.astral.sh/ruff/rules/unused-import" }, { "cell": null, "code": "F401", "end_location": { "column": 19, "row": 38 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "", "end_location": { "column": 1, "row": 40 }, "location": { "column": 1, "row": 33 } } ], "message": "Remove unused import" }, "location": { "column": 5, "row": 38 }, "message": "`hopcroft_skill_classification_tool_competition.features.prepare_labels` imported but unused", "noqa_row": 38, "url": "https://docs.astral.sh/ruff/rules/unused-import" }, { "cell": null, "code": "F541", "end_location": { "column": 58, "row": 149 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\"Conflicts resolved using majority voting\"", "end_location": { "column": 58, "row": 149 }, "location": { "column": 15, "row": 149 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 15, "row": 149 }, "message": "f-string without any placeholders", "noqa_row": 149, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F541", "end_location": { "column": 38, "row": 306 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\"No data leakage detected\"", "end_location": { "column": 38, "row": 306 }, "location": { "column": 11, "row": 306 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 306 }, "message": "f-string without any placeholders", "noqa_row": 306, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "E712", "end_location": { "column": 96, "row": 385 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "unsafe", "edits": [ { "content": "not stats.get(\"split\", {}).get(\"data_leakage\", True)", "end_location": { "column": 96, "row": 385 }, "location": { "column": 39, "row": 385 } } ], "message": "Replace with `not stats.get(\"split\", {}).get(\"data_leakage\", True)`" }, "location": { "column": 39, "row": 385 }, "message": "Avoid equality comparisons to `False`; use `not stats.get(\"split\", {}).get(\"data_leakage\", True):` for false checks", "noqa_row": 385, "url": "https://docs.astral.sh/ruff/rules/true-false-comparison" }, { "cell": null, "code": "I001", "end_location": { "column": 10, "row": 438 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": " from hopcroft_skill_classification_tool_competition.features import (\n extract_tfidf_features,\n get_label_columns,\n get_text_columns,\n load_data_from_db,\n prepare_labels,\n )\n", "end_location": { "column": 1, "row": 439 }, "location": { "column": 1, "row": 435 } } ], "message": "Organize imports" }, "location": { "column": 9, "row": 435 }, "message": "Import block is un-sorted or un-formatted", "noqa_row": 435, "url": "https://docs.astral.sh/ruff/rules/unsorted-imports" }, { "cell": null, "code": "F541", "end_location": { "column": 35, "row": 460 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\"\\nInitial data shape:\"", "end_location": { "column": 35, "row": 460 }, "location": { "column": 11, "row": 460 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 460 }, "message": "f-string without any placeholders", "noqa_row": 460, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F541", "end_location": { "column": 24, "row": 498 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\"\\nSummary:\"", "end_location": { "column": 24, "row": 498 }, "location": { "column": 11, "row": 498 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 498 }, "message": "f-string without any placeholders", "noqa_row": 498, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F541", "end_location": { "column": 45, "row": 509 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\"\\nData quality issues resolved:\"", "end_location": { "column": 45, "row": 509 }, "location": { "column": 11, "row": 509 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 509 }, "message": "f-string without any placeholders", "noqa_row": 509, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F541", "end_location": { "column": 36, "row": 510 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\" - Duplicates removed\"", "end_location": { "column": 36, "row": 510 }, "location": { "column": 11, "row": 510 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 510 }, "message": "f-string without any placeholders", "noqa_row": 510, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F541", "end_location": { "column": 42, "row": 511 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\" - Label conflicts resolved\"", "end_location": { "column": 42, "row": 511 }, "location": { "column": 11, "row": 511 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 511 }, "message": "f-string without any placeholders", "noqa_row": 511, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F541", "end_location": { "column": 40, "row": 512 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\" - Sparse samples removed\"", "end_location": { "column": 40, "row": 512 }, "location": { "column": 11, "row": 512 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 512 }, "message": "f-string without any placeholders", "noqa_row": 512, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F541", "end_location": { "column": 37, "row": 513 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\" - Rare labels removed\"", "end_location": { "column": 37, "row": 513 }, "location": { "column": 11, "row": 513 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 513 }, "message": "f-string without any placeholders", "noqa_row": 513, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F541", "end_location": { "column": 48, "row": 514 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\" - Clean train/test split created\"", "end_location": { "column": 48, "row": 514 }, "location": { "column": 11, "row": 514 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 514 }, "message": "f-string without any placeholders", "noqa_row": 514, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F541", "end_location": { "column": 42, "row": 515 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/data_cleaning.py", "fix": { "applicability": "safe", "edits": [ { "content": "\" - No data leakage verified\"", "end_location": { "column": 42, "row": 515 }, "location": { "column": 11, "row": 515 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 11, "row": 515 }, "message": "f-string without any placeholders", "noqa_row": 515, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "I001", "end_location": { "column": 2, "row": 14 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/dataset.py", "fix": { "applicability": "safe", "edits": [ { "content": "from pathlib import Path\nimport shutil\nimport zipfile\n\nfrom huggingface_hub import hf_hub_download\n\nfrom hopcroft_skill_classification_tool_competition.config import (\n DB_PATH,\n HF_FILENAME,\n HF_REPO_ID,\n RAW_DATA_DIR,\n)\n\n\n", "end_location": { "column": 1, "row": 17 }, "location": { "column": 1, "row": 3 } } ], "message": "Organize imports" }, "location": { "column": 1, "row": 3 }, "message": "Import block is un-sorted or un-formatted", "noqa_row": 3, "url": "https://docs.astral.sh/ruff/rules/unsorted-imports" }, { "cell": null, "code": "F401", "end_location": { "column": 12, "row": 10 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/dataset.py", "fix": { "applicability": "safe", "edits": [ { "content": "from hopcroft_skill_classification_tool_competition.config import (\n HF_FILENAME,\n HF_REPO_ID,\n RAW_DATA_DIR,\n)", "end_location": { "column": 2, "row": 14 }, "location": { "column": 1, "row": 9 } } ], "message": "Remove unused import: `hopcroft_skill_classification_tool_competition.config.DB_PATH`" }, "location": { "column": 5, "row": 10 }, "message": "`hopcroft_skill_classification_tool_competition.config.DB_PATH` imported but unused", "noqa_row": 10, "url": "https://docs.astral.sh/ruff/rules/unused-import" }, { "cell": null, "code": "I001", "end_location": { "column": 99, "row": 33 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/features.py", "fix": { "applicability": "safe", "edits": [ { "content": "from pathlib import Path\nimport re\nimport sqlite3\nfrom typing import Optional, Tuple\n\n# Import per lo Stemming\nimport nltk\nfrom nltk.stem import PorterStemmer\nimport numpy as np\nimport pandas as pd\nfrom sklearn.feature_extraction.text import TfidfVectorizer\n\nfrom hopcroft_skill_classification_tool_competition.config import PROCESSED_DATA_DIR, RAW_DATA_DIR\n\n", "end_location": { "column": 1, "row": 35 }, "location": { "column": 1, "row": 21 } } ], "message": "Organize imports" }, "location": { "column": 1, "row": 21 }, "message": "Import block is un-sorted or un-formatted", "noqa_row": 21, "url": "https://docs.astral.sh/ruff/rules/unsorted-imports" }, { "cell": null, "code": "F401", "end_location": { "column": 12, "row": 30 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/features.py", "fix": { "applicability": "safe", "edits": [ { "content": "", "end_location": { "column": 1, "row": 31 }, "location": { "column": 1, "row": 30 } } ], "message": "Remove unused import: `nltk`" }, "location": { "column": 8, "row": 30 }, "message": "`nltk` imported but unused", "noqa_row": 30, "url": "https://docs.astral.sh/ruff/rules/unused-import" }, { "cell": null, "code": "I001", "end_location": { "column": 47, "row": 8 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/mlsmote.py", "fix": { "applicability": "safe", "edits": [ { "content": "import random\n\nimport numpy as np\nimport pandas as pd\nfrom sklearn.datasets import make_classification\nfrom sklearn.neighbors import NearestNeighbors\n\n\n", "end_location": { "column": 1, "row": 10 }, "location": { "column": 1, "row": 4 } } ], "message": "Organize imports" }, "location": { "column": 1, "row": 4 }, "message": "Import block is un-sorted or un-formatted", "noqa_row": 4, "url": "https://docs.astral.sh/ruff/rules/unsorted-imports" }, { "cell": null, "code": "I001", "end_location": { "column": 2, "row": 23 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/modeling/train.py", "fix": { "applicability": "safe", "edits": [ { "content": "import argparse\nimport os\nfrom pathlib import Path\n\nfrom imblearn.over_sampling import ADASYN, SMOTE, RandomOverSampler\nimport joblib\nimport lightgbm as lgb\nimport mlflow\nimport mlflow.sklearn\nimport numpy as np\nfrom sklearn.decomposition import PCA\nfrom sklearn.ensemble import RandomForestClassifier\nfrom sklearn.metrics import f1_score, precision_score, recall_score\nfrom sklearn.model_selection import GridSearchCV, KFold, train_test_split\nfrom sklearn.multioutput import MultiOutputClassifier\n\nfrom hopcroft_skill_classification_tool_competition.config import (\n ADASYN_CONFIG,\n DATA_PATHS,\n MLFLOW_CONFIG,\n MODEL_CONFIG,\n PCA_CONFIG,\n TRAINING_CONFIG,\n)\n\n", "end_location": { "column": 1, "row": 25 }, "location": { "column": 1, "row": 1 } } ], "message": "Organize imports" }, "location": { "column": 1, "row": 1 }, "message": "Import block is un-sorted or un-formatted", "noqa_row": 1, "url": "https://docs.astral.sh/ruff/rules/unsorted-imports" }, { "cell": null, "code": "F401", "end_location": { "column": 41, "row": 13 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/modeling/train.py", "fix": { "applicability": "safe", "edits": [ { "content": "from imblearn.over_sampling import RandomOverSampler, ADASYN", "end_location": { "column": 68, "row": 13 }, "location": { "column": 1, "row": 13 } } ], "message": "Remove unused import: `imblearn.over_sampling.SMOTE`" }, "location": { "column": 36, "row": 13 }, "message": "`imblearn.over_sampling.SMOTE` imported but unused", "noqa_row": 13, "url": "https://docs.astral.sh/ruff/rules/unused-import" }, { "cell": null, "code": "I001", "end_location": { "column": 24, "row": 31 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/modeling/train.py", "fix": { "applicability": "safe", "edits": [ { "content": " import pandas as pd\n\n from hopcroft_skill_classification_tool_competition.mlsmote import MLSMOTE as mlsmote_function\n from hopcroft_skill_classification_tool_competition.mlsmote import get_minority_instace\n", "end_location": { "column": 1, "row": 32 }, "location": { "column": 1, "row": 27 } } ], "message": "Organize imports" }, "location": { "column": 5, "row": 27 }, "message": "Import block is un-sorted or un-formatted", "noqa_row": 27, "url": "https://docs.astral.sh/ruff/rules/unsorted-imports" }, { "cell": null, "code": "F541", "end_location": { "column": 84, "row": 340 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/modeling/train.py", "fix": { "applicability": "safe", "edits": [ { "content": "\"⚠️ Local MLSMOTE not available; falling back to RandomOverSampler\"", "end_location": { "column": 84, "row": 340 }, "location": { "column": 15, "row": 340 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 15, "row": 340 }, "message": "f-string without any placeholders", "noqa_row": 340, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" }, { "cell": null, "code": "F841", "end_location": { "column": 13, "row": 386 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/modeling/train.py", "fix": { "applicability": "unsafe", "edits": [ { "content": "", "end_location": { "column": 16, "row": 386 }, "location": { "column": 5, "row": 386 } } ], "message": "Remove assignment to unused variable `n_labels`" }, "location": { "column": 5, "row": 386 }, "message": "Local variable `n_labels` is assigned to but never used", "noqa_row": 386, "url": "https://docs.astral.sh/ruff/rules/unused-variable" }, { "cell": null, "code": "F541", "end_location": { "column": 84, "row": 568 }, "filename": "/home/giuto/Desktop/Uni/Magistrale/2° Anno/I° Semestre/Software Engineering for AI-Enabled Systems/Hopcroft/hopcroft_skill_classification_tool_competition/modeling/train.py", "fix": { "applicability": "safe", "edits": [ { "content": "\"⚠️ Local MLSMOTE not available; falling back to RandomOverSampler\"", "end_location": { "column": 84, "row": 568 }, "location": { "column": 15, "row": 568 } } ], "message": "Remove extraneous `f` prefix" }, "location": { "column": 15, "row": 568 }, "message": "f-string without any placeholders", "noqa_row": 568, "url": "https://docs.astral.sh/ruff/rules/f-string-missing-placeholders" } ]