Spaces:
Running
Running
copernicusai / computer-science-processes-database /processes /machine_learning /machine_learning-feature-engineering-pipeline.json
| { | |
| "id": "machine_learning-feature-engineering-pipeline", | |
| "name": "Feature Engineering Pipeline", | |
| "category": "computer_science", | |
| "subcategory": "machine_learning", | |
| "subcategory_name": "Machine Learning", | |
| "description": "Feature Engineering Pipeline process visualization. This process flowchart outlines key steps, checks, and outputs.", | |
| "complexity": { | |
| "nodes": 13, | |
| "edges": 14, | |
| "conditionals": 2, | |
| "logicGates": { | |
| "orGates": 3, | |
| "andGates": 1, | |
| "notGates": 0, | |
| "total": 4 | |
| }, | |
| "level": "high", | |
| "detailLevel": "source_grounded_rebuild", | |
| "loops": 1 | |
| }, | |
| "colorScheme": { | |
| "red": { | |
| "hex": "#ff6b6b", | |
| "category": "Triggers & Inputs" | |
| }, | |
| "yellow": { | |
| "hex": "#ffd43b", | |
| "category": "Structures & Objects" | |
| }, | |
| "green": { | |
| "hex": "#51cf66", | |
| "category": "Processing & Operations" | |
| }, | |
| "blue": { | |
| "hex": "#74c0fc", | |
| "category": "Intermediates & States" | |
| }, | |
| "violet": { | |
| "hex": "#b197fc", | |
| "category": "Products & Outputs" | |
| } | |
| }, | |
| "mermaid": "graph TD\n N1[\"Feature Engineering Pipeline...\"]\n N2[\"Raw Data\"]\n N3[\"Target Definition\"]\n N4[\"Schema + Types\"]\n N5[\"Train/Val Split\"]\n N6[\"Clean/Impute\"]\n N7[\"Encode/Scale\"]\n N8[\"Generate Features\"]\n N9{\"Select Features\"}\n N10[\"Feature Dataset Artifact\"]\n N11[\"Model-Ready Features\"]\n N12{\"Source-grounded check: Feature...\"}\n N13[\"Feature Engineering Pipeline...\"]\n\n N1 --> N2\n N2 --> N3\n N3 --> N4\n N4 --> N5\n N5 --> N6\n N6 --> N7\n N7 --> N8\n N8 --> N9\n N9 -->|yes| N10\n N10 --> N11\n N11 --> N12\n N12 -->|yes| N13\n N8 -->|iterate| N3\n N4 -->|skip/opt| N7\n\n style N1 fill:#ff6b6b,color:#fff\n style N2 fill:#ff6b6b,color:#fff\n style N3 fill:#ff6b6b,color:#fff\n style N4 fill:#ffd43b,color:#000\n style N5 fill:#ffd43b,color:#000\n style N6 fill:#51cf66,color:#fff\n style N7 fill:#51cf66,color:#fff\n style N8 fill:#51cf66,color:#fff\n style N9 fill:#51cf66,color:#fff\n style N10 fill:#74c0fc,color:#fff\n style N11 fill:#b197fc,color:#fff\n style N12 fill:#ffd43b,color:#000\n style N13 fill:#b197fc,color:#fff", | |
| "sources": [ | |
| { | |
| "title": "Feature Selection and Feature Engineering", | |
| "authors": "El-Amir, Hisham; Hamdy, Mahmoud", | |
| "journal": "Deep Learning Pipeline", | |
| "year": "2019", | |
| "pubmed": null, | |
| "doi": "10.1007/978-1-4842-5349-6_8", | |
| "url": "https://doi.org/10.1007/978-1-4842-5349-6_8" | |
| }, | |
| { | |
| "title": "Pattern Recognition and Machine Learning", | |
| "authors": "Bishop, C. M.", | |
| "journal": "Springer", | |
| "year": "2006", | |
| "pubmed": null, | |
| "doi": null, | |
| "url": "https://link.springer.com/book/9780387310732" | |
| }, | |
| { | |
| "title": "The Elements of Statistical Learning", | |
| "authors": "Hastie, T.; Tibshirani, R.; Friedman, J.", | |
| "journal": "Springer", | |
| "year": "2009", | |
| "pubmed": null, | |
| "doi": "10.1007/978-0-387-84858-7", | |
| "url": "https://doi.org/10.1007/978-0-387-84858-7" | |
| }, | |
| { | |
| "title": "Deep Learning", | |
| "authors": "Goodfellow, I.; Bengio, Y.; Courville, A.", | |
| "journal": "MIT Press", | |
| "year": "2016", | |
| "pubmed": null, | |
| "doi": null, | |
| "url": "https://www.deeplearningbook.org/" | |
| } | |
| ], | |
| "keywords": [ | |
| "feature", | |
| "engineering", | |
| "pipeline" | |
| ], | |
| "relatedProcesses": [], | |
| "created": "2026-01-15", | |
| "lastUpdated": "2026-04-30", | |
| "verified": false, | |
| "notes": "Corrective rebuild: replaces the generic scaffold with a process-specific step structure and records topology for duplicate detection.", | |
| "namedCollections": [], | |
| "graphMetrics": { | |
| "nodes": 13, | |
| "edges": 14, | |
| "conditionals": 2, | |
| "andGates": 1, | |
| "orGates": 3, | |
| "notGates": 0, | |
| "loops": 1 | |
| }, | |
| "nodeDetails": [ | |
| { | |
| "id": "N1", | |
| "label": "Feature Engineering Pipeline...", | |
| "detail": "Feature Engineering Pipeline research question", | |
| "type": "process", | |
| "role": "Triggers & Inputs" | |
| }, | |
| { | |
| "id": "N2", | |
| "label": "Raw Data", | |
| "detail": "Raw Data", | |
| "type": "process", | |
| "role": "Triggers & Inputs" | |
| }, | |
| { | |
| "id": "N3", | |
| "label": "Target Definition", | |
| "detail": "Target Definition", | |
| "type": "process", | |
| "role": "Triggers & Inputs" | |
| }, | |
| { | |
| "id": "N4", | |
| "label": "Schema + Types", | |
| "detail": "Schema + Types", | |
| "type": "process", | |
| "role": "Structures & Objects" | |
| }, | |
| { | |
| "id": "N5", | |
| "label": "Train/Val Split", | |
| "detail": "Train/Val Split", | |
| "type": "process", | |
| "role": "Structures & Objects" | |
| }, | |
| { | |
| "id": "N6", | |
| "label": "Clean/Impute", | |
| "detail": "Clean/Impute", | |
| "type": "process", | |
| "role": "Processing & Operations" | |
| }, | |
| { | |
| "id": "N7", | |
| "label": "Encode/Scale", | |
| "detail": "Encode/Scale", | |
| "type": "process", | |
| "role": "Processing & Operations" | |
| }, | |
| { | |
| "id": "N8", | |
| "label": "Generate Features", | |
| "detail": "Generate Features", | |
| "type": "process", | |
| "role": "Processing & Operations" | |
| }, | |
| { | |
| "id": "N9", | |
| "label": "Select Features", | |
| "detail": "Select Features", | |
| "type": "decision", | |
| "role": "Processing & Operations" | |
| }, | |
| { | |
| "id": "N10", | |
| "label": "Feature Dataset Artifact", | |
| "detail": "Feature Dataset Artifact", | |
| "type": "process", | |
| "role": "Intermediates & States" | |
| }, | |
| { | |
| "id": "N11", | |
| "label": "Model-Ready Features", | |
| "detail": "Model-Ready Features", | |
| "type": "process", | |
| "role": "Products & Outputs" | |
| }, | |
| { | |
| "id": "N12", | |
| "label": "Source-grounded check: Feature...", | |
| "detail": "Source-grounded check: Feature Selection and Feature Engineering", | |
| "type": "decision", | |
| "role": "Structures & Objects" | |
| }, | |
| { | |
| "id": "N13", | |
| "label": "Feature Engineering Pipeline...", | |
| "detail": "Feature Engineering Pipeline prediction/readout", | |
| "type": "process", | |
| "role": "Products & Outputs" | |
| } | |
| ], | |
| "flowchartStandard": { | |
| "name": "source_grounded_rebuild_v1", | |
| "applied": "2026-04-30", | |
| "curationStatus": "source_grounded_draft", | |
| "basis": "cs_exact_template", | |
| "topologySignature": "2bb2c0ba4603444c", | |
| "sourceGrounding": "Graph steps are derived from the process title, existing source metadata, and curated process/subfield templates; citations support the process topic and should be reviewed for node-level claims before marking verified." | |
| } | |
| } | |