Spaces:
Sleeping
Sleeping
Update data/profile.json
Browse files- data/profile.json +83 -101
data/profile.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
{
|
| 3 |
"type": "Personal Profile",
|
| 4 |
"name": "RONALD NYASHA KANYEPI",
|
| 5 |
-
"summary": "Data Scientist
|
| 6 |
"contact": {
|
| 7 |
"email": "kanyepironald@gmail.com",
|
| 8 |
"linkedin": "https://www.linkedin.com/in/ronald-nyasha-kanyepi/",
|
|
@@ -15,14 +15,14 @@
|
|
| 15 |
"location": "Atlanta, GA",
|
| 16 |
"degree": "Master of Science in Business Analytics",
|
| 17 |
"graduation_year": 2025,
|
| 18 |
-
"notes": "Graduated with MSBA Rigor Award for
|
| 19 |
},
|
| 20 |
{
|
| 21 |
"institution": "UNIVERSITY OF ZIMBABWE",
|
| 22 |
"location": "Harare, Zimbabwe",
|
| 23 |
"degree": "Bachelor of Business Studies and Computing Science",
|
| 24 |
"graduation_year": 2021,
|
| 25 |
-
"notes": "Graduated with
|
| 26 |
}
|
| 27 |
],
|
| 28 |
"certifications": [
|
|
@@ -38,10 +38,10 @@
|
|
| 38 |
"company": "Pennybacker Capital - Austin, Texas",
|
| 39 |
"dates": "Dec 2024 - May 2025",
|
| 40 |
"achievements": [
|
| 41 |
-
"Designed and deployed
|
| 42 |
-
"Engineered
|
| 43 |
-
"
|
| 44 |
-
"Translated complex
|
| 45 |
]
|
| 46 |
},
|
| 47 |
{
|
|
@@ -49,10 +49,10 @@
|
|
| 49 |
"company": "AFC Commercial Bank - Harare, Zimbabwe",
|
| 50 |
"dates": "Mar 2024 – Jun 2024",
|
| 51 |
"achievements": [
|
| 52 |
-
|
| 53 |
-
|
| 54 |
-
|
| 55 |
-
|
| 56 |
]
|
| 57 |
},
|
| 58 |
{
|
|
@@ -60,98 +60,80 @@
|
|
| 60 |
"company": "AFC Commercial Bank - Harare, Zimbabwe",
|
| 61 |
"dates": "Jun 2022 – Feb 2024",
|
| 62 |
"achievements": [
|
| 63 |
-
"
|
| 64 |
-
"
|
| 65 |
-
"
|
| 66 |
-
"Modernized a monolithic reconciliation
|
| 67 |
]
|
| 68 |
}
|
| 69 |
],
|
| 70 |
"technical_capabilities": {
|
| 71 |
-
"Programming & Machine Learning": [
|
| 72 |
-
|
| 73 |
-
|
| 74 |
-
|
| 75 |
-
|
| 76 |
-
|
| 77 |
-
|
| 78 |
-
|
| 79 |
-
|
| 80 |
-
|
| 81 |
-
|
| 82 |
-
"
|
| 83 |
-
|
| 84 |
-
|
| 85 |
-
|
| 86 |
-
|
| 87 |
-
"
|
| 88 |
-
|
| 89 |
-
|
| 90 |
-
|
| 91 |
-
|
| 92 |
-
|
| 93 |
-
"
|
| 94 |
-
|
| 95 |
-
|
| 96 |
-
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
|
| 100 |
-
|
| 101 |
-
|
| 102 |
-
|
| 103 |
-
|
| 104 |
-
|
| 105 |
-
|
| 106 |
-
|
| 107 |
-
|
| 108 |
-
|
| 109 |
-
|
| 110 |
-
|
| 111 |
-
|
| 112 |
-
|
| 113 |
-
|
| 114 |
-
|
| 115 |
-
|
| 116 |
-
|
| 117 |
-
|
| 118 |
-
|
| 119 |
-
|
| 120 |
-
|
| 121 |
-
|
| 122 |
-
|
| 123 |
-
|
| 124 |
-
|
| 125 |
-
|
| 126 |
-
|
| 127 |
-
|
| 128 |
-
|
| 129 |
-
|
| 130 |
-
|
| 131 |
-
|
| 132 |
-
|
| 133 |
-
|
| 134 |
-
|
| 135 |
-
|
| 136 |
-
|
| 137 |
-
|
| 138 |
-
"Developed an interactive dashboard in Dash with real-time updates for SLA metrics, error rates, and response times.",
|
| 139 |
-
"Containerized the entire architecture using Docker-compose, including Zookeeper, Kafka, DynamoDB, and a Spark-Jupyter environment."
|
| 140 |
-
],
|
| 141 |
-
"technologies": ["Python", "Apache Kafka", "Apache Spark", "DynamoDB", "HDFS", "Parquet", "Docker", "Dash", "Plotly"],
|
| 142 |
-
"source_url": "https://github.com/ronaldkanyepi/Log-Realtime-Analysis"
|
| 143 |
-
},
|
| 144 |
-
{
|
| 145 |
-
"type": "Project",
|
| 146 |
-
"project_name": "Zim Docs OCR-to-JSON Extractor",
|
| 147 |
-
"summary": "A web application built with Gradio that allows users to upload scanned documents (PDFs) or images. It uses a vision AI model to perform OCR and extract structured information into a JSON format for various document types like licenses, passports, and invoices.",
|
| 148 |
-
"my_role_and_achievements": [
|
| 149 |
-
"Built a user-friendly web application using Gradio.",
|
| 150 |
-
"Integrated a vision AI model to perform OCR and structured data extraction.",
|
| 151 |
-
"Handled both PDF and image file uploads using Gradio-PDF and PyMuPDF.",
|
| 152 |
-
"Managed API key integration via environment variables for use with services like OpenRouter.ai, making it compatible with Hugging Face Spaces secrets."
|
| 153 |
-
],
|
| 154 |
-
"technologies": ["Python", "Gradio", "Gradio-PDF", "PyMuPDF (fitz)", "OpenAI-compatible APIs"],
|
| 155 |
-
"source_url": {"demo":"https://huggingface.co/spaces/NyashaK/DocOCR2JSON","github": "https://github.com/ronaldkanyepi/docs-ocr-2-json"}
|
| 156 |
}
|
| 157 |
-
]
|
|
|
|
| 2 |
{
|
| 3 |
"type": "Personal Profile",
|
| 4 |
"name": "RONALD NYASHA KANYEPI",
|
| 5 |
+
"summary": "Data Scientist & Applied AI Engineer with 3+ years of experience in machine learning, applied AI, and data-driven innovation. Focused on building scalable systems, operational efficiency, and actionable insights. Skilled in designing and deploying end-to-end ML pipelines, agentic workflows, RAG-enabled systems, and real-time data solutions using Python, SQL, Spark, and AWS. Experienced in leveraging LLMs, LangGraph, LangChain, and Generative AI to optimize business processes, enable decision intelligence, and deliver measurable impact across financial services, real estate, and enterprise analytics.",
|
| 6 |
"contact": {
|
| 7 |
"email": "kanyepironald@gmail.com",
|
| 8 |
"linkedin": "https://www.linkedin.com/in/ronald-nyasha-kanyepi/",
|
|
|
|
| 15 |
"location": "Atlanta, GA",
|
| 16 |
"degree": "Master of Science in Business Analytics",
|
| 17 |
"graduation_year": 2025,
|
| 18 |
+
"notes": "Graduated with MSBA Rigor Award for proficiency in advanced analytics, statistical modeling, ML deployment, and data engineering to solve complex business problems with clarity, precision, and strategic impact."
|
| 19 |
},
|
| 20 |
{
|
| 21 |
"institution": "UNIVERSITY OF ZIMBABWE",
|
| 22 |
"location": "Harare, Zimbabwe",
|
| 23 |
"degree": "Bachelor of Business Studies and Computing Science",
|
| 24 |
"graduation_year": 2021,
|
| 25 |
+
"notes": "Graduated with First Class Honors and awarded the UZ Book Prize for top academic performance, demonstrating strong foundation in computing, analytics, and business strategy."
|
| 26 |
}
|
| 27 |
],
|
| 28 |
"certifications": [
|
|
|
|
| 38 |
"company": "Pennybacker Capital - Austin, Texas",
|
| 39 |
"dates": "Dec 2024 - May 2025",
|
| 40 |
"achievements": [
|
| 41 |
+
"Designed and deployed ML models forecasting quarterly Gross Asset Value (GAV) for a $4B+ real estate portfolio with 1% error (MAPE), mitigating ~$2M in potential losses.",
|
| 42 |
+
"Engineered end-to-end data pipelines integrating 50+ internal and external sources on Databricks for predictive modeling, automated reporting, and risk monitoring.",
|
| 43 |
+
"Developed a sentiment-driven early warning system using Google Reviews to detect operational risks and opportunities across 11 multifamily properties.",
|
| 44 |
+
"Translated complex ML predictions into actionable business strategies using SHAP and LIME, improving executive decision-making."
|
| 45 |
]
|
| 46 |
},
|
| 47 |
{
|
|
|
|
| 49 |
"company": "AFC Commercial Bank - Harare, Zimbabwe",
|
| 50 |
"dates": "Mar 2024 – Jun 2024",
|
| 51 |
"achievements": [
|
| 52 |
+
"Led analytics for OK Grand Challenge promotion, increasing POS transactions by 200% across 70+ outlets.",
|
| 53 |
+
"Developed dashboards with Python, Apache Spark, and Dash Plotly to monitor 20,000+ ATM and POS transactions in real-time, enabling rapid operational interventions.",
|
| 54 |
+
"Implemented XGBoost-based churn prediction models, improving retention effectiveness by 25% and reducing customer churn by 15%.",
|
| 55 |
+
"Automated data migration workflows from T24 to IDC Core Banking System, achieving 99.4% accuracy while minimizing downtime."
|
| 56 |
]
|
| 57 |
},
|
| 58 |
{
|
|
|
|
| 60 |
"company": "AFC Commercial Bank - Harare, Zimbabwe",
|
| 61 |
"dates": "Jun 2022 – Feb 2024",
|
| 62 |
"achievements": [
|
| 63 |
+
"Built FastAPI backend integrating RBZ API for CRB, reducing processing time by 40% and enhancing compliance.",
|
| 64 |
+
"Created Kafka-Python ETL pipelines standardizing core banking data for branch-wide KPIs.",
|
| 65 |
+
"Optimized reporting services using Airflow and DBT, automating manual processes and increasing efficiency by 80%.",
|
| 66 |
+
"Modernized a monolithic reconciliation application into microservices with Docker, Kubernetes, FastAPI, and Angular, boosting throughput by 150%."
|
| 67 |
]
|
| 68 |
}
|
| 69 |
],
|
| 70 |
"technical_capabilities": {
|
| 71 |
+
"Programming & Machine Learning": [
|
| 72 |
+
"Python", "R", "TypeScript", "SQL", "scikit-learn", "Darts", "Statsmodels", "ARIMA/SARIMA",
|
| 73 |
+
"TensorFlow", "PyTorch", "LightGBM", "XGBoost", "CatBoost", "Large Language Models (LLMs)",
|
| 74 |
+
"Retrieval-Augmented Generation (RAG)", "LangGraph", "LangChain", "LlamaIndex",
|
| 75 |
+
"OpenAI APIs", "HuggingFace Transformers", "SHAP", "Optuna", "MCP", "Chainlit"
|
| 76 |
+
],
|
| 77 |
+
"Data Engineering & MLOps": [
|
| 78 |
+
"Apache Spark", "Kafka", "Airflow", "Docker", "Kubernetes", "dbt", "Great Expectations",
|
| 79 |
+
"AWS S3, Glue, EMR", "REST APIs", "Feature Stores", "CI/CD with GitHub Actions",
|
| 80 |
+
"Model Deployment with FastAPI, MLflow, Chainlit"
|
| 81 |
+
],
|
| 82 |
+
"Visualization & Analytics": [
|
| 83 |
+
"Dash (Plotly)", "Streamlit", "Tableau", "Power BI", "Excel", "Matplotlib", "Seaborn",
|
| 84 |
+
"Time Series Forecasting", "A/B Testing", "Uplift Modeling", "Segmentation",
|
| 85 |
+
"Deep Exploratory Data Analysis (EDA)"
|
| 86 |
+
],
|
| 87 |
+
"Cloud, Databases & Storage": [
|
| 88 |
+
"AWS (S3, SageMaker, Redshift)", "Databricks", "PostgreSQL", "SQL Server", "MySQL",
|
| 89 |
+
"DynamoDB", "MongoDB", "DuckDB", "Vector Stores (FAISS, Chroma)", "NoSQL", "ElasticSearch",
|
| 90 |
+
"Parquet", "ORC", "JSON", "Avro"
|
| 91 |
+
]
|
| 92 |
+
},
|
| 93 |
+
"projects": [
|
| 94 |
+
{
|
| 95 |
+
"project_name": "QueryCraft AI",
|
| 96 |
+
"summary": "Conversational AI platform enabling natural language queries over complex databases, leveraging LangGraph, RAG, and multi-step LLM orchestration for automated SQL generation, validation, execution, and summarization.",
|
| 97 |
+
"my_role_and_achievements": [
|
| 98 |
+
"Built full-stack solution with Next.js frontend, FastAPI backend, Docker/Kubernetes deployment, LangFuse observability, MCP integration, and ZITADEL authentication.",
|
| 99 |
+
"Implemented agentic workflows orchestrating LLM reasoning, schema-aware SQL generation, and automated validation pipelines."
|
| 100 |
+
],
|
| 101 |
+
"technologies": ["Python", "FastAPI", "Next.js", "Docker", "Kubernetes", "LangGraph", "RAG", "LangFuse", "MCP", "ZITADEL"],
|
| 102 |
+
"source_url": "https://github.com/ronaldkanyepi/PersonalRAG"
|
| 103 |
+
},
|
| 104 |
+
{
|
| 105 |
+
"project_name": "Sports Ticket Sales Forecasting",
|
| 106 |
+
"summary": "Predictive model for Atlanta Braves ticket sales integrating attendance, promotions, and weather data.",
|
| 107 |
+
"my_role_and_achievements": [
|
| 108 |
+
"Achieved 3.3% forecast error using XGBoost and LSTM ensembles.",
|
| 109 |
+
"Optimized feature engineering and model selection pipelines for precise forecasting."
|
| 110 |
+
],
|
| 111 |
+
"technologies": ["Python", "XGBoost", "LSTM", "Pandas", "NumPy", "Scikit-learn"],
|
| 112 |
+
"source_url": "https://github.com/ronaldkanyepi/Sports-Ticket-Forecasting"
|
| 113 |
+
},
|
| 114 |
+
{
|
| 115 |
+
"project_name": "Log Real-Time Analysis",
|
| 116 |
+
"summary": "High-throughput log aggregation and visualization system handling 60,000 events/sec.",
|
| 117 |
+
"my_role_and_achievements": [
|
| 118 |
+
"Designed Kafka-Spark ETL pipelines and integrated DynamoDB for real-time metrics.",
|
| 119 |
+
"Visualized operational insights using Dash Plotly and deployed scalable architecture via Docker-compose."
|
| 120 |
+
],
|
| 121 |
+
"technologies": ["Python", "Kafka", "Spark", "DynamoDB", "Dash", "Plotly", "Docker"],
|
| 122 |
+
"source_url": "https://github.com/ronaldkanyepi/Log-Realtime-Analysis"
|
| 123 |
+
},
|
| 124 |
+
{
|
| 125 |
+
"project_name": "Zim Docs OCR-to-JSON Extractor",
|
| 126 |
+
"summary": "Web app converting scanned documents into structured JSON format using vision AI for licenses, passports, and invoices.",
|
| 127 |
+
"my_role_and_achievements": [
|
| 128 |
+
"Built scalable OCR pipeline with Gradio, PyMuPDF, and OpenAI-compatible APIs.",
|
| 129 |
+
"Handled both PDFs and image inputs for structured, machine-readable outputs."
|
| 130 |
+
],
|
| 131 |
+
"technologies": ["Python", "Gradio", "PyMuPDF", "OpenAI APIs"],
|
| 132 |
+
"source_url": {
|
| 133 |
+
"demo": "https://huggingface.co/spaces/NyashaK/DocOCR2JSON",
|
| 134 |
+
"github": "https://github.com/ronaldkanyepi/docs-ocr-2-json"
|
| 135 |
+
}
|
| 136 |
+
}
|
| 137 |
+
]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 138 |
}
|
| 139 |
+
]
|