{"id":21865444,"url":"https://github.com/wa-lead/ml485_blind_preprocessing_prediction_comp","last_synced_at":"2026-05-19T15:11:31.920Z","repository":{"id":166460334,"uuid":"641949324","full_name":"Wa-lead/ML485_blind_preprocessing_prediction_comp","owner":"Wa-lead","description":"This project aims to achieve the best prediction results by applying various preprocessing techniques and blind data engineering.","archived":false,"fork":false,"pushed_at":"2023-05-17T14:09:13.000Z","size":1449,"stargazers_count":0,"open_issues_count":0,"forks_count":0,"subscribers_count":2,"default_branch":"main","last_synced_at":"2025-01-26T15:46:02.782Z","etag":null,"topics":["data-engineering","data-visualization","machine-learning","python"],"latest_commit_sha":null,"homepage":"","language":"Jupyter Notebook","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/Wa-lead.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2023-05-17T13:54:50.000Z","updated_at":"2023-05-17T14:13:35.000Z","dependencies_parsed_at":null,"dependency_job_id":"ab4dc64e-2bc8-4b71-9840-ffaa746572eb","html_url":"https://github.com/Wa-lead/ML485_blind_preprocessing_prediction_comp","commit_stats":null,"previous_names":["Wa-lead/ML485_blind_preprocessing_prediction_comp"],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Wa-lead%2FML485_blind_preprocessing_prediction_comp","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Wa-lead%2FML485_blind_preprocessing_prediction_comp/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Wa-lead%2FML485_blind_preprocessing_prediction_comp/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Wa-lead%2FML485_blind_preprocessing_prediction_comp/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/Wa-lead","download_url":"https://codeload.github.com/Wa-lead/ML485_blind_preprocessing_prediction_comp/tar.gz/refs/heads/main","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":244868752,"owners_count":20523591,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["data-engineering","data-visualization","machine-learning","python"],"created_at":"2024-11-28T04:16:39.619Z","updated_at":"2026-05-19T15:11:31.882Z","avatar_url":"https://github.com/Wa-lead.png","language":"Jupyter Notebook","funding_links":[],"categories":[],"sub_categories":[],"readme":"# ML485_blind_preprocessing_prediction_comp\nThis project aims to achieve the best prediction results by applying various preprocessing techniques and blind data engineering.\n\n# Data Preprocessing\nTo gain an understanding of the data structure and the separation of classes, the initial step involved using UMAP (Uniform Manifold Approximation and Projection). Additionally, the data was imputed, and generic data engineering techniques were applied. Finally, feature selection was performed using mutual information.\n\n# Prediction\nSeveral models were evaluated, and XGBoost emerged as the top-performing model for prediction.\n\n# Gain Further Insights into the Data\nTo gain insights into the weaknesses of the model, various techniques were employed to understand the reasons behind incorrect predictions (details can be found in the \"main.ipynb\" file).\n\nPlease refer to the \"main.ipynb\" file for a more comprehensive analysis and implementation details.\n\n\" Won first place btw 🥱 \"\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fwa-lead%2Fml485_blind_preprocessing_prediction_comp","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fwa-lead%2Fml485_blind_preprocessing_prediction_comp","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fwa-lead%2Fml485_blind_preprocessing_prediction_comp/lists"}