

{"id":146623,"date":"2025-08-18T12:27:27","date_gmt":"2025-08-18T06:57:27","guid":{"rendered":"https:\/\/data-flair.training\/blogs\/?p=146623"},"modified":"2025-08-18T12:27:27","modified_gmt":"2025-08-18T06:57:27","slug":"diabetes-prediction-using-gradient-boosting","status":"publish","type":"post","link":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/","title":{"rendered":"ML Project &#8211; Diabetes Prediction using Gradient Boosting"},"content":{"rendered":"<h3>Program 1<\/h3>\n<p><a href=\"https:\/\/drive.google.com\/file\/d\/1PDqQrUmLuJW1Sd95vS-XTFYhvjkmbEKw\/view?usp=sharing\" target=\"_blank\" rel=\"noopener\"><strong>Diabetes Prediction Dataset<\/strong><\/a><\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\"># Import libraries\r\nimport pandas as pd\r\nfrom sklearn.model_selection import train_test_split\r\nfrom sklearn.preprocessing import LabelEncoder\r\nfrom sklearn.ensemble import GradientBoostingClassifier\r\nfrom sklearn.metrics import accuracy_score, confusion_matrix\r\n\r\n# Load dataset\r\ndf = pd.read_csv(\"D:\/\/scikit_data\/diabetes\/diabetes_prediction_dataset.csv\")\r\ndf.info()\r\n\r\n# Label Encoding for categorical column\r\nle = LabelEncoder()\r\ndf[\"Gender\"] = le.fit_transform(df[\"Gender\"])  # Male = 1, Female = 0\r\ndf.head()\r\n\r\n# Separate Independed and depended variables\r\nX = df.drop(\"Outcome\", axis=1) # Input\r\ny = df[\"Outcome\"] #Output\r\ny\r\n\r\n#  Split dataset\r\nX_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)\r\nlen(X_test)\r\n\r\n#  Train Gradient Boosting Classifier\r\n\r\nmodel = GradientBoostingClassifier(n_estimators=100, learning_rate=0.1, max_depth=3, random_state=42)\r\nmodel.fit(X_train, y_train) #Trained\r\n\r\n#  Evaluate model\r\ny_pred = model.predict(X_test)\r\nacc = accuracy_score(y_test, y_pred)\r\ncm = confusion_matrix(y_test, y_pred)\r\nprint(\" Model Performance\")\r\nprint(f\"Accuracy: {acc:.2f}\")\r\nprint(\"Confusion Matrix:\")\r\nprint(cm)\r\n\r\n# Step 8: User input for prediction (updated)\r\nprint(\"\\n Enter patient details to predict diabetes (1=Diabetic, 0=Not Diabetic):\")\r\n\r\nGender = input(\"Gender (Male\/Female): \").strip().capitalize()\r\nif Gender == \"Female\":\r\n    Pregnancies = int(input(\"Number of Pregnancies: \"))\r\n    Gender_encoded=0\r\nelse:\r\n    Pregnancies=0\r\n    Gender_encoded=1\r\n    # Not applicable to males\r\n\r\nGlucose = int(input(\"Glucose Level: \"))\r\nBloodPressure = int(input(\"Blood Pressure: \"))\r\nSkinThickness = int(input(\"Skin Thickness: \"))\r\nInsulin = int(input(\"Insulin Level: \"))\r\nBMI = float(input(\"BMI: \"))\r\nDPF = float(input(\"Diabetes Pedigree Function: \"))\r\nAge = int(input(\"Age: \"))\r\n\r\n\r\n# Create input DataFrame\r\ninput_data = pd.DataFrame([{\r\n    \"Pregnancies\": Pregnancies,\r\n    \"Glucose\": Glucose,\r\n    \"BloodPressure\": BloodPressure,\r\n    \"SkinThickness\": SkinThickness,\r\n    \"Insulin\": Insulin,\r\n    \"BMI\": BMI,\r\n    \"DiabetesPedigreeFunction\": DPF,\r\n    \"Age\": Age,\r\n    \"Gender\": Gender_encoded\r\n}])\r\n\r\n# Predict\r\nresult = model.predict(input_data)[0]\r\nprint(f\"\\n Prediction: {'Diabetic' if result == 1 else 'Not Diabetic'}\")\r\n<\/pre>\n<p>&nbsp;<span hidden class=\"__iawmlf-post-loop-links\" data-iawmlf-links=\"[{&quot;id&quot;:16,&quot;href&quot;:&quot;https:\\\/\\\/drive.google.com\\\/file\\\/d\\\/1PDqQrUmLuJW1Sd95vS-XTFYhvjkmbEKw\\\/view?usp=sharing&quot;,&quot;archived_href&quot;:&quot;&quot;,&quot;redirect_href&quot;:&quot;&quot;,&quot;checks&quot;:[],&quot;broken&quot;:false,&quot;last_checked&quot;:null,&quot;process&quot;:&quot;done&quot;}]\"><\/span><\/p>\n","protected":false},"excerpt":{"rendered":"<p>Program 1 Diabetes Prediction Dataset # Import libraries import pandas as pd from sklearn.model_selection import train_test_split from sklearn.preprocessing import LabelEncoder from sklearn.ensemble import GradientBoostingClassifier from sklearn.metrics import accuracy_score, confusion_matrix # Load dataset df =&#46;&#46;&#46;<\/p>\n","protected":false},"author":581,"featured_media":0,"comment_status":"open","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[36],"tags":[35079,35077,35078,8431,33127,33128,35080,20697],"class_list":["post-146623","post","type-post","status-publish","format-standard","hentry","category-machine-learning","tag-diabetes-prediction","tag-diabetes-prediction-using-gradient-boosting","tag-diabetes-prediction-using-machine-learning","tag-machine-learning","tag-machine-learning-practical","tag-machine-learning-program","tag-machine-learning-program-on-diabetes-prediction","tag-machine-learning-project"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v27.8 - https:\/\/yoast.com\/product\/yoast-seo-wordpress\/ -->\n<title>ML Project - Diabetes Prediction using Gradient Boosting - DataFlair<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/\" \/>\n<meta property=\"og:locale\" content=\"en_US\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"ML Project - Diabetes Prediction using Gradient Boosting - DataFlair\" \/>\n<meta property=\"og:description\" content=\"Program 1 Diabetes Prediction Dataset # Import libraries import pandas as pd from sklearn.model_selection import train_test_split from sklearn.preprocessing import LabelEncoder from sklearn.ensemble import GradientBoostingClassifier from sklearn.metrics import accuracy_score, confusion_matrix # Load dataset df =&#046;&#046;&#046;\" \/>\n<meta property=\"og:url\" content=\"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/\" \/>\n<meta property=\"og:site_name\" content=\"DataFlair\" \/>\n<meta property=\"article:publisher\" content=\"https:\/\/www.facebook.com\/DataFlairWS\/\" \/>\n<meta property=\"article:published_time\" content=\"2025-08-18T06:57:27+00:00\" \/>\n<meta name=\"author\" content=\"DataFlair Team\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:creator\" content=\"@DataFlairWS\" \/>\n<meta name=\"twitter:site\" content=\"@DataFlairWS\" \/>\n<meta name=\"twitter:label1\" content=\"Written by\" \/>\n\t<meta name=\"twitter:data1\" content=\"DataFlair Team\" \/>\n\t<meta name=\"twitter:label2\" content=\"Est. reading time\" \/>\n\t<meta name=\"twitter:data2\" content=\"1 minute\" \/>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"ML Project - Diabetes Prediction using Gradient Boosting - DataFlair","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/","og_locale":"en_US","og_type":"article","og_title":"ML Project - Diabetes Prediction using Gradient Boosting - DataFlair","og_description":"Program 1 Diabetes Prediction Dataset # Import libraries import pandas as pd from sklearn.model_selection import train_test_split from sklearn.preprocessing import LabelEncoder from sklearn.ensemble import GradientBoostingClassifier from sklearn.metrics import accuracy_score, confusion_matrix # Load dataset df =&#46;&#46;&#46;","og_url":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/","og_site_name":"DataFlair","article_publisher":"https:\/\/www.facebook.com\/DataFlairWS\/","article_published_time":"2025-08-18T06:57:27+00:00","author":"DataFlair Team","twitter_card":"summary_large_image","twitter_creator":"@DataFlairWS","twitter_site":"@DataFlairWS","twitter_misc":{"Written by":"DataFlair Team","Est. reading time":"1 minute"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"Article","@id":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/#article","isPartOf":{"@id":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/"},"author":{"name":"DataFlair Team","@id":"https:\/\/data-flair.training\/blogs\/#\/schema\/person\/c187795dc82ab948373cca526df7c445"},"headline":"ML Project &#8211; Diabetes Prediction using Gradient Boosting","datePublished":"2025-08-18T06:57:27+00:00","mainEntityOfPage":{"@id":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/"},"wordCount":13,"commentCount":0,"publisher":{"@id":"https:\/\/data-flair.training\/blogs\/#organization"},"keywords":["diabetes prediction","diabetes prediction using gradient boosting","diabetes prediction using machine learning","machine learning","machine learning practical","machine learning program","machine learning program on diabetes prediction","machine learning project"],"articleSection":["Machine Learning Tutorials"],"inLanguage":"en-US","potentialAction":[{"@type":"CommentAction","name":"Comment","target":["https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/#respond"]}]},{"@type":"WebPage","@id":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/","url":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/","name":"ML Project - Diabetes Prediction using Gradient Boosting - DataFlair","isPartOf":{"@id":"https:\/\/data-flair.training\/blogs\/#website"},"datePublished":"2025-08-18T06:57:27+00:00","breadcrumb":{"@id":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/#breadcrumb"},"inLanguage":"en-US","potentialAction":[{"@type":"ReadAction","target":["https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/data-flair.training\/blogs\/diabetes-prediction-using-gradient-boosting\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Blog Home","item":"https:\/\/data-flair.training\/blogs\/"},{"@type":"ListItem","position":2,"name":"Machine Learning Tutorials","item":"https:\/\/data-flair.training\/blogs\/category\/machine-learning\/"},{"@type":"ListItem","position":3,"name":"ML Project &#8211; Diabetes Prediction using Gradient Boosting"}]},{"@type":"WebSite","@id":"https:\/\/data-flair.training\/blogs\/#website","url":"https:\/\/data-flair.training\/blogs\/","name":"DataFlair","description":"Learn Today. Lead Tomorrow.","publisher":{"@id":"https:\/\/data-flair.training\/blogs\/#organization"},"potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/data-flair.training\/blogs\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"en-US"},{"@type":"Organization","@id":"https:\/\/data-flair.training\/blogs\/#organization","name":"DataFlair","url":"https:\/\/data-flair.training\/blogs\/","logo":{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/data-flair.training\/blogs\/#\/schema\/logo\/image\/","url":"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2016\/07\/Data-Flair.png","contentUrl":"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2016\/07\/Data-Flair.png","width":106,"height":48,"caption":"DataFlair"},"image":{"@id":"https:\/\/data-flair.training\/blogs\/#\/schema\/logo\/image\/"},"sameAs":["https:\/\/www.facebook.com\/DataFlairWS\/","https:\/\/x.com\/DataFlairWS","https:\/\/www.linkedin.com\/company\/dataflair-web-services-pvt-ltd\/","https:\/\/www.youtube.com\/user\/DataFlairWS"]},{"@type":"Person","@id":"https:\/\/data-flair.training\/blogs\/#\/schema\/person\/c187795dc82ab948373cca526df7c445","name":"DataFlair Team","image":{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/secure.gravatar.com\/avatar\/2302ebc438084d2f1f993edc1996a0aae01332e81f3227cba8df0c48ec010ca4?s=96&d=mm&r=g","url":"https:\/\/secure.gravatar.com\/avatar\/2302ebc438084d2f1f993edc1996a0aae01332e81f3227cba8df0c48ec010ca4?s=96&d=mm&r=g","contentUrl":"https:\/\/secure.gravatar.com\/avatar\/2302ebc438084d2f1f993edc1996a0aae01332e81f3227cba8df0c48ec010ca4?s=96&d=mm&r=g","caption":"DataFlair Team"},"description":"DataFlair Team provides high-impact content on programming, Java, Python, C++, DSA, AI, ML, data Science, Android, Flutter, MERN, Web Development, and technology. We make complex concepts easy to grasp, helping learners of all levels succeed in their tech careers.","url":"https:\/\/data-flair.training\/blogs\/author\/dfteam6\/"}]}},"amp_enabled":true,"_links":{"self":[{"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/posts\/146623","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/users\/581"}],"replies":[{"embeddable":true,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/comments?post=146623"}],"version-history":[{"count":3,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/posts\/146623\/revisions"}],"predecessor-version":[{"id":146640,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/posts\/146623\/revisions\/146640"}],"wp:attachment":[{"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/media?parent=146623"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/categories?post=146623"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/tags?post=146623"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}