15:[["$","$L133",null,{"props":{"lessonContent":{"components":[{"type":"SlateHTML","content":{"html":"

Finding the optimal split

Similar to classification trees, the CART algorithm has to find optimal regression tree splits efficiently. In the case of numeric features, this is a challenge because numeric features have many unique values. Once again, the CART algorithm utilizes an optimization to evaluate potential split points efficiently.

Consider training a CART regression tree model to impute missing values of the Age ...

","comp_id":"aHLMnPwhkaqcT8kz0EiQK"},"hash":0,"iteration":0}],"summary":{"description":"Learn how CART regression trees split training data using numeric features.","titleUpdated":true},"content":[{"type":"SlateHTML","content":{"html":"

Finding the optimal split

Consider training a CART regression tree model to impute missing values of the Age ...

","comp_id":"aHLMnPwhkaqcT8kz0EiQK"},"hash":0,"iteration":0}],"darkModeContent":[{"type":"SlateHTML","content":{"html":"

Finding the optimal split

Consider training a CART regression tree model to impute missing values of the Age ...

","comp_id":"aHLMnPwhkaqcT8kz0EiQK"},"hash":0,"iteration":0}]},"isPreviewLesson":false,"pageType":"collection_lesson","aiCoachVideoUrl":"https://youtu.be/kgl8y9J3O6c","collectionDetailsSSR":{"title":"Data Science with R: Decision Trees and Random Forests","summary":"The R programming language is widely used in the field of data science. Machine learning is a fundamental skill for learners looking to master industry algorithms in the field of data science.\n\nIn this course, you’ll learn about several essential algorithms used in machine learning, including classification and regression trees (CART), random forest, and XGBoost. CART is a decision tree algorithm that’s used for both classification and regression problems. Random forest is an ensemble learning method that uses multiple decision trees to improve the accuracy of predictions. XGBoost, short for Extreme Gradient Boosting, is a powerful algorithm that’s also used for regression and classification problems. You’ll also learn about cross-validation and model tuning, which are essential skills for crafting valuable machine learning models. \n\nAfter taking this course, you’ll have the crucial skills to ensure that the machine learning models you create are accurate, robust, and reliable.","details":"

Placeholder text - revise later.

","clos":["An understanding of the basics of machine learning and supervised learning","Familiarity with the differences between classification and regression trees","A working knowledge of XGBoost algorithm","Familiarity with random forest"],"arabic_available":false,"page_tags":{"6286392844091392":"","6420773042651136":"","5485115541291008":"","5745850255147008":"","5182900301725696":"","5248020696530944":"","5121639488684032":"","6580324316479488":"","5093693747101696":"","4534837887369216":"","4830903941726208":"","6277861109661696":"","4977384489222144":"","4841749052915712":"","5472779271143424":"","6392196293197824":"","4783490791112704":"","6503547011334144":"","5223002595917824":"","6746499075801088":"","5120841228746752":"","6704072038285312":"","6393659325153280":"","6652551036665856":"","6362714110951424":"","6693522239651840":"","6464617243213824":"","5112385897758720":"","6501700762599424":"","6027611845427200":"","5267976330936320":"","6279341002719232":"","6241183862095872":"","6233221756092416":"","4651883248746496":"","6660473157320704":"","6653498672545792":"","5893851640496128":"","6614892360761344":"","6550321011884032":"","5638641734123520":"","5888362269638656":"","4880476202598400":"","6545121489453056":"","5257396895350784":"","6691198150639616":"","6533184886145024":"","6063127441702912":"","5641571720757248":"","5756978901286912":"","4933405567614976":"","5338139948482560":"","5018544560668672":"","4766676353810432":"","4506610279120896":"","5077109234204672":"","5817961162211328":"","5714070273785856":"","4849781983936512":"","4935661876674560":"","6187325999284224":"","5453158919438336":"","5509753502171136":"","5036837639553024":"","5713765460606976":""},"collection_toc_is_enabled":true,"page_count":null,"docker":{"container":{"file":{"name":"Dockerfile.tar.gz","size":273},"imageName":"author-6586453712175104-collection-6161393571332096-rev-19-container-5112188626010112-dockerfile","buildStatus":"SUCCESS","buildStatusUrl":"https://www.educative.io/api/author/6586453712175104/collection/6161393571332096/containers/5112188626010112/build/status","buildLogUrl":"https://www.educative.io/api/author/6586453712175104/collection/6161393571332096/containers/5112188626010112/build/log","metadata":{"sizeInBytes":273},"id":-1,"tarballDownloadUrl":"https://www.educative.io/api/author/6586453712175104/collection/6161393571332096/containers/5112188626010112/download","rebuildImageUrl":"https://www.educative.io/api/author/6586453712175104/collection/6161393571332096/containers/5112188626010112/rebuild","track":false},"envs":[],"jobs":[{"key":"h21jvdVWiHKdc7xVMc7JE","jobType":"Default","name":"tidymodels","inputFileName":"main.r","runScript":"Rscript main.r","runInLiveContainer":false}],"testRunners":[],"version":3,"loaded":true},"discounted_price":29,"cover_image_id":4847458744139776,"cover_image_metadata":"{\"width\":1024,\"height\":512,\"sizeInBytes\":32485,\"name\":\"Data Science with R Machine Learning.png\"}","cover_image_serving_url":"/v2api/collection/6586453712175104/6161393571332096/image/4847458744139776","tags":[],"intro_video_url":"","intro_video_thumbnail_url":"","aggregated_widget_stats":{"projects":0,"assessments":0,"SlateHTML":294,"codeExerciseCount":0,"codeRunnableCount":67,"codeSnippetCount":29,"illustrations":62,"Table":41,"Code":96,"Columns":5,"Image":4,"Latex":45,"Quiz":11,"DrawIOWidget":58,"cloudlabs":0},"default_themes":{"code_themes":{"Code":"default","Markdown":"default","RunJS":"default","SPA":"default","isForced":{"Code":false,"Markdown":false,"RunJS":false,"SPA":false}}},"api_keys":{"api_keys":[]},"skills":["Data Science","Machine Learning","Machine Learning Fundamentals"],"testimonials":[],"licensing":null,"target_audience":"intermediate","author_id":"6586453712175104","collection_id":"6161393571332096","approval_status":3005,"price":29,"is_private":false,"path_type":"regular","organization_id":null,"is_mini":false,"is_priced":true,"brief_summary":"Gain insights into essential machine learning algorithms in R, including CART, random forest, and XGBoost. Discover model tuning and cross-validation to create accurate, robust data science models.","approval_update_time":"2023-11-14T10:48:42.804Z","rating_visibility":true,"update_last_published_on_homepage":true,"show_developed_by":true,"udata_files":[],"CodeThemes":{"Code":"default","Markdown":"default","RunJS":"default","SPA":"default","isForced":{"Code":false,"Markdown":false,"RunJS":false,"SPA":false}},"is_marked_for_deletion":false,"transition_page_title":"","is_redirectable":false,"collection_type":"collection","adaptive_learning_mode":false,"HLOs_to_toc":{},"is_guide":false,"read_time":50400,"allow_logged_out_executions":false,"unique_live_widget_urls":false,"metadata_status":101,"palified_version":null},"pageSummarySSR":{"title":"Numeric Feature SSE","description":"Learn how CART regression trees split training data using numeric features.","discourse_page_url":"https://discuss.educative.io/tag/numeric-feature-sse__regression-trees__data-science-with-r-decision-trees-and-random-forests?open=true&ctag=data-science-with-r-decision-trees-and-random-forests__david-langer&cslug=data-science-with-r-decision-trees-and-random-forests&pslug=numeric-feature-sse"},"adaptiveLearningConfigConstantSSR":0,"enableLessonPageLockedBannerV2":true,"allowAllLessonPreview":false,"lockedBannerStatsSSR":{"b2cTrialStats":{"is_b2c_trial_active":true,"b2c_trial_active_duration":7,"b2c_trial_categories":"$134"},"b2cStatus":100,"learnerTags":"$135","workStats":1590,"interviewWorksStats":93,"inL2cStarterPack":false,"l2cWorkStats":44,"enableL2cStarterPackPaymentWidget":"false"},"pageTocSSR":"

","authorId":"6586453712175104","collectionId":"6161393571332096","pageId":"6545121489453056","isCollectionPageLockedCachingEnabled":true,"aceFeatureFlags":{"enableAceEditor":true,"enableAceEditorForAnswers":true},"meta":{"type":["Article","TechArticle"],"title":"Numeric Feature SSE","name":"Data Science with R: Decision Trees and Random Forests","description":"Learn how CART regression trees split training data using numeric features.","image":"https://educative.io/api/collection/6586453712175104/6161393571332096/image/4847458744139776.png","isAccessibleForFree":false,"keywords":"$135","provider":"Educative","publisher":"Educative","id":"courses/data-science-with-r-decision-trees-and-random-forests/numeric-feature-sse","author":"Educative","educationalLevel":"intermediate","noIndex":true,"isForcedNoIndex":true,"noFollow":false,"redirectInfo":{"isDeletedCollectionPageRedirectable":false},"page_titles":{"4534837887369216":"Course Expectations","4830903941726208":"Machine Learning Is Predictive Analytics","6277861109661696":"The Course Datasets","4977384489222144":"What Is Machine Learning?","4841749052915712":"Forms of Supervised Learning","6286392844091392":"Why Decision Trees?","6420773042651136":"Decision Tree Intuition","5485115541291008":"Overfitting Intuition","5745850255147008":"Model Tuning Intuition","5182900301725696":"Gini Impurity","5248020696530944":"Gini Change","5121639488684032":"Classification Tree Training Example","6580324316479488":"Many Categories Impurity","5093693747101696":"Numeric Feature Impurity","5472779271143424":"Introducing tidymodels","6392196293197824":"Crafting the Recipe","6704072038285312":"Underfitting and Overfitting","5120841228746752":"The Bias-Variance Tradeoff","6362714110951424":"Cross-Validation","6652551036665856":"Model Tuning Intuition 201","6464617243213824":"Pruning Classification Trees","5112385897758720":"Measuring Model Accuracy","6501700762599424":"Performing Cross-Validation","6653498672545792":"Feature Engineering Intuition","5893851640496128":"Information Leakage","6614892360761344":"Decision Boundaries","5888362269638656":"Missing Data","4880476202598400":"Regression Tree Basics","6545121489453056":"Numeric Feature SSE","5257396895350784":"Many Categories SSE","6691198150639616":"Regression Trees with tidymodels","6533184886145024":"Decision Trees and Ensembles","6063127441702912":"Bagging","5641571720757248":"Feature Randomization","5338139948482560":"Tuning Random Forests","4933405567614976":"Feature Importance","5077109234204672":"How Gradient Boosting Works","5817961162211328":"Gradient Boosting with XGBoost","5714070273785856":"Using XGBoost with tidymodels","5756978901286912":"Random Forests with tidymodels","4849781983936512":"Tuning XGBoost with tidymodels","4935661876674560":"Evaluating XGBoost with tidymodels","4783490791112704":"Exploratory Data Analysis—Profiling","6503547011334144":"Quiz: Data Basics","5223002595917824":"Quiz: Machine Learning Concepts","6746499075801088":"Quiz: Classification Tree Math","6393659325153280":"Quiz: Underfitting, Overfitting, and the Bias-Variance Tradeoff","6693522239651840":"Controlling Complexity","6027611845427200":"Specify the Algorithm and Workflow","5267976330936320":"Fitting the Model","6279341002719232":"Exploratory Data Analysis: Visualization","6241183862095872":"Quiz: Fitting Models","6233221756092416":"Tuning a Classification Tree","4651883248746496":"Visualizing a Tuned Classification Tree","6660473157320704":"Quiz: Model Tuning","6550321011884032":"Engineering Features for Decision Trees","5638641734123520":"Quiz: Feature Engineering","5018544560668672":"Preparing the Test Dataset","4766676353810432":"Testing the Titanic Dataset","4506610279120896":"Making Predictions","6187325999284224":"Quiz: Regression Trees","5453158919438336":"Quiz: Random Forests","5509753502171136":"Quiz: Using Random Forests","5036837639553024":"Quiz: XGBoost","5713765460606976":"What's Next?"},"is_marked_for_deletion":false,"transition_page_title":"","is_redirectable":false,"deleted_course_lesson_redirect":{"author_id":null,"collection_id":null,"page_id":null,"redirect_url_slug":null},"metadata_status":101,"additional_course_alternatives":[]},"requestUrl":"/courses/data-science-with-r-decision-trees-and-random-forests/numeric-feature-sse","requestUrlInfo":{"authorId":6586453712175104,"collectionId":6161393571332096,"pageId":6545121489453056,"courseUrlSlug":"data-science-with-r-decision-trees-and-random-forests","pageUrlSlug":"numeric-feature-sse"},"isExternalContent":false}}],[["$","script",null,{"id":"generate-data","type":"application/ld+json","dangerouslySetInnerHTML":{"__html":"$136"}}],false,"$undefined"]]