[{"data":1,"prerenderedAt":368},["ShallowReactive",2],{"i-kinnu:logo":3,"i-kinnu:origami-folding":8,"tile-science-statistics-for-data-science-introductory-level-samples-and-populations":12,"i-lucide:chevron-right":363,"i-lucide:menu":366},{"left":4,"top":4,"width":5,"height":5,"rotate":4,"vFlip":6,"hFlip":6,"body":7},0,27,false,"\u003Cg fill=\"none\">\u003Cpath d=\"M0.046875 1.05555C0.046875 1.03541 0.048197 1.01579 0.0507438 0.996728C0.0987149 0.438619 0.586845 0 1.18194 0H25.4398C26.451 0 26.9575 1.171 26.2424 1.85585L15.7301 11.9243L1.31574 0.903476C1.17475 0.79568 1.01137 0.761884 0.859586 0.784111L26.2936 25.1441C27.0086 25.829 26.5022 27 25.4909 27H1.18194C0.555061 27 0.046875 26.5133 0.046875 25.9129V1.05555Z\" fill=\"currentColor\"/>\u003C/g>",{"left":4,"top":4,"width":9,"height":10,"rotate":4,"vFlip":6,"hFlip":6,"body":11},1000,236,"\u003Cg fill=\"none\">\u003Cpath fill-rule=\"evenodd\" clip-rule=\"evenodd\"\n    d=\"M193.68 38.2238C195.994 38.2238 197.87 40.0989 197.87 42.412V231.812C197.87 234.125 195.994 236 193.68 236H4.19013C1.87603 236 2.02305e-07 234.125 0 231.812V42.412C-2.02305e-07 40.0989 1.87603 38.2238 4.19013 38.2238H193.68ZM111.76 89.0072C111.685 87.9474 110.572 87.2905 109.608 87.7376L96.8872 93.641C95.7786 94.1554 95.702 95.7016 96.7545 96.3225L101.579 99.167C94.7045 109.365 90.5733 122.892 90.5732 137.642C90.5733 154.323 95.8569 169.439 104.416 179.945C105.301 181.032 106.9 181.196 107.987 180.311C109.075 179.426 109.238 177.828 108.353 176.741C100.621 167.25 95.6522 153.305 95.6521 137.642C95.6522 123.661 99.6138 111.051 105.963 101.754L110.456 104.403C111.508 105.024 112.826 104.21 112.74 102.991L111.76 89.0072ZM9.63194 136.286C9.14864 136.286 8.75684 136.678 8.75684 137.161C8.7569 137.644 9.14868 138.035 9.63194 138.035H17.2161C17.6993 138.035 18.0912 137.644 18.0912 137.161C18.0912 136.678 17.6994 136.286 17.2161 136.286H9.63194ZM22.6813 136.286C22.198 136.286 21.8062 136.678 21.8062 137.161C21.8063 137.644 22.1981 138.035 22.6813 
138.035H30.2655C30.7487 138.035 31.1406 137.644 31.1406 137.161C31.1406 136.678 30.7488 136.286 30.2655 136.286H22.6813ZM35.7464 136.286C35.2631 136.286 34.8713 136.678 34.8713 137.161C34.8713 137.644 35.2631 138.035 35.7464 138.035H44.4973C44.9805 138.035 45.3724 137.644 45.3724 137.161C45.3724 136.678 44.9806 136.286 44.4973 136.286H35.7464ZM49.9977 136.286C49.5144 136.286 49.1226 136.678 49.1226 137.161C49.1226 137.644 49.5144 138.035 49.9977 138.035H57.5819C58.0651 138.035 58.4569 137.644 58.457 137.161C58.457 136.678 58.0651 136.286 57.5819 136.286H49.9977ZM63.0783 136.286C62.595 136.286 62.2032 136.678 62.2032 137.161C62.2033 137.644 62.5951 138.035 63.0783 138.035H70.6625C71.1457 138.035 71.5375 137.644 71.5376 137.161C71.5376 136.678 71.1457 136.286 70.6625 136.286H63.0783ZM76.1277 136.286C75.6444 136.286 75.2526 136.678 75.2526 137.161C75.2527 137.644 75.6445 138.035 76.1277 138.035H83.7119C84.1951 138.035 84.5869 137.644 84.587 137.161C84.587 136.678 84.1951 136.286 83.7119 136.286H76.1277ZM102.266 136.286C101.782 136.286 101.39 136.678 101.39 137.161C101.391 137.644 101.782 138.035 102.266 138.035H109.85C110.333 138.035 110.725 137.644 110.725 137.161C110.725 136.678 110.333 136.286 109.85 136.286H102.266ZM115.338 136.286C114.855 136.286 114.463 136.678 114.463 137.161C114.463 137.644 114.855 138.035 115.338 138.035H122.923C123.406 138.035 123.798 137.644 123.798 137.161C123.798 136.678 123.406 136.286 122.923 136.286H115.338ZM128.403 136.286C127.92 136.286 127.528 136.678 127.528 137.161C127.528 137.644 127.92 138.035 128.403 138.035H135.988C136.471 138.035 136.863 137.644 136.863 137.161C136.863 136.678 136.471 136.286 135.988 136.286H128.403ZM141.468 136.286C140.985 136.286 140.593 136.678 140.593 137.161C140.593 137.644 140.985 138.035 141.468 138.035H149.053C149.536 138.035 149.928 137.644 149.928 137.161C149.928 136.678 149.536 136.286 149.053 136.286H141.468ZM154.541 136.286C154.058 136.286 153.666 136.678 153.666 137.161C153.666 137.644 154.058 
138.035 154.541 138.035H162.125C162.609 138.035 163 137.644 163.001 137.161C163.001 136.678 162.609 136.286 162.125 136.286H154.541ZM167.614 136.286C167.131 136.286 166.739 136.678 166.739 137.161C166.739 137.644 167.131 138.035 167.614 138.035H175.198C175.681 138.035 176.073 137.644 176.073 137.161C176.073 136.678 175.681 136.286 175.198 136.286H167.614ZM180.671 136.286C180.188 136.286 179.796 136.678 179.796 137.161C179.796 137.644 180.188 138.035 180.671 138.035H188.255C188.739 138.035 189.13 137.644 189.131 137.161C189.131 136.678 188.739 136.286 188.255 136.286H180.671Z\"\n    fill=\"currentColor\" />\n  \u003Cpath fill-rule=\"evenodd\" clip-rule=\"evenodd\"\n    d=\"M444.85 38.2277C447.164 38.2277 449.04 40.1028 449.04 42.4159V132.928C449.04 135.241 447.164 137.116 444.85 137.116H255.36C253.046 137.116 251.17 135.241 251.17 132.928V42.4159C251.17 40.1028 253.046 38.2277 255.36 38.2277H444.85ZM361.96 125.388C361.618 125.046 361.064 125.046 360.722 125.388L354.534 131.572C354.192 131.914 354.192 132.468 354.534 132.81C354.876 133.151 355.43 133.151 355.772 132.81L361.96 126.624C362.301 126.283 362.301 125.73 361.96 125.388ZM371.047 116.311C370.705 115.969 370.15 115.969 369.809 116.311L364.446 121.671C364.104 122.012 364.104 122.567 364.446 122.908C364.788 123.249 365.342 123.25 365.684 122.908L371.047 117.548C371.388 117.207 371.388 116.652 371.047 116.311ZM380.124 107.246C379.782 106.904 379.227 106.904 378.885 107.246L373.523 112.606C373.181 112.948 373.181 113.502 373.523 113.844C373.864 114.185 374.419 114.185 374.761 113.844L380.124 108.483C380.465 108.142 380.465 107.587 380.124 107.246ZM385.736 65.8841C385.891 64.6727 384.622 63.7845 383.536 64.3434L371.069 70.7636C370.124 71.2504 369.96 72.5334 370.752 73.2424L381.2 82.5938C382.11 83.4081 383.561 82.8672 383.717 81.6557L384.393 76.3725C391.143 77.1933 398.567 80.7709 404.771 86.9711C411.124 93.3213 414.726 100.952 415.43 107.827C415.573 109.221 416.819 110.236 418.214 110.093C419.609 109.95 420.624 
108.703 420.481 107.309C419.644 99.1317 415.435 90.4514 408.362 83.3817C401.466 76.489 393.038 72.3185 385.038 71.338L385.736 65.8841ZM389.2 98.1733C388.859 97.8319 388.304 97.8318 387.962 98.1733L382.6 103.534C382.258 103.875 382.258 104.429 382.6 104.771C382.941 105.112 383.496 105.112 383.838 104.771L389.2 99.4108C389.542 99.0693 389.542 98.5149 389.2 98.1733ZM398.262 89.1047C397.92 88.7633 397.365 88.7632 397.024 89.1047L391.661 94.4649C391.319 94.8065 391.319 95.3608 391.661 95.7024C392.002 96.0436 392.557 96.0438 392.899 95.7024L398.262 90.3421C398.603 90.0007 398.603 89.4463 398.262 89.1047ZM416.431 70.9616C416.089 70.6202 415.534 70.6201 415.193 70.9616L409.83 76.3218C409.488 76.6634 409.488 77.2177 409.83 77.5592C410.172 77.9005 410.726 77.9007 411.068 77.5592L416.431 72.199C416.772 71.8575 416.772 71.3032 416.431 70.9616ZM425.508 61.891C425.166 61.5496 424.611 61.5495 424.27 61.891L418.907 67.2512C418.565 67.5928 418.565 68.1471 418.907 68.4887C419.249 68.8299 419.803 68.8301 420.145 68.4887L425.508 63.1284C425.849 62.787 425.849 62.2326 425.508 61.891ZM434.569 52.8146C434.227 52.4731 433.673 52.4731 433.331 52.8146L427.968 58.1748C427.626 58.5163 427.627 59.0706 427.968 59.4122C428.31 59.7534 428.864 59.7537 429.206 59.4122L434.569 54.052C434.91 53.7105 434.91 53.1562 434.569 52.8146ZM443.638 43.7479C443.296 43.4065 442.742 43.4064 442.4 43.7479L437.037 49.1081C436.695 49.4496 436.696 50.004 437.037 50.3455C437.379 50.6868 437.933 50.687 438.275 50.3455L443.638 44.9853C443.98 44.6438 443.979 44.0895 443.638 43.7479Z\"\n    fill=\"currentColor\" />\n  \u003Cpath fill-rule=\"evenodd\" clip-rule=\"evenodd\"\n    d=\"M684.066 38.2277C687.798 38.2281 689.667 42.7391 687.027 45.3773L596.473 135.889C595.687 136.675 594.621 137.116 593.51 137.116H506.335C504.021 137.116 502.145 135.241 502.145 132.928V42.4159C502.145 40.1028 504.021 38.2277 506.335 38.2277H684.066ZM514.603 124.566C514.261 124.224 513.707 124.224 513.365 124.566L507.178 130.751C506.836 131.093 
506.836 131.646 507.178 131.988C507.519 132.329 508.073 132.329 508.415 131.988L514.603 125.803C514.945 125.462 514.945 124.908 514.603 124.566ZM523.689 115.491C523.348 115.15 522.794 115.15 522.452 115.491L517.09 120.852C516.748 121.193 516.748 121.747 517.09 122.088C517.431 122.43 517.985 122.43 518.327 122.088L523.689 116.728C524.031 116.386 524.031 115.833 523.689 115.491ZM532.102 65.8295C530.707 65.6872 529.46 66.7017 529.318 68.0957C529.175 69.4896 530.189 70.7355 531.584 70.8787C538.463 71.5825 546.096 75.1826 552.45 81.5329C558.723 87.8037 562.312 95.3226 563.079 102.13L557.738 102.392C556.518 102.452 555.865 103.855 556.607 104.827L565.115 115.969C565.76 116.814 567.051 116.751 567.611 115.847L574.992 103.928C575.635 102.889 574.848 101.555 573.628 101.615L568.161 101.882C568.161 101.878 568.162 101.874 568.161 101.871C567.324 93.6931 563.114 85.0124 556.041 77.9425C548.968 70.873 540.283 66.6668 532.102 65.8295ZM532.766 106.421C532.425 106.079 531.871 106.079 531.529 106.421L526.166 111.781C525.825 112.123 525.825 112.676 526.166 113.018C526.508 113.359 527.062 113.359 527.403 113.018L532.766 107.657C533.108 107.316 533.108 106.762 532.766 106.421ZM541.843 97.3445C541.501 97.003 540.948 97.003 540.606 97.3445L535.243 102.705C534.901 103.046 534.902 103.6 535.243 103.941C535.585 104.283 536.139 104.283 536.48 103.941L541.843 98.5809C542.185 98.2393 542.185 97.686 541.843 97.3445ZM550.92 88.2778C550.578 87.9363 550.025 87.9363 549.683 88.2778L544.32 93.638C543.978 93.9796 543.978 94.5329 544.32 94.8745C544.662 95.2161 545.215 95.2161 545.557 94.8745L550.92 89.5142C551.262 89.1727 551.262 88.6193 550.92 88.2778ZM569.066 70.1405C568.724 69.799 568.17 69.7991 567.829 70.1405L562.466 75.5008C562.124 75.8423 562.124 76.3956 562.466 76.7372C562.808 77.0788 563.361 77.0788 563.703 76.7372L569.066 71.377C569.407 71.0354 569.407 70.4821 569.066 70.1405ZM578.143 61.0699C577.801 60.7284 577.247 60.7285 576.906 61.0699L571.543 66.4302C571.201 66.7717 571.201 67.3251 
571.543 67.6666C571.885 68.0082 572.438 68.0082 572.78 67.6666L578.143 62.3064C578.484 61.9648 578.484 61.4115 578.143 61.0699ZM587.219 51.9896C586.878 51.6481 586.324 51.6481 585.982 51.9896L580.62 57.3498C580.278 57.6914 580.278 58.2447 580.62 58.5863C580.961 58.9279 581.515 58.9279 581.857 58.5863L587.219 53.2261C587.561 52.8845 587.561 52.3312 587.219 51.9896ZM596.288 42.9249C595.947 42.5833 595.392 42.5833 595.05 42.9249L589.689 48.2851C589.347 48.6267 589.347 49.18 589.689 49.5216C590.03 49.863 590.584 49.8631 590.926 49.5216L596.288 44.1613C596.63 43.8198 596.63 43.2664 596.288 42.9249Z\"\n    fill=\"currentColor\" />\n  \u003Cpath fill-rule=\"evenodd\" clip-rule=\"evenodd\"\n    d=\"M850.814 38.2277C854.547 38.2281 856.416 42.739 853.777 45.3773L763.223 135.889C762.437 136.674 761.371 137.116 760.26 137.116H673.176C669.443 137.116 667.574 132.605 670.213 129.966L760.768 39.4544C761.554 38.6692 762.62 38.2277 763.731 38.2277H850.814ZM761.338 121.8C760.855 121.8 760.463 122.191 760.463 122.674V131.13H762.213V122.674C762.213 122.191 761.821 121.8 761.338 121.8ZM761.338 108.971C760.855 108.971 760.463 109.363 760.463 109.846V118.301H762.213V109.846C762.213 109.363 761.821 108.971 761.338 108.971ZM761.338 96.1402C760.855 96.1406 760.463 96.5321 760.463 97.0149V105.47H762.213V97.0149C762.213 96.532 761.821 96.1404 761.338 96.1402ZM782.263 71.887C781.043 71.951 780.395 73.3571 781.139 74.3257L784.474 78.6631C779.115 82.951 771.242 85.7443 762.35 85.7444C753.366 85.7442 745.421 82.8944 740.059 78.5305C738.972 77.6461 737.373 77.8099 736.488 78.8961C735.602 79.983 735.766 81.582 736.853 82.467C743.231 87.6574 752.348 90.8207 762.35 90.8209C772.209 90.8208 781.205 87.746 787.568 82.6884L790.833 86.9341C791.577 87.9025 793.103 87.6391 793.479 86.4767L797.791 73.138C798.118 72.127 797.33 71.1017 796.268 71.1566L782.263 71.887ZM761.338 70.4847C760.855 70.4851 760.463 70.8767 760.463 71.3594V79.8147H762.213V71.3594C762.213 70.8766 761.821 70.485 761.338 70.4847ZM761.338 
57.656C760.855 57.6564 760.463 58.048 760.463 58.5307V66.986H762.213V58.5307C762.213 58.0479 761.821 57.6563 761.338 57.656ZM761.338 44.8293C760.855 44.8297 760.463 45.2212 760.463 45.704V54.1592H762.213V45.704C762.213 45.2211 761.821 44.8295 761.338 44.8293Z\"\n    fill=\"currentColor\" />\n  \u003Cpath\n    d=\"M995.759 38.2277C999.53 38.228 1001.42 42.5171 998.752 45.0253L959.55 81.9005L905.796 41.5363C905.271 41.1418 904.662 41.0182 904.096 41.0994L997.485 130.319C1000.15 132.828 998.262 137.116 994.491 137.116H905.298C902.96 137.116 901.065 135.333 901.065 133.134V42.0941C901.065 42.0204 901.07 41.9483 901.079 41.8786C901.258 39.8345 903.079 38.2277 905.298 38.2277H995.759Z\"\n    fill=\"currentColor\" />\n  \u003Cpath\n    d=\"M505.873 0C506.657 4.57042e-05 507.307 0.195499 507.823 0.587023C508.338 0.969046 508.596 1.53802 508.596 2.29251C508.596 2.76034 508.467 3.19015 508.209 3.58162C507.951 3.96344 507.497 4.26401 506.848 4.48361V4.54114C507.65 4.67487 508.205 4.96191 508.51 5.4012C508.816 5.83087 508.969 6.31772 508.969 6.86193C508.969 7.74056 508.672 8.41851 508.08 8.89604C507.497 9.38304 506.733 9.62731 505.787 9.62738C504.861 9.62738 504.158 9.42172 503.68 9.0111C503.212 8.60054 502.935 8.08005 502.849 7.44993L503.881 7.10571L503.924 7.24028C504.035 7.54934 504.211 7.82925 504.454 8.07986C504.731 8.36635 505.166 8.50986 505.758 8.50989C506.465 8.50989 506.943 8.32772 507.191 7.9648C507.449 7.6019 507.579 7.20078 507.579 6.7615C507.579 6.2173 507.378 5.80683 506.977 5.52992C506.585 5.25295 505.93 5.10026 505.013 5.07161V4.15402C505.901 4.12537 506.489 3.92484 506.776 3.55237C507.062 3.18009 507.206 2.82242 507.206 2.47876C507.206 1.62801 506.752 1.17539 505.845 1.12237L505.658 1.11749C505.467 1.11752 505.242 1.14605 504.985 1.2033C504.736 1.25105 504.511 1.3274 504.31 1.43245L504.081 2.56457L503.05 2.44951L503.322 0.687461C503.666 0.49653 504.068 0.33454 504.526 0.200875C504.985 0.0671945 505.434 0 505.873 0Z\"\n    fill=\"currentColor\" />\n  
\u003Cpath\n    d=\"M905.727 2.30616L904.638 2.4066L904.466 1.26083H901.428V3.72497C901.533 3.71544 901.643 3.71034 901.757 3.71034H902.086C902.755 3.71034 903.386 3.78668 903.979 3.93949C904.58 4.09229 905.068 4.38363 905.44 4.8132C905.822 5.23335 906.014 5.84949 906.014 6.66106C906.014 7.64468 905.722 8.38068 905.14 8.86776C904.557 9.36434 903.783 9.6127 902.818 9.61275C901.91 9.61275 901.213 9.40711 900.725 8.99648C900.248 8.59544 899.96 8.08007 899.865 7.44993L900.911 7.10571C901.007 7.49723 901.203 7.8271 901.499 8.09449C901.795 8.37131 902.211 8.50985 902.746 8.50989C903.395 8.50989 903.869 8.33787 904.165 7.99405C904.461 7.65981 904.609 7.22507 904.609 6.69031C904.609 5.87861 904.337 5.3625 903.792 5.14279C903.248 4.91361 902.612 4.79958 901.886 4.79955C901.695 4.79955 901.489 4.80365 901.27 4.8132C901.059 4.82275 900.854 4.83701 900.653 4.85611L900.224 4.44071V0.143343H905.569L905.727 2.30616Z\"\n    fill=\"currentColor\" />\n  \u003Cpath fill-rule=\"evenodd\" clip-rule=\"evenodd\"\n    d=\"M765.49 6.04576H766.966L766.837 7.14862H765.49V9.48404H764.185V7.14862H759.857L759.713 6.04576L762.909 0.143343H765.49V6.04576ZM760.96 6.04576H764.185V1.26083H763.541L760.96 6.04576Z\"\n    fill=\"currentColor\" />\n  \u003Cpath d=\"M4.80573 6.47481H6.41154V7.60693H1.81068V6.47481H3.50235V1.27546H1.81068V0.143343H4.80573V6.47481Z\"\n    fill=\"currentColor\" />\n  \u003Cpath\n    d=\"M254.359 0C255.353 0 256.055 0.239186 256.466 0.716715C256.877 1.18447 257.083 1.68072 257.083 2.20573C257.083 2.85516 256.849 3.44346 256.38 3.96875C255.912 4.49397 255.348 4.96638 254.689 5.38657C254.039 5.79717 253.437 6.15968 252.883 6.47481H256.423L256.538 5.42948L257.599 5.51529L257.426 7.60693H251.407L251.292 6.58987C252.582 5.73032 253.638 4.98523 254.46 4.35489C255.281 3.71509 255.693 3.05632 255.693 2.37832C255.693 1.53787 255.166 1.11749 254.115 1.12237L254.115 1.11749C253.924 1.11754 253.695 1.14604 253.427 1.2033C253.16 1.25104 252.916 1.32238 252.697 1.41783L252.467 
2.47876L251.45 2.3637L251.707 0.60165C252.118 0.401088 252.563 0.253475 253.041 0.15797C253.519 0.0529708 253.958 1.99446e-05 254.359 0Z\"\n    fill=\"currentColor\" />\u003C/g>",{"tile":13,"orbsWithOnlyMarkdownPages":143},{"id":14,"data":15,"type":16,"maxContentLevel":19,"version":20,"orbs":21},"354fce4d-f6c1-4289-8e4a-02b3907f76c4",{"type":16,"title":17,"tagline":18},9,"Samples and Populations","How to choose the subjects of your analysis, and avoid common errors.",3,1,[22,75,108],{"id":23,"data":24,"type":25,"version":20,"maxContentLevel":19,"pages":27},"1ddf6431-38b6-4613-9ad1-64f44eda98fc",{"type":25,"title":26},2,"Understanding Populations and Samples",[28,43,59],{"id":29,"data":30,"type":20,"maxContentLevel":19,"version":20,"reviews":34},"95bc7af2-d6c6-4b9b-87b8-47bed5d3043e",{"type":20,"title":31,"contentRole":25,"markdownContent":32,"audioMediaId":33},"Populations","A population is a group of interest for your research, like everyone in your city or country. It doesn’t necessarily have to be a group of people either, any list of items works. \n\nAs an example, it could be all laptops of a specific model produced by a company in 2021. In this example, the time period depends on what you’re interested in finding out. \n\n ![Graph](image://3786a416-ee2d-4b33-8322-0a8bb31c0f41 \"The population is the total group of units for your study\")\n\nIf you wanted to know the number of defects for just one year, then the time period you used for your sample would be one year. If you wanted to know the number of defects for all time, then your population would be all laptops of that model ever produced. \n\nThese are some of the reasons that it’s important to know your research aims before you select your population. 
\n\n","85e6bd76-ddf9-4d92-afd2-78ce69d20744",[35],{"id":36,"data":37,"type":38,"version":20,"maxContentLevel":19},"48c3b2a3-ec53-428f-a2c3-a49a0bde0e0d",{"type":38,"reviewType":20,"spacingBehaviour":20,"activeRecallQuestion":39,"activeRecallAnswers":41},11,[40],"What is a population in research?",[42],"A group of interest for your research",{"id":44,"data":45,"type":20,"maxContentLevel":19,"version":20,"reviews":49},"d7cbd587-cf7f-4704-93cd-5b5d4107907a",{"type":20,"title":46,"contentRole":25,"markdownContent":47,"audioMediaId":48},"Samples","\nIn statistics, you often want to know more about an entire population, but to survey them all would be too expensive, or take too long, so you take a smaller sample instead. \n\n ![Graph](image://0a91f7bf-e218-41c6-ba5f-e18e5d3859ee \"An illustration of a sample\")\n\nA sample is the portion of that population that we gathered data on for our research. As an example, imagine that there are 4 million people in your city, but it is only realistic for you to collect data on 400 people. \n\nYour population is 4 million but those 400 people are your sample. Even though you didn’t get data on everyone in your city, with good sampling and statistics we can reliably make inferences about the population based on what we observe in our sample. \n\n","ac4d8768-60a9-4662-9fd2-8b5846de7ce0",[50],{"id":51,"data":52,"type":38,"version":20,"maxContentLevel":19},"78b425c0-a49b-495c-8f2a-9186dfe97ff4",{"type":38,"reviewType":25,"spacingBehaviour":20,"binaryQuestion":53,"binaryCorrect":55,"binaryIncorrect":57},[54],"What is the portion of a population that we gather data on for our research called?",[56],"Sample",[58],"Population",{"id":60,"data":61,"type":20,"maxContentLevel":19,"version":20,"reviews":65},"874e552e-162f-400a-b4df-8573314ee4bc",{"type":20,"title":62,"contentRole":25,"markdownContent":63,"audioMediaId":64},"Observations and Units","\nA population is all the people you are interested in finding something out about. 
A sample is a small group we take from our population so that we can analyze and test the data we gather from them. \n\nAn observation is the term we use for one data point – meaning one element that we are observing within a sample. It is not to be confused with a unit within that sample – meaning one specific member of the group being observed.\n\n ![Graph](image://53dd3769-c569-4dd1-b977-b93382a07adb \"The observation here would be 'area of residence'\")\n\nImagine you are conducting a study of people’s heights on a dating app – strictly for research purposes, of course. The population would be the group on that app you are interested in – perhaps ‘men’, or ‘women’. \n\nThe sample would be a selection of people within that group who you choose to gather data from. The observation would be the height of each person in that group. A unit would be one individual from that group.\n\n","30897824-9a94-4a84-88bc-06123c5a99de",[66],{"id":67,"data":68,"type":38,"version":20,"maxContentLevel":19},"e594c03f-7674-4133-a9d2-02d2bf1f93cf",{"type":38,"reviewType":25,"spacingBehaviour":20,"binaryQuestion":69,"binaryCorrect":71,"binaryIncorrect":73},[70],"What is the term used for one data point being analyzed within a sample?",[72],"Observation",[74],"Unit",{"id":76,"data":77,"type":25,"version":20,"maxContentLevel":19,"pages":79},"bcfb48b2-c737-4cfb-8f70-113a0cd2866c",{"type":25,"title":78},"Ensuring Representative Samples",[80,94],{"id":81,"data":82,"type":20,"maxContentLevel":19,"version":20,"reviews":86},"74c62d2d-d0d9-41ee-86cc-4a08b1daf1cb",{"type":20,"title":83,"contentRole":25,"markdownContent":84,"audioMediaId":85},"Representative samples ","\nA good sample is representative of the population you’re interested in studying and learning more about. \n\nLook in the mirror, now back at me. Now look back in the mirror and then back at me again. 
A sample is representative when it mirrors or reflects the characteristics of the population which you would like to learn more about. \n\n\n ![Graph](image://699159b3-a86d-4f1c-9745-e80dca0ee357 \"Samples should represent every group within the population being studied\")\n\nWas what you saw in the mirror representative of yourself? Sure it was… but was it representative of everyone in your neighborhood? Well… probably not. \n\nTo get a representative sample you would need to gather lots more people. Ideally your sample is completely representative of the population you are studying, known as your ‘target’ population. So if you are conducting a study on how young people spend their time, you need a sample that is representative of everyone that fits your definition of ‘young’ – not just people from your immediate environment.\n\n","fed54e7a-c911-4c3c-a471-7fe1c4f8404a",[87],{"id":88,"data":89,"type":38,"version":20,"maxContentLevel":19},"44352025-e319-479a-b44d-b436c8c98fe1",{"type":38,"reviewType":20,"spacingBehaviour":20,"activeRecallQuestion":90,"activeRecallAnswers":92},[91],"When can a sample be representative of the population you are studying?",[93],"When it mirrors or reflects the characteristics of the population which you would like to learn more about",{"id":95,"data":96,"type":20,"maxContentLevel":19,"version":20,"reviews":100},"2788b1a4-9ac8-4701-9951-7113a746d99b",{"type":20,"title":97,"contentRole":25,"markdownContent":98,"audioMediaId":99},"Generalization for statistics ","\nStatistical generalization means using the results we obtained from a sample and inferring characteristics about a population from those results. \n\nIt’s important for a sample to be representative of its population so that we can generalize results from statistical testing to the population at large. \n\nOtherwise, the population could be too different from our sample, and the pattern or effect we saw in our sample might not exist in the population. 
\n","a6cec959-df9a-4183-8c69-1641010ec2bc",[101],{"id":102,"data":103,"type":38,"version":20,"maxContentLevel":19},"e1ea3eb5-579e-460e-bb20-f6ebcefdd49b",{"type":38,"reviewType":20,"spacingBehaviour":20,"activeRecallQuestion":104,"activeRecallAnswers":106},[105],"What technique requires using the results from a sample to infer characteristics about a population?",[107],"Statistical generalization",{"id":109,"data":110,"type":25,"version":20,"maxContentLevel":19,"pages":112},"114d6076-78d4-4199-87ff-ab846c531cae",{"type":25,"title":111},"Generalization in Statistics and Data Science",[113,129],{"id":114,"data":115,"type":20,"maxContentLevel":19,"version":20,"reviews":119},"56a203ee-9b4b-4c8b-b475-b56a8466289f",{"type":20,"title":116,"contentRole":25,"markdownContent":117,"audioMediaId":118},"Generalization for data science ","\nGeneralization for data science is how well a machine learning model – the algorithmic recipe you use to create predictions or classifications – adapts to new data it hasn’t seen yet. \n\nJust like we use samples in statistics, we can also consider the data we use to train our machine learning models as a sample. This is because we can’t possibly use all the data that exists for our sample and because machine learning is often about making predictions or classifications on data that doesn’t even exist yet.  \n\nIf your model generalizes well, then the results you see in the real world will closely match the results you saw in training and testing the model. 
\n\n","6a22c80a-f9a3-4277-91f2-e7a16cceb034",[120],{"id":121,"data":122,"type":38,"version":20,"maxContentLevel":19},"c3e800f3-1d74-4307-b55e-ad169c938979",{"type":38,"reviewType":25,"spacingBehaviour":20,"binaryQuestion":123,"binaryCorrect":125,"binaryIncorrect":127},[124],"What is the goal of generalization for data science?",[126],"To make predictions or classifications on data that doesn't exist yet.",[128],"To use all the data that exists for a sample.",{"id":130,"data":131,"type":20,"maxContentLevel":19,"version":20,"reviews":135},"ad483acb-7a31-44ac-8bd4-d9148263efa6",{"type":20,"title":132,"contentRole":25,"markdownContent":133,"audioMediaId":134},"How samples can be used for training data models","\nIn order to create accurate models using data science, it's important to carefully select and prepare your data. Generally, you'll want to start by creating a training dataset. This dataset will contain the samples of data that your model will learn from. \n\nBy analyzing these samples, your model will learn to identify patterns and make predictions. But to ensure your model is accurate, you'll also need to test it against a separate dataset, called the test dataset.\n\nThe test dataset should contain data that wasn't used in the training process. 
Because your test dataset is complete, including the correct value for the variable you are predicting, you can compare how accurate your predictions are against the actual observations.\n\nThis process of training and testing is critical to building a model that is both accurate and generalizable.\n","42b679ee-333e-407f-b370-97c23d532d99",[136],{"id":137,"data":138,"type":38,"version":20,"maxContentLevel":19},"99d67401-232c-4c0c-8ca4-294d8c64fed0",{"type":38,"reviewType":20,"spacingBehaviour":20,"activeRecallQuestion":139,"activeRecallAnswers":141},[140],"What is used to compare the accuracy of a model's predictions against actual observations?",[142],"A test dataset",[144,253,312],{"id":23,"data":24,"type":25,"version":20,"maxContentLevel":19,"pages":145},[146,188,218],{"id":29,"data":30,"type":20,"maxContentLevel":19,"version":20,"reviews":34,"parsed":147},{"data":148,"body":151,"toc":186},{"title":149,"description":150},"","A population is a group of interest for your research, like everyone in your city or country. It doesn’t necessarily have to be a group of people either, any list of items works.",{"type":152,"children":153},"root",[154,161,166,176,181],{"type":155,"tag":156,"props":157,"children":158},"element","p",{},[159],{"type":160,"value":150},"text",{"type":155,"tag":156,"props":162,"children":163},{},[164],{"type":160,"value":165},"As an example, it could be all laptops of a specific model produced by a company in 2021. 
In this example, the time period depends on what you’re interested in finding out.",{"type":155,"tag":156,"props":167,"children":168},{},[169],{"type":155,"tag":170,"props":171,"children":175},"img",{"alt":172,"src":173,"title":174},"Graph","image://3786a416-ee2d-4b33-8322-0a8bb31c0f41","The population is the total group of units for your study",[],{"type":155,"tag":156,"props":177,"children":178},{},[179],{"type":160,"value":180},"If you wanted to know the number of defects for just one year, then the time period you used for your sample would be one year. If you wanted to know the number of defects for all time, then your population would be all laptops of that model ever produced.",{"type":155,"tag":156,"props":182,"children":183},{},[184],{"type":160,"value":185},"These are some of the reasons that it’s important to know your research aims before you select your population.",{"title":149,"searchDepth":25,"depth":25,"links":187},[],{"id":44,"data":45,"type":20,"maxContentLevel":19,"version":20,"reviews":49,"parsed":189},{"data":190,"body":192,"toc":216},{"title":149,"description":191},"In statistics, you often want to know more about an entire population, but to survey them all would be too expensive, or take too long, so you take a smaller sample instead.",{"type":152,"children":193},[194,198,206,211],{"type":155,"tag":156,"props":195,"children":196},{},[197],{"type":160,"value":191},{"type":155,"tag":156,"props":199,"children":200},{},[201],{"type":155,"tag":170,"props":202,"children":205},{"alt":172,"src":203,"title":204},"image://0a91f7bf-e218-41c6-ba5f-e18e5d3859ee","An illustration of a sample",[],{"type":155,"tag":156,"props":207,"children":208},{},[209],{"type":160,"value":210},"A sample is the portion of that population that we gathered data on for our research. 
As an example, imagine that there are 4 million people in your city, but it is only realistic for you to collect data on 400 people.",{"type":155,"tag":156,"props":212,"children":213},{},[214],{"type":160,"value":215},"Your population is 4 million but those 400 people are your sample. Even though you didn’t get data on everyone in your city, with good sampling and statistics we can reliably make inferences about the population based on what we observe in our sample.",{"title":149,"searchDepth":25,"depth":25,"links":217},[],{"id":60,"data":61,"type":20,"maxContentLevel":19,"version":20,"reviews":65,"parsed":219},{"data":220,"body":222,"toc":251},{"title":149,"description":221},"A population is all the people you are interested in finding something out about. A sample is a small group we take from our population so that we can analyze and test the data we gather from them.",{"type":152,"children":223},[224,228,233,241,246],{"type":155,"tag":156,"props":225,"children":226},{},[227],{"type":160,"value":221},{"type":155,"tag":156,"props":229,"children":230},{},[231],{"type":160,"value":232},"An observation is the term we use for one data point – meaning one element that we are observing within a sample. It is not to be confused with a unit within that sample – meaning one specific member of the group being observed.",{"type":155,"tag":156,"props":234,"children":235},{},[236],{"type":155,"tag":170,"props":237,"children":240},{"alt":172,"src":238,"title":239},"image://53dd3769-c569-4dd1-b977-b93382a07adb","The observation here would be 'area of residence'",[],{"type":155,"tag":156,"props":242,"children":243},{},[244],{"type":160,"value":245},"Imagine you are conducting a study of people’s heights on a dating app – strictly for research purposes, of course. 
The population would be the group on that app you are interested in – perhaps ‘men’, or ‘women’.",{"type":155,"tag":156,"props":247,"children":248},{},[249],{"type":160,"value":250},"The sample would be a selection of people within that group who you choose to gather data from. The observation would be the height of each person in that group. A unit would be one individual from that group.",{"title":149,"searchDepth":25,"depth":25,"links":252},[],{"id":76,"data":77,"type":25,"version":20,"maxContentLevel":19,"pages":254},[255,290],{"id":81,"data":82,"type":20,"maxContentLevel":19,"version":20,"reviews":86,"parsed":256},{"data":257,"body":259,"toc":288},{"title":149,"description":258},"A good sample is representative of the population you’re interested in studying and learning more about.",{"type":152,"children":260},[261,265,270,278,283],{"type":155,"tag":156,"props":262,"children":263},{},[264],{"type":160,"value":258},{"type":155,"tag":156,"props":266,"children":267},{},[268],{"type":160,"value":269},"Look in the mirror, now back at me. Now look back in the mirror and then back at me again. A sample is representative when it mirrors or reflects the characteristics of the population which you would like to learn more about.",{"type":155,"tag":156,"props":271,"children":272},{},[273],{"type":155,"tag":170,"props":274,"children":277},{"alt":172,"src":275,"title":276},"image://699159b3-a86d-4f1c-9745-e80dca0ee357","Samples should represent every group within the population being studied",[],{"type":155,"tag":156,"props":279,"children":280},{},[281],{"type":160,"value":282},"Was what you saw in the mirror representative of yourself? Sure it was… but was it representative of everyone in your neighborhood? Well… probably not.",{"type":155,"tag":156,"props":284,"children":285},{},[286],{"type":160,"value":287},"To get a representative sample you would need to gather lots more people. 
Ideally your sample is completely representative of the population you are studying, which is known as your ‘target’ population. So if you are conducting a study on how young people spend their time, you need a sample that is representative of everyone who fits your definition of ‘young’ – not just people from your immediate environment.",{"title":149,"searchDepth":25,"depth":25,"links":289},[],{"id":95,"data":96,"type":20,"maxContentLevel":19,"version":20,"reviews":100,"parsed":291},{"data":292,"body":294,"toc":310},{"title":149,"description":293},"Statistical generalization means using the results we obtained from a sample and inferring characteristics about a population from those results.",{"type":152,"children":295},[296,300,305],{"type":155,"tag":156,"props":297,"children":298},{},[299],{"type":160,"value":293},{"type":155,"tag":156,"props":301,"children":302},{},[303],{"type":160,"value":304},"It’s important for a sample to be representative of its population so that we can generalize results from statistical testing to the population at large.",{"type":155,"tag":156,"props":306,"children":307},{},[308],{"type":160,"value":309},"Otherwise, the population could be too different from our sample, and the pattern or effect we saw in our sample might not exist in the population.",{"title":149,"searchDepth":25,"depth":25,"links":311},[],{"id":109,"data":110,"type":25,"version":20,"maxContentLevel":19,"pages":313},[314,336],{"id":114,"data":115,"type":20,"maxContentLevel":19,"version":20,"reviews":119,"parsed":315},{"data":316,"body":318,"toc":334},{"title":149,"description":317},"Generalization for data science is how well a machine learning model – the algorithmic recipe you use to create predictions or classifications – adapts to new data it hasn’t seen 
yet.",{"type":152,"children":319},[320,324,329],{"type":155,"tag":156,"props":321,"children":322},{},[323],{"type":160,"value":317},{"type":155,"tag":156,"props":325,"children":326},{},[327],{"type":160,"value":328},"Just like we use samples in statistics, we can also consider the data we use to train our machine learning models as a sample. This is because we can’t possibly use all the data that exists for our sample and because machine learning is often about making predictions or classifications on data that doesn’t even exist yet.",{"type":155,"tag":156,"props":330,"children":331},{},[332],{"type":160,"value":333},"If your model generalizes well, then the results you see in the real world will closely match the results you saw in training and testing the model.",{"title":149,"searchDepth":25,"depth":25,"links":335},[],{"id":130,"data":131,"type":20,"maxContentLevel":19,"version":20,"reviews":135,"parsed":337},{"data":338,"body":340,"toc":361},{"title":149,"description":339},"In order to create accurate models using data science, it's important to carefully select and prepare your data. Generally, you'll want to start by creating a training dataset. This dataset will contain the samples of data that your model will learn from.",{"type":152,"children":341},[342,346,351,356],{"type":155,"tag":156,"props":343,"children":344},{},[345],{"type":160,"value":339},{"type":155,"tag":156,"props":347,"children":348},{},[349],{"type":160,"value":350},"By analyzing these samples, your model will learn to identify patterns and make predictions. But to ensure your model is accurate, you'll also need to test it against a separate dataset, called the test dataset.",{"type":155,"tag":156,"props":352,"children":353},{},[354],{"type":160,"value":355},"The test dataset should contain data that wasn't used in the training process. 
Because the test dataset is complete, including the correct value for the variable you are predicting, you can compare your predictions against the actual observations to see how accurate they are.",{"type":155,"tag":156,"props":357,"children":358},{},[359],{"type":160,"value":360},"This process of training and testing is critical to building a model that is both accurate and generalizable.",{"title":149,"searchDepth":25,"depth":25,"links":362},[],{"left":4,"top":4,"width":364,"height":364,"rotate":4,"vFlip":6,"hFlip":6,"body":365},24,"\u003Cpath fill=\"none\" stroke=\"currentColor\" stroke-linecap=\"round\" stroke-linejoin=\"round\" stroke-width=\"2\" d=\"m9 18l6-6l-6-6\"/>",{"left":4,"top":4,"width":364,"height":364,"rotate":4,"vFlip":6,"hFlip":6,"body":367},"\u003Cpath fill=\"none\" stroke=\"currentColor\" stroke-linecap=\"round\" stroke-linejoin=\"round\" stroke-width=\"2\" d=\"M4 5h16M4 12h16M4 19h16\"/>",1778179422941]