|
|
(576 intermediate revisions by the same user not shown) |
Line 1: |
Line 1: |
| + | {{Sidebar}} |
| | | |
| + | <html><button class="averte" onclick="aver()">aver</button></html> |
| | | |
| + | <html> |
| + | <script src="https://ajax.googleapis.com/ajax/libs/jquery/3.4.1/jquery.min.js"></script> |
| + | <script> |
| + | function aver() { |
| + | link = "http://wiki.sinfronteras.ws/index.php?title=P%C3%A1gina_de_pruebas_3+&+action=edit" |
| + | link2 = link.replace("amp;","") |
| + | window.location = link2 |
| + | sleep(2); |
| + | window.document.getElementById('firstHeading').style.color = "red" |
| + | } |
| + | $(document).ready( function() { |
| + | $('#totalItems, #enteredItems').keyup(function(){ |
| + | window.document.getElementById('firstHeading').style.color = "red" |
| + | }); |
| + | window.document.getElementById('firstHeading').style.color = "red" |
| + | }); |
| + | </script> |
| + | </html> |
| | | |
− | {| class="wikitable"
| + | <br /> |
− | ! rowspan="2" |
| + | ==Projects portfolio== |
− | ! rowspan="2" |
| |
− | ! rowspan="2" style="width:80px; background-color:#E6B0AA" |Values have any meaningful order
| |
− | ! rowspan="2" style="width:80px; background-color:#A9DFBF" |Distance between values is defined
| |
− | ! colspan="3" style="width:80px; background-color:#FDEBD0" |'''Mathematical operations make sense'''
| |
− | (Values can be used to perform '''mathematical operations''')
| |
− | ! rowspan="2" style="width:80px; background-color:#AED6F1" |There is a meaning ful zero-point
| |
− | ! colspan="5" style="width:80px; background-color:#D7BDE2" |Values can be used to perform statistical computations
| |
− | ! rowspan="2" |Example
| |
− | |-
| |
− | ! style="width:80px; background-color:#FDEBD0" | '''Comparison operators'''
| |
− | ! style="width:80px; background-color:#FDEBD0" | Addition and subtrac tion
| |
− | ! style="width:80px; background-color:#FDEBD0" | Multiplica tion and division
| |
− | ! style="width:80px; background-color:#D7BDE2" | "Counts", aka, "Fre quency of Distribu tion"
| |
− | ! style="width:80px; background-color:#D7BDE2" | Mode
| |
− | ! style="width:80px; background-color:#D7BDE2" | Median
| |
− | ! style="width:80px; background-color:#D7BDE2" | Mean
| |
− | ! style="width:80px; background-color:#D7BDE2" | Stn
| |
− | |-
| |
− | !'''Nominal'''
| |
− | |Values serve only as labels
| |
− | | colspan="11" style="margin: 0; padding: 0;" |
| |
− | {| class="mw-collapsible mw-collapsed wikitable" style="margin: 0; padding: 0;"
| |
− | |- style="vertical-align:middle;"
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px; vertical-align:top; padding-top:60px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | |- style="vertical-align:top;"
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | Values don't have any meaningful order
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | No distance between values is defined
| |
− | | colspan="3" style="height:100px; text-align:left; width:80px;" |
| |
− | Values don't carry any mathematical meaning
| |
− | |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | colspan="3" style="height:100px; text-align:left; width:80px;" |
| |
− | Values cannot be used to perform many statistical computations, such as mean and standard deviation
| |
− | |-
| |
− | | colspan="11" |Even if the values are numbers. For example, if we want to categorize males and females, we could use a number of 1 for male, and 2 for female. However, the values of 1 and 2 in this case don't have any meaningful order or carry any mathematical meaning. They are simply used as labels. <nowiki>https://www.statisticssolutions.com/data-levels-and-measurement/</nowiki>
| |
− | |}
| |
− | |For an '''«outlook»''' attribute from weather data, potential values could be "sunny", "overcast", and "rainy".
| |
− | |-
| |
− | !'''Ordinal'''
| |
− | |Distinction between nominal and ordinal not always clear (e.g., attribute "outlook")
| |
− | | colspan="11" style="margin: 0; padding: 0;" |
| |
− | {| class="mw-collapsible mw-collapsed wikitable" style="margin: 0; padding: 0;"
| |
− | |- style="vertical-align:middle; margin: 0; padding: 0;"
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px; vertical-align:top; padding-top:30px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | |- style="vertical-align:top;"
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | Values have a meaningful order
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | No distance between values is defined
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | Only comparison operators make sense
| |
− | | colspan="2" |Mathematical operations such as addition, subtraction, multiplication, etc. do not make sense
| |
− | |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | |
| |
− | |
| |
− | |-
| |
− | colspan="11" |For example, an '''«Education level»''' attribute with possible values of '''«high school»''', '''«undergraduate degree»''', and '''«graduate degree»'''. There is a definitive order to the categories (i.e., graduate is higher than undergraduate, and undergraduate is higher than high school), but we cannot make any other arithmetic assumption. For instance, we cannot assume that the difference in education level between undergraduate and high school is the same as the difference between graduate and undergraduate.
| |
− | |}
| |
− | |A '''«temperature»''' attribute in weather data with potential values of: "hot" > "warm" > "cool"
| |
− | |-
| |
− | !'''Interval'''
| |
− | |
| |
− | | colspan="11" style="margin: 0; padding: 0;" |
| |
− | {| class="mw-collapsible mw-collapsed wikitable" style="margin: 0; padding: 0;"
| |
− | |- style="vertical-align:middle;"
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;"><div style="text-align: center;"><span style="color: red; font-size: 15pt; text-align: center;">✘</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px; vertical-align:top; padding-top:30px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | |- style="vertical-align:top;"
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | Distance between values is defined. In other words, we can quantify the difference between values
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | Comparison operators make sense
| |
− | |Addition, subtraction, make sense
| |
− | |Multiplication, and division do not make sense
| |
− | |Interval variables often do not have a meaningful zero-point.
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | |
| |
− | |(not sure)
| |
− | |-
| |
− | | colspan="11" |An example of an interval variable would be a '''«Temperature»''' attribute. We can correctly assume that the difference between 70 and 80 degrees is the same as the difference between 80 and 90 degrees. However, the mathematical operations of multiplication and division do not apply to interval variables. For instance, we cannot accurately say that 100 degrees is twice as hot as 50 degrees. Additionally, interval variables often do not have a meaningful zero-point. For example, a temperature of zero degrees (on Celsius and Fahrenheit scales) does not mean a complete absence of heat.
| |
| | | |
| | | |
− | An interval variable can be used to compute commonly used statistical measures such as the average (mean), standard deviation, and the Pearson correlation coefficient. <nowiki>https://www.statisticssolutions.com/data-levels-and-measurement/</nowiki>
| + | <br /> |
− | |}
| + | ==Data Analytics courses== |
− | |A '''«Temperature»''' attribute composed of numeric measures of that property
| |
− | |-
| |
− | !'''Ratio'''
| |
− | |
| |
− | | colspan="11" style="margin: 0; padding: 0;" |
| |
− | {| class="mw-collapsible mw-collapsed wikitable" style="margin: 0; padding: 0;"
| |
− | |- style="vertical-align:middle;"
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | | style="height:100px; text-align:center; width:80px; vertical-align:top; padding-top:30px;" |<div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;"><div style="text-align: center;"><span style="color: blue; font-size: 20pt; text-align: center;">✔</span></div></span></div>
| |
− | |- style="vertical-align:top;"
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | colspan="3" style="height:100px; text-align:left; width:80px;" |
| |
− | All arithmetic operations are possible on a ratio variable
| |
− | |Ratio variables have a meaningful zero-point
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | | style="height:100px; text-align:left; width:80px;" |
| |
− | |
| |
− | |
| |
− | |-
| |
− | | colspan="11" |An example of a ratio variable would be weight (e.g., in pounds). We can accurately say that 20 pounds is twice as heavy as 10 pounds. Additionally, ratio variables have a meaningful zero-point (e.g., exactly 0 pounds means the object has no weight).
| |
| | | |
| | | |
− | A ratio variable can be used as a dependent variable for most parametric statistical tests such as t-tests, F-tests, correlation, and regression. <nowiki>https://www.statisticssolutions.com/data-levels-and-measurement/</nowiki>
| + | <br /> |
− | |}
| + | ==Possible sources of data== |
− | |The '''«weight»''' (e.g., in pounds)
| |
| | | |
− | Other examples: gross sales of a company, the income of a company, etc.
| + | |
− | |}
| + | <br /> |
| + | ==What is data== |
| + | |
| + | |
| + | <br /> |
| + | ===Qualitative vs quantitative data=== |
| + | |
| + | |
| + | <br /> |
| + | ====Discrete and continuous data==== |
| + | |
| + | |
| + | <br /> |
| + | ===Structured vs Unstructured data=== |
| + | |
| + | |
| + | <br /> |
| + | ===Data Levels and Measurement=== |
| + | |
| + | |
| + | <br /> |
| + | ===What is an example=== |
| + | |
| + | |
| + | <br /> |
| + | ===What is a dataset=== |
| + | |
| + | |
| + | <br /> |
| + | ===What is Metadata=== |
| + | |
| + | |
| + | <br /> |
| + | ==What is Data Science== |
| + | |
| + | |
| + | <br /> |
| + | ===Supervised Learning=== |
| + | |
| + | |
| + | |
| + | <br /> |
| + | ===Unsupervised Learning=== |
| + | |
| + | |
| + | <br /> |
| + | ===Reinforcement Learning=== |
| + | |
| + | |
| + | <br /> |
| + | ==Some real-world examples of big data analysis== |
| + | |
| + | |
| + | <br /> |
| + | ==Statistic== |
| + | |
| + | |
| + | <br /> |
| + | ==Descriptive Data Analysis== |
| + | |
| + | |
| + | <br /> |
| + | ===Central tendency=== |
| + | |
| + | |
| + | <br /> |
| + | ====Mean==== |
| + | |
| + | |
| + | <br /> |
| + | =====When not to use the mean===== |
| + | |
| + | |
| + | <br /> |
| + | ====Median==== |
| + | |
| + | |
| + | <br /> |
| + | ====Mode==== |
| + | |
| + | |
| + | <br /> |
| + | ====Skewed Distributions and the Mean and Median==== |
| + | |
| + | |
| + | <br /> |
| + | ====Summary of when to use the mean, median and mode==== |
| + | measures-central-tendency-mean-mode-median-faqs.php |
| + | |
| + | |
| + | <br /> |
| + | ===Measures of Variation=== |
| + | |
| + | |
| + | <br /> |
| + | ====Range==== |
| + | |
| + | |
| + | <br /> |
| + | ====Quartile==== |
| + | |
| + | |
| + | <br /> |
| + | ====Box Plots==== |
| + | |
| + | |
| + | |
| + | <br /> |
| + | ====Variance==== |
| + | |
| + | |
| + | <br /> |
| + | ====Standard Deviation==== |
| + | |
| + | |
| + | <br /> |
| + | ==== Z Score ==== |
| + | |
| + | |
| + | <br /> |
| + | ===Shape of Distribution=== |
| + | |
| + | |
| + | <br /> |
| + | ====Probability distribution==== |
| + | |
| + | |
| + | <br /> |
| + | =====The Normal Distribution===== |
| + | |
| + | |
| + | <br /> |
| + | ====Histograms==== |
| + | |
| + | |
| + | <br /> |
| + | ====Skewness==== |
| + | |
| + | |
| + | <br /> |
| + | ====Kurtosis==== |
| + | |
| + | |
| + | <br /> |
| + | ====Visualization of measure of variations on a Normal distribution==== |
| + | |
| + | |
| + | <br /> |
| + | ==Simple and Multiple regression== |
| + | |
| + | |
| + | <br /> |
| + | ===Correlation=== |
| + | |
| + | |
| + | <br /> |
| + | ====Measuring Correlation==== |
| + | |
| + | |
| + | <br /> |
| + | =====Pearson correlation coefficient - Pearson s r===== |
| + | |
| + | |
| + | <br /> |
| + | =====The coefficient of determination <math>R^2</math>===== |
| + | |
| + | |
| + | <br /> |
| + | ====Correlation <math>\neq</math> Causation==== |
| + | |
| + | |
| + | <br /> |
| + | ====Testing the "generalizability" of the correlation ==== |
| + | |
| + | |
| + | <br /> |
| + | ===Simple Linear Regression=== |
| + | |
| + | |
| + | <br /> |
| + | ===Multiple Linear Regression=== |
| + | |
| + | |
| + | <br /> |
| + | ===RapidMiner Linear Regression examples=== |
| + | |
| + | |
| + | <br /> |
| + | ==K-Nearest Neighbour== |
| + | |
| + | |
| + | <br /> |
| + | ==Decision Trees== |
| + | |
| + | |
| + | <br /> |
| + | ===The algorithm=== |
| + | |
| + | |
| + | <br /> |
| + | ====Basic explanation of the algorithm==== |
| + | |
| + | |
| + | <br /> |
| + | ====Algorithms addressed in Noel s Lecture==== |
| + | |
| + | |
| + | <br /> |
| + | =====The ID3 algorithm===== |
| + | |
| + | |
| + | <br /> |
| + | =====The C5.0 algorithm===== |
| + | |
| + | |
| + | <br /> |
| + | ===Example in RapidMiner=== |
| + | |
| + | |
| + | <br /> |
| + | ==Random Forests== |
| + | https://www.youtube.com/watch?v=J4Wdy0Wc_xQ&t=4s |
| + | |
| + | |
| + | <br /> |
| + | ==Naive Bayes== |
| + | |
| + | |
| + | <br /> |
| + | ===Probability=== |
| + | |
| + | |
| + | <br /> |
| + | ===Independent and dependent events=== |
| + | |
| + | |
| + | <br /> |
| + | ===Mutually exclusive and collectively exhaustive=== |
| + | |
| + | |
| + | <br /> |
| + | ===Marginal probability=== |
| + | The marginal probability is the probability of a single event occurring, independent of other events. A conditional probability, on the other hand, is the probability that an event occurs given that another specific event has already occurred. https://en.wikipedia.org/wiki/Marginal_distribution |
| + | |
| + | |
| + | <br /> |
| + | ===Joint Probability=== |
| + | |
| + | |
| + | <br /> |
| + | ===Conditional probability=== |
| + | |
| + | |
| + | <br /> |
| + | ====Kolmogorov definition of Conditional probability==== |
| + | |
| + | |
| + | <br /> |
| + | ====Bayes s theorem==== |
| + | |
| + | |
| + | <br /> |
| + | =====Likelihood and Marginal Likelihood===== |
| + | |
| + | |
| + | <br /> |
| + | =====Prior Probability===== |
| + | |
| + | |
| + | <br /> |
| + | =====Posterior Probability===== |
| + | |
| + | |
| + | <br /> |
| + | ===Applying Bayes' Theorem=== |
| + | |
| + | |
| + | <br /> |
| + | ====Scenario 1 - A single feature==== |
| + | |
| + | |
| + | <br /> |
| + | ====Scenario 2 - Class-conditional independence==== |
| + | |
| + | |
| + | <br /> |
| + | ====Scenario 3 - Laplace Estimator==== |
| + | |
| + | |
| + | <br /> |
| + | ===Naïve Bayes - Numeric Features=== |
| + | |
| + | |
| + | <br /> |
| + | ===RapidMiner Examples=== |
| + | |
| + | |
| + | <br /> |
| + | ==Perceptrons - Neural Networks and Support Vector Machines== |
| + | |
| + | |
| + | <br /> |
| + | ==Boosting== |
| + | |
| + | |
| + | <br /> |
| + | ===Gradient boosting=== |
| + | |
| + | |
| + | <br /> |
| + | ==K Means Clustering== |
| + | |
| + | |
| + | <br /> |
| + | ===Clustering class of the Noel course=== |
| + | |
| + | |
| + | <br /> |
| + | ====RapidMiner example 1==== |
| + | |
| + | |
| + | <br /> |
| + | ==Principal Component Analysis PCA== |
| + | |
| + | |
| + | <br /> |
| + | ==Association Rules - Market Basket Analysis== |
| + | |
| + | |
| + | <br /> |
| + | ===Association Rules example in RapidMiner=== |
| + | |
| + | |
| + | <br /> |
| + | ==Time Series Analysis== |
| + | |
| + | |
| + | <br /> |
| + | ==[[Text Analytics|Text Analytics / Mining]]== |
| + | |
| + | |
| + | <br /> |
| + | ==Model Evaluation== |
| + | |
| + | |
| + | <br /> |
| + | ===Why evaluate models=== |
| + | |
| + | |
| + | <br /> |
| + | ===Evaluation of regression models=== |
| + | |
| + | |
| + | <br /> |
| + | ===Evaluation of classification models=== |
| + | |
| + | |
| + | <br /> |
| + | ===References=== |
| + | Landis JR, Koch GG. The measurement of observer agreement for categorical data. Biometrics. 1977 Mar;33(1):159-174. DOI: 10.2307/2529310. |
| + | |
| + | |
| + | <br /> |
| + | ==[[Python for Data Science]]== |
| + | |
| + | |
| + | <br /> |
| + | ===[[NumPy and Pandas]]=== |
| + | |
| + | |
| + | <br /> |
| + | ===[[Data Visualization with Python]]=== |
| + | |
| + | |
| + | <br /> |
| + | ===[[Text Analytics in Python]]=== |
| + | |
| + | |
| + | <br /> |
| + | ===[[Dash - Plotly]]=== |
| + | |
| + | |
| + | <br /> |
| + | ===[[Scrapy]]=== |
| + | |
| + | |
| + | <br /> |
| + | ==[[R]]== |
| + | |
| + | |
| + | <br /> |
| + | ===[[R tutorial]]=== |
| + | |
| + | |
| + | <br /> |
| + | ==[[RapidMiner]]== |
| + | |
| + | |
| + | <br /> |
| + | ==Assessments== |
| + | |
| + | |
| + | <br /> |
| + | ===Diploma in Predictive Data Analytics assessment=== |
| + | |
| + | |
| + | <br /> |
| + | ==Notas== |
| + | |
| + | |
| + | <br /> |
| + | ==References== |
| + | |
| + | |
| + | <br /> |