diff --git a/content/blog/2015-04-16-function-two-points-theory.md b/content/blog/2015-04-16-function-two-points-theory.md new file mode 100644 index 0000000..04f79ae --- /dev/null +++ b/content/blog/2015-04-16-function-two-points-theory.md @@ -0,0 +1,25 @@ +--- +id: 65 +title: Math Theory for Function Between Two Points +date: 2015-04-16T22:15:21+00:00 +author: Brandon Rozek +layout: post +guid: http://brandonrozek.com/?p=65 +permalink: /2015/04/function-two-points-theory/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +dsq_thread_id: + - "" + - "" +tumblr_post_id: + - "138122079174" +kind: + - note +--- + + + +[Part1](https://brandonrozek.com/wp-content/uploads/2015/04/Part1.jpeg){.broken_link} +[Part2](https://brandonrozek.com/wp-content/uploads/2015/04/Part2.jpeg){.broken_link} +[Part3](https://brandonrozek.com/wp-content/uploads/2015/04/Part3.jpeg){.broken_link} +[Part4](https://brandonrozek.com/wp-content/uploads/2015/04/Part4.jpeg){.broken_link} \ No newline at end of file diff --git a/content/blog/2015-04-16-responsive-layout-and-animation.md b/content/blog/2015-04-16-responsive-layout-and-animation.md new file mode 100644 index 0000000..26612ae --- /dev/null +++ b/content/blog/2015-04-16-responsive-layout-and-animation.md @@ -0,0 +1,89 @@ +--- +id: 57 +title: Responsive Layout and Animation +date: 2015-04-16T22:19:36+00:00 +author: Brandon Rozek +layout: post +guid: http://brandonrozek.com/?p=57 +permalink: /2015/04/responsive-layout-and-animation/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +dsq_thread_id: + - "3688354609" + - "3688354609" +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135656876494" + - "135656876494" +kind: + - article +--- +I saw [Mike Riethmuller’s](http://madebymike.com.au/) precision typography [pen](http://codepen.io/MadeByMike/pen/YPJJYv){.broken_link}, and was highly impressed. I think the equation used has other purposes as well + + + +Side Note: I changed the form of the equation to something similar to y = mx + b so that I can more easily recognize how it functions + +#### Responsive Layout + +There are many occasions where I want an element on the page to move between two points. The navigation in the header of my site (at the time of writing) is a great example of this. So knowing the two points I want it to lie between and having the screen width as the variable, I can plug in… [f(x) = (100 * (b - a)/(d - c))X + (ad - bc) / (d - c)](https://brandonrozek.com/wp-content/uploads/2015/04/responsivelayoutequation.gif){.broken_link} where a is the start pixel b is the end pixel c is the start media query d is the end media query and X is the screen width out of 100 otherwise known as 1vw \*\*Don’t forget to keep track of your units!! Whether it’s px/rem/em/etc.\*\* Say I want to push a box towards the right a minimum of 5px, a maximum of 20px and for the push to vary between the widths 400-800px. Then I would write… + +

+@media (min-width: 400px) and (max-width: 800px) {
+
+.box {
+
+position: relative;
+
+left: calc(3.75vw - 10px) /*After simplifying the equation*/ }
+
+}
+
+ +That would only make it vary between 400-800px. Now we need to include what happens under 400px and over 800px. + +

+@media (max-width: 400px) {
+
+.box {
+
+position: relative;
+
+left: 5px; }
+
+}
+
+@media (min-width: 400px) and (max-width: 800px) {
+
+.box {
+
+position: relative;
+
+left: calc(3.75vw - 10px); }
+
+}
+
+@media (min-width: 800px) {
+
+.box {
+
+position: relative;
+
+left: 20px; }
+
+}
+
+ +This is exactly like Mike’s pen, but instead he uses the equation to adjust the font-size between an upper and lower bound. You can apply this method to anything that accepts calc() and viewport units. Here is my [pen](http://codepen.io/brandonrozek/pen/JoQVEb){.broken_link} showing some use cases. To make your life easier, I made a quick little tool where you can input the variables and it will provide you with a simpler form of the equation to put into your calc() function [here](http://codepen.io/brandonrozek/pen/KpPwGL){.broken_link}. + +#### Animation + +This is where the majority of my research went towards. It’s not as practical as say positioning an element is but I find it interesting. Like, what if I can manipulate the acceleration of the function? [f(x) = ((b - a) / (d^n - c^n))X^n + (ad^n - bc^n) / (d^n - c^n) ](https://brandonrozek.com/wp-content/uploads/2015/04/accelerationequation.gif){.broken_link} Where a is the start unit b is the end unit c is the start time d is the end time n is the acceleration modifier and X is time The interesting part of the function here is the n. If I keep n at 1, then the acceleration is constant. If it’s less than one, then it’s fast in the beginning and slows down at the end. If it’s greater than one, then it’s the opposite. I also made a little pen [here](http://codepen.io/brandonrozek/pen/RNzdOV){.broken_link} to demo this for you. + +#### Conclusion + +Having a function that goes between two points is incredibly handy. Now when it comes to positioning, I don’t have to guess which values match the design. If i cant something to be between here and there fluidly, I can do it. What about animation? Chaining them together should have an interesting affect… P.S For those of you crazy people who like to see the theory behind the math, (like myself) I have my scanned work [here](https://brandonrozek.com/2015/04/function-two-points-theory/). \ No newline at end of file diff --git a/content/blog/2015-05-23-animatable-border.md b/content/blog/2015-05-23-animatable-border.md new file mode 100644 index 0000000..b4a52ce --- /dev/null +++ b/content/blog/2015-05-23-animatable-border.md @@ -0,0 +1,130 @@ +--- +id: 85 +title: 'Animatable: Border' +date: 2015-05-23T19:59:25+00:00 +author: Brandon Rozek +layout: post +guid: http://brandonrozek.com/?p=85 +permalink: /2015/05/animatable-border/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +dsq_thread_id: + - "3807156267" + - "3807156267" +tumblr_post_id: + - "135657818649" + - "135657818649" +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +kind: + - article +--- +This is part 1 of an animation series I’m doing. It is inspired by Lea Verou’s talk called “[The Humble Border-Radius.](https://www.youtube.com/watch?v=JSaMl2OKjfQ)” I looked at her site and she has a good demo of a bunch of different animations [here](http://lea.verou.me/2011/10/animatable-a-css-transitions-gallery/). My goal here is to create a more comprehensive guide to these different animatable properties–mainly for future reference. Animations play a big part in adding interactivity to the web, so why not explore some possible options? + + + +This post follows well along with my Codepen [demo](http://codepen.io/brandonrozek/full/waWMWR/){.broken_link}, where I’ll state the box number that applies to what I’m talking about. \*\*Initial values must be explicitly stated, implicit initial values are generally ignored in animation\*\* \*\\*\*In English terms, you must have already stated a value for what you are animating before you animate it\*\** + +### Border-color {#border-color} + + * Accepts 1 to 4 color values + * Each value corresponds to each side of the border (starting from the top and going clockwise) + * Initial Value: currentColor + +Border-color animates by splitting the colors to their red, green and blue components and raises/lowers them to it’s new value. ([Demo](http://codepen.io/brandonrozek/pen/PqzPMe){.broken_link}) ([Spec](http://www.w3.org/TR/css3-transitions/#animtype-color)) Example of animation corresponds to #1 in the pen, but I will rewrite the relevant code here. + +

+@keyframes color {
+
+to { border-color: purple red green blue; }
+
+}
+
+.border-color {
+
+border-color: white;
+
+animation: color .4s ease-in .1s infinite alternate;
+
+}
+
+ +  + +### Border-radius {#border-radius} + + * Accepts 1 to 4 values for both horizontal and vertical radii + * Each value corresponds to a corner starting from the top left and going clockwise + * Initial Value: 0 + +

+.border-radius {
+
+border-radius: 40% 30% 60% 50% / 20% 40% 60% 80%;
+
+/** is the same as **/
+
+border-top-left-radius: 40% 20%;
+
+border-top-right-radius: 30% 40%;
+
+border-bottom-right-radius: 60% 60%;
+
+border-bottom-left-radius: 50% 80%;
+
+/** where the first value is the horizontal radius and the second value the vertical radius**/
+
+}
+
+ +For animation, this corresponds to #2 in the pen I made at the top. I’ll repeat the relevant code here. + +

+
+@keyframes radius {
+
+to { border-radius: 20%; }
+
+}
+
+.border-radius {
+
+border-radius: 0;
+
+animation: radius .5s ease-in .1s infinite alternate;
+
+}
+
+ +  + +### Border-width {#border-width} + + * Accepts 1 to 4 values + * Each value corresponds to a side of the border (starting from the top and going clockwise) + * Initial Value: medium + +For animation, this corresponds to #3 in the pen I made at the top. I’ll repeat the relevant code here. + +

+@keyframes width {
+
+to { border-width: .15rem .25rem .15rem .25rem; }
+
+}
+
+.border-width {
+
+border-width: .7rem;
+
+animation: width .5s ease-in .1s infinite alternate;
+
+}
+
+ +  + +### Conclusion + +Animations are quite enjoyable. The last box in my Codepen demo tries combining all three of those animations. (Super Wacky!)  You don’t need to use keyframe animations to achieve this, you can also use the transition property. I used keyframes so you can better visualize what’s going on. There are plenty of other animatable properties to go through, so I’ll get started on those. In the meantime, if you want to look at some of the sites I used for research I’ll include the links below. {.broken_link} {.broken_link} {.broken_link} \ No newline at end of file diff --git a/content/blog/2015-09-14-animatable-box-model.md b/content/blog/2015-09-14-animatable-box-model.md new file mode 100644 index 0000000..6225cc5 --- /dev/null +++ b/content/blog/2015-09-14-animatable-box-model.md @@ -0,0 +1,194 @@ +--- +id: 155 +title: 'Animatable: Box Model' +date: 2015-09-14T12:07:52+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=155 +permalink: /2015/09/animatable-box-model/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"17293fa1c115";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:66:"https://medium.com/@brandonrozek/animatable-box-model-17293fa1c115";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"17293fa1c115";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:66:"https://medium.com/@brandonrozek/animatable-box-model-17293fa1c115";}' +dsq_thread_id: + - "4130257548" + - "4130257548" +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657238924" + - "135657238924" +kind: + - article +--- +This post is part 2 of an animation series I am doing; you can read part 1 [here](https://brandonrozek.com/2015/05/animatable-border/). In this post, we’ll look at the different parts of the box model (margin, padding, height, and width) and see how they can be animated. + + + +The W3C has a great starting reference for the [CSS Box Model](http://www.w3.org/TR/CSS2/box.html). It can be wordy at times, but has everything you need to know. I had never heard of _margin collapsing_ until I read that. Luckily there is a great [post](https://css-tricks.com/what-you-should-know-about-collapsing-margins/) on CSS-Tricks written by Geoff Graham explaining what it is. To see it all in action, take a look at this Codepen [demo](http://codepen.io/brandonrozek/full/RWPYgV/){.broken_link}–  I reference this multiple times in this post. Now, on to the box model. + +### Margin + + * Accepts 1 to 4 numerical values (negative numbers are allowed) + * If you use 4 values, the first value is the top margin and the rest follow in a clockwise fashion + * Initial value: 0 + +Margins can be described as the space around an element. In the Codepen demo (#1), it shows 2 boxes. The first box has a margin-right that is increasing, making it seem as though it’s pushing the second box away. + +

+@keyframes margin {
+
+to { margin-right: 7rem; }
+
+}
+
+.margin {
+
+display: inline-block;
+
+height: 5rem;
+
+width: 5rem;
+
+background-color: lightblue;
+
+vertical-align: top;
+
+}
+
+.margin:first-of-type {
+
+margin-right: 0;
+
+animation: margin 4s ease 0s infinite;
+
+}
+
+ +### Padding + + * Accepts 1 to 4 non-negative values + * If you use 4 values, the first value is the top margin and the rest follow in a clockwise fashion + * Initial value: 0 + +Padding is the space between the content and the border of an element. In the demo (#2),  it shows a box in which its padding is increasing. + +

+@keyframes padding {
+
+to { padding: 2rem; }
+
+}
+
+.padding {
+
+display: inline-block;
+
+padding: 0;
+
+background-color: lightgreen;
+
+animation: padding 2.5s ease 0s infinite;
+
+}
+
+ +### Height + + * Accepts a non-negative number, this number is overridden however by (min/max)-height + * Initial value: auto + +“Height” is the height of an element without its padding, border, or margin. In the demo (#3) you can see the boxes’ height shrink, and each box begins it’s animation at a different time. + +

+@keyframes height {
+
+to { height: .01rem; }
+
+}
+
+.height {
+
+display: inline-block;
+
+height: 4rem;
+
+width: 3rem;
+
+background-color: violet;
+
+animation: height 1.25s ease 0s infinite;
+
+vertical-align: top;
+
+}
+
+.height:nth-of-type(n) {
+
+animation: height 1.25s ease .2s infinite alternate;
+
+}
+
+.height:nth-of-type(2n) {
+
+animation: height 1.25s ease .4s infinite alternate;
+
+}
+
+.height:nth-of-type(3n) {
+
+animation: height 1.25s ease .6s infinite alternate;
+
+}
+
+ +### Width + + * Accepts a non-negative number, this number is overridden however by (min/max)-width + * Initial value: auto + +“Width” is the width of an element without its padding, border, or margin. In the demo (#4), it is similar to #3, however, it’s the width being affected as opposed to the height. + +

+@keyframes width {
+
+to { width: .01rem; }
+
+}
+
+.width {
+
+margin-bottom: .2rem;
+
+height: 3rem;
+
+width: 6.5rem;
+
+background-color: bisque;
+
+}
+
+.width:nth-of-type(n) {
+
+animation: width 1.25s ease .2s infinite alternate;
+
+}
+
+.width:nth-of-type(2n) {
+
+animation: width 1.25s ease .4s infinite alternate;
+
+}
+
+.width:nth-of-type(3n) {
+
+animation: width 1.25s ease .6s infinite alternate;
+
+}
+
+
+ +### Conclusion + +And so with this we can add another collection of animations to our toolbelt! If you’re wondering why I left border out of this box-model post, it’s because I have already written a post dedicated to just the [border animation](https://brandonrozek.com/2015/05/animatable-border/). Here are some of the resources I looked at for this post. Hopefully I’ll come back with another animatable post soon! {.broken_link} {.broken_link} {.broken_link} {.broken_link} \ No newline at end of file diff --git a/content/blog/2015-10-03-animatable-location.md b/content/blog/2015-10-03-animatable-location.md new file mode 100644 index 0000000..1aed8b4 --- /dev/null +++ b/content/blog/2015-10-03-animatable-location.md @@ -0,0 +1,231 @@ +--- +id: 190 +title: 'Animatable: Location' +date: 2015-10-03T09:34:08+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=190 +permalink: /2015/10/animatable-location/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"ad9e6109d5aa";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:65:"https://medium.com/@brandonrozek/animatable-location-ad9e6109d5aa";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"ad9e6109d5aa";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:65:"https://medium.com/@brandonrozek/animatable-location-ad9e6109d5aa";}' +dsq_thread_id: + - "4194325357" + - "4194325357" +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657326384" + - "135657326384" +kind: + - article +--- +Animating the location of objects is one of the most common types of animation. It’s interesting to animate this way because you need to keep in mind how each of the element’s interact with each other to constitute a page. + + + +This is part 4 of my series on animation. Check out the other parts of this series! + + * Part 1 — [Animatable: Border](https://brandonrozek.com/2015/05/animatable-border/) + * Part 2 — [Animatable: Box Model](https://brandonrozek.com/2015/09/animatable-box-model/) + * Part 3 — [Animatable: Text](https://brandonrozek.com/2015/10/animatable-text/) + +This post goes along well with this [Codepen demo](http://codepen.io/brandonrozek/full/NGbWzo/){.broken_link}, I’ll reference it multiple times in this post. Now onto animations! + +### background-position + + * Accepts keywords, percentages, or lengths + * Offset-x | Offset-Y + * Initial Value: 0% 0% + +Background-position sets where the background is relative to it’s background-origin. In the Codepen demo (#1), you can see the background image scrolling horizontally. + +
 
+@keyframes background-position {
+ 
+ to { background-position: 100% 0%; }
+
+}
+
+.background-position {
+  background-image: url(https://upload.wikimedia.org/wikipedia/commons/d/d3/Tajik_mountains_edit.jpg);
+
+  height: 6rem;
+
+  width: 8rem;
+
+  background-size: 200% 100%;
+
+  background-position: 0% 0%;
+
+  animation: background-position 5s linear .1s infinite alternate;
+
+}
+
+ +### position with left, right, top, bottom + + * Accepts length, percentage, or some keywords + * Initial value: auto + +The left, right, top, and bottom properties require the position to be set to something other than static. When you add a value to any of these properties just imagine that value pushing the element on that side. For example: for “left: 2rem” imagine that the element is being pushed on the left side by 2rem, making it move to the right 2rem. In the demo (#2), the box is being pushed in a square path. + +

+@keyframes position {
+
+  25% {
+
+    top: 0;
+
+    left: 3rem;
+
+  }
+
+  50% {
+
+    top: 3rem;
+
+    left: 3rem;
+
+  }
+
+  75% {
+
+    top: 3rem;
+
+    left: 0;
+
+  }
+
+}
+
+.position {
+
+  position: relative;
+
+  top: 0;
+
+  left: 0;
+
+  height: 3rem;
+
+  width: 3rem;
+
+  background-color: lightblue;
+
+  animation: position 1.5s ease .1s infinite;
+
+}
+
+ +  + +### vertical-align + + * Accepts keywords, percentages, or lengths (Negative values allowed) + * Initial Value: baseline + +Vertical-align sets how vertically the inline element or text is compared to the baseline. In the Codepen demo (#3), the question has its vertical align being manipulated which causes the “Maybe” to bounce up and down. + +

+@keyframes vertical-align {
+
+  to { vertical-align: 1rem; }
+
+}
+
+.vertical-align {
+
+  font-size: 1.5rem;
+
+  vertical-align: 0;
+
+  animation: vertical-align 1s ease-out .1s infinite alternate;
+
+}
+
+ +### z-index + + * Accepts any integer value + * Initial Value: auto + +If elements overlap, z-index determines which element appears on top. If the z-index is the same, then it is controlled by source order. In the demo (#4), The z-index of the biggest box changes, revealing what is under it. + +

+@keyframes z-index {
+
+  to { z-index: 0; }
+
+}
+
+.z-index {
+
+  position: absolute;
+
+  left: 1rem;
+
+  display: inline-block;
+
+}
+
+.z-index:nth-child(1) {
+
+  height: 1rem;
+
+  width: 1rem;
+
+  background-color: lightgreen;
+
+  z-index: 4;
+
+}
+
+.z-index:nth-child(2) {
+
+  height: 2rem;
+
+  width: 2rem;
+
+  background-color: #F4FFA4;
+
+  z-index: 3;
+
+}
+
+.z-index:nth-child(3) {
+
+  height: 3rem;
+
+  width: 3rem;
+
+  background-color: #DEB0ED;
+
+  z-index: 2;
+
+}
+
+.z-index:nth-child(4) {
+
+  height: 4rem;
+
+  width: 4rem;
+
+  background-color: #D8EADF;
+
+  z-index: 5;
+
+  animation: z-index 1s ease .1s infinite alternate;
+
+}
+
+ +### Conclusion + +By animating the location of an element, it opens up a whole bunch of different opportunities. Using motion, you can signify that the user has indeed pressed the button, instead of what would otherwise leave them there clicking on the button multiple times thinking that nothing has happened. Using motion, you can bring a webpage that would’ve otherwise been boring to life. Use these animations to work, and I’ll be back with another animatable post soon! + +#### The links + + {.broken_link} {.broken_link} {.broken_link} {.broken_link} \ No newline at end of file diff --git a/content/blog/2015-10-03-animatable-text.md b/content/blog/2015-10-03-animatable-text.md new file mode 100644 index 0000000..e91f0ba --- /dev/null +++ b/content/blog/2015-10-03-animatable-text.md @@ -0,0 +1,208 @@ +--- +id: 148 +title: 'Animatable: Text' +date: 2015-10-03T08:44:51+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=148 +permalink: /2015/10/animatable-text/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"8ef239deb1ea";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:61:"https://medium.com/@brandonrozek/animatable-text-8ef239deb1ea";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"8ef239deb1ea";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:61:"https://medium.com/@brandonrozek/animatable-text-8ef239deb1ea";}' +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657083469" + - "135657083469" +kind: + - article +--- +This post is part 3 of my series on animation. In this post, I’ll show you different animations you can add onto text. If you haven’t already, you should check out [part 1](https://brandonrozek.com/2015/09/animatable-box-model/) and [part 2](https://brandonrozek.com/2015/05/animatable-border/) of this series. Animations on text can be used to bring attention, to add importance, or to convey a point. As with all animations, however, keep your user in mind and your text readable. + + + +This post follows along with a [Codepen demo](http://codepen.io/brandonrozek/full/dYGwbE/){.broken_link} I made. + +### line-height + + * Accepts certain keywords, or any positive number or length + * Initial value: normal + +Line-height is the space between each line in a text block. It is commonly recommended that you use a unitless line-height because then it takes the font-size into consideration. When you use an unitless value, the browser determines the line-height by taking the unitless value and multiplying it by the element’s font-size. In the Codepen demo (#1), you can see the line-height decreasing while the opacity increases. + +

+@keyframes line-height {
+
+  to {
+
+    opacity: 1;
+
+    line-height: 1.2;
+
+  }
+
+}
+
+.line-height {
+
+  opacity: 0;
+
+  line-height: 2.5;
+
+  animation: line-height .75s ease .2s infinite;
+
+}
+
+ +### font-weight + + * Accepts certain keywords or 100, 200, 300, 400, 500, 600, 700, 800, 900 (the higher the number, the darker the font-weight) + * Initial value: normal + +Font-weight specifies the boldness of the text. If the typeface doesn’t come with multiple weights, then the animation would only happen between the weights that it does have. In the demo (#2), the text will go from normal weight to bold. + +

+@keyframes font-weight {
+
+  to { font-weight: 900;}
+
+}
+
+.font-weight {
+
+  font-weight: 100;
+
+  animation: font-weight 2s linear .2s infinite alternate;
+
+}
+
+ +### font-size + + * Accepts any length + * Initial value: medium + +It is important to note that changing the font-size could change the value of other text properties that are dependent upon it. (Like unitless line-heights) In the demo (#3), you can see the text’s font-size shrinking. + +

+@keyframes font-size {
+
+  to { font-size: .1rem;}
+
+}
+
+.font-size {
+
+  font-size: 2rem;
+
+  animation: font-size 2s ease-out  .1s infinite;
+
+}
+
+ +### text-shadow + + * Accepts a color and 3 lengths + * Color | Offset-X | Offset-Y | Blur-radius + * Initial value: none + +Text-shadow applies a shadow to both the text and it’s text-decoration. Multiple shadows can be added, and they are applied from front to back. In the animation (#4), you can see the text’s shadow move. + +

+@keyframes text-shadow {
+
+  to { text-shadow: 25px 10px 5px rgba(0, 0, 0, .9);}
+
+}
+
+.text-shadow {
+
+    font-size: 1.5rem;
+
+    text-shadow: -10px 5px 3.5px rgba(0, 0, 0, .3);
+
+    animation: text-shadow 1s ease 0s infinite;
+
+}
+
+ +### text-decoration-color + + * Accepts a color value + * Initial value: currentColor + +This sets the color for [text-decoration-line](https://developer.mozilla.org/en-US/docs/Web/CSS/text-decoration-line) (underlines, overlines, or strike-throughs) In the demo (#5), the strike-through changes from red to black. + +

+@keyframes text-decoration-color {
+
+  to { text-decoration-color: black;}
+
+}
+
+.text-decoration-color {
+
+  text-decoration-color: red;
+
+  text-decoration-line: line-through;
+
+  animation: text-decoration-color 2s linear 0s infinite alternate;
+
+}
+
+ +### word-spacing + + * Accepts keywords or positive/negative length + * Initial value: normal + +Word-spacing defines the space between tags and words. Negative values bring the words closer to each other. In the demo (#6), you can see the word-spacing increase with ‘good bye!’ where the word ‘bye!’ is moving away. + +

+@keyframes word-spacing {
+
+  to { word-spacing: 5rem;}
+
+}
+
+.word-spacing {
+
+  word-spacing: normal;
+
+  animation: word-spacing 1s ease-in 0s infinite;
+
+}
+
+ +### letter-spacing + + * Accepts keywords or positive/negative length + * Initial value: normal + +Letter-spacing specifies the spacing between text characters. Negative values bring the letters closer together. In the demo (#7), each letter gets separated from one another. + +

+@keyframes letter-spacing {
+
+  to { letter-spacing: 2rem;}
+
+}
+
+.letter-spacing {
+
+  letter-spacing: 0;
+
+  animation: letter-spacing .75s ease 0s infinite alternate;
+
+}
+
+ +### Conclusion + +These animations show the different things you can do with text. Perhaps you’ll add a small animation to a heading to bring depth and attention, or you’ll add some to the text of a button to scream “call to action”. Whatever you decide, I hope this post helped. I’ll see you again next time with another animatable post! 🙂 + +#### The links + +[https://docs.webplatform.org/wiki/css/properties/line-height](https://developer.mozilla.org/en-US/docs/Web/CSS/line-height) {.broken_link} {.broken_link} {.broken_link} {.broken_link} {.broken_link} {.broken_link} \ No newline at end of file diff --git a/content/blog/2015-10-04-html-css-javascript-link-together.md b/content/blog/2015-10-04-html-css-javascript-link-together.md new file mode 100644 index 0000000..6e84abb --- /dev/null +++ b/content/blog/2015-10-04-html-css-javascript-link-together.md @@ -0,0 +1,129 @@ +--- +id: 210 +title: HTML, CSS, Javascript, and how they all link together +date: 2015-10-04T17:50:50+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=210 +permalink: /2015/10/html-css-javascript-link-together/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"9579f30ae529";s:21:"follower_notification";s:3:"yes";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:96:"https://medium.com/@brandonrozek/html-css-javascript-and-how-they-all-link-together-9579f30ae529";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"9579f30ae529";s:21:"follower_notification";s:3:"yes";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:96:"https://medium.com/@brandonrozek/html-css-javascript-and-how-they-all-link-together-9579f30ae529";}' +dsq_thread_id: + - "4194222476" + - "4194222476" +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657370214" + - "135657370214" +kind: + - article +--- +I’ve been teaching a small class on web development recently, and after my first lecture, I’ve gained a newfound respect for teachers. Teaching didn’t come as naturally to me as I would have imagined. I tried going in prepared: with a few outlines and a few code demos. Instead of letting my preparation go to waste, I decided to share them here with you on my site. It’s a nice break from the Animatable posts, so I hope you enjoy! + + + +I suggest a couple short readings to check out before the lecture: + + * [What is CSS](http://www.sitepoint.com/web-foundations/css/) by Adam Roberts + * [Box Model](http://www.w3.org/TR/CSS2/box.html) by the W3C + +Take a quick look if you wish. These are mostly to give an idea of what is going to happen over the next few lectures. What is HTML, CSS, and Javascript? We’ll look into the different parts that form a webpage and how they all interact with each other. + +## HTML + +HTML is where the content of your site lives. It’s also the file the server returns to no matter what, the bare-bones of a webpage. This file may contain text, pictures, and/or other media. + +## CSS + +This is where you style your content. Whether it’s through colors, layout, or typography, there are plenty of different ways for you to visually manipulate your content. + +## Javascript + +Javascript is where you add functionality of your site. Validating user input or having dynamic content are one of the many things you can do with Javascipt. + +## How do they all link together? + +HTML, CSS, and Javascript each do what they do the best. So how can you have them all play nicely on the same ball field? + +### In HTML + +Link the CSS file + +

+  <link rel='stylesheet' href='style.css' />
+
+ +Link the Javascript file + +

+  <script src='script.js'></script>
+
+ +Give the

tag a class of hello and id of world to use in CSS and Javascript + +


+  <p class='hello' id='world'></p>
+
+ +### In CSS + +Refer to any element with class=’hello’ and change it’s text color to red. + +

+.hello { color: red; }
+
+ +Any element with an id=’world’ will have it’s font-size changed to 2rem + +

+#world { font-size: 2rem; }
+
+ +You don’t have to only use the class and id attributes in html, you can refer to any attribute. This code snippet grabs any canvas element with data=’sales’ and changes it’s border to be 5px thick, dashed, and the color blue. + +

+canvas[data=sales] { border: 5px dashed blue; }
+
+ +### In Javascript + +Javascript has many properties and methods you can use to reference different HTML elements To grab (an) element(s) + +

+document.getElementById();
+document.getElementsByClassName(); //Returns an array of element(s)
+document.querySelector(); //Returns the first matching selector
+document.querySelectorAll(); //Returns an array of element(s)
+
+ +To add a class to an element + +

+element.className += “ random-class” //Note the space
+
+ +To check whether a certain condition is true in the browser + +

+window.matchMedia('aspect-ratio: 12/8'); //Returns true if the aspect ratio is 12/8
+window.innerHeight; //Is the height of the window
+window.innerWidth; //Is the width of the window
+
+ +_And a lot more_ + +## What should handle what? + +HTML, CSS, and Javascript should all handle what each of them does best. HTML should handle the content, CSS should handle the styles/presentation, and Javascript should handle the behavior of the webpage. Why, you ask? One reason is that it demonstrates a “separation of concerns”. It would be a mess if you’re writing an article in the HTML and you put style attributes all over the place. That would make the markup confusing and hard to read/edit. + +## Can’t I just put everything in a Javascript file? + +Yes you can, but then you lose some of the great features of HTML and CSS. HTML and CSS ignore everything that it doesn’t understand. When Javascript encounters something it doesn’t understand, it stops running the code completely, regardless of what comes after. Please note that I am only speaking about what gets served to the user. When it comes to what’s actually on your server, then store your content however you wish. + +## Conclusion + +To me personally, my first lecture was a mess. Some of my examples didn’t work properly in the first type-through and I was everywhere. Though, to be sharing the little knowledge I do have, comes with it’s own joy. It must not have gone as terrible as I imagined it in my head because they seemed enthusiastic for the next lecture. So I’m excited to share this outline with you, and hopefully I’ll have many more to come. Until next time. 🙂 \ No newline at end of file diff --git a/content/blog/2015-10-10-javascript-data-types.md b/content/blog/2015-10-10-javascript-data-types.md new file mode 100644 index 0000000..4c0eaef --- /dev/null +++ b/content/blog/2015-10-10-javascript-data-types.md @@ -0,0 +1,311 @@ +--- +id: 238 +title: Javascript Data Types +date: 2015-10-10T20:01:20+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=238 +permalink: /2015/10/javascript-data-types/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"edcd4e2dcf42";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:67:"https://medium.com/@brandonrozek/javascript-data-types-edcd4e2dcf42";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"edcd4e2dcf42";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:67:"https://medium.com/@brandonrozek/javascript-data-types-edcd4e2dcf42";}' +dsq_thread_id: + - "4215821079" + - "4215821079" +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657462089" + - "135657462089" +kind: + - article +--- +Javascript has multiple ways you can store your data. Each of these different ways is called a data type, and they each carry different “methods” which are helpful commands. Today, I’ll show you the different data types and methods that I use and how they’re useful. + + + +This post is by far not a comprehenive list of all the Data types and their methods. If you want one of those, please check out [MDN](https://developer.mozilla.org/en-US/docs/Web/JavaScript/Reference/Global_Objects) and/or [WebPlatform](http://docs.webplatform.org/wiki/javascript/objects){.broken_link}. This is the second lecture of the web development class I’m teaching for the newer folks over at [Math I/O](http://math-io.com). Due to the nature of Math I/O (making math games and all), the next few posts will be Javascript centric. We’re getting ready to build a new game, so I want to prepare them as much as possible. \*Excited\* ^_^ Ilya Kantor does a good job of descibing Javascript data types and their many methods in [Mastering Data Types](http://javascript.info/tutorial/mastering-data-types) which I made the recommended reading for this lecture. + +### String {#string} + +A string is one or more characters. + +
var name = "Brandon";
+ +You can access a character inside of a string by using [] notation. Inside the [] you put the index of the character you want. An index is the numeral location of the character starting from the left. It is important to note that Javascript starts counting from 0. + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ B + + r + + a + + n + + d + + o + + n +
+ + 1 + + 2 + + 3 + + 4 + + 5 + + 6 +
+ +
var firstInitial = "Brandon"[0];
+ +Now the value of firstInitial is the letter "B". + +#### Some useful methods for strings {#some-useful-methods-for-strings} + +##### String.prototype.indexOf(); {#string.prototype.indexof();} + +This can be used to find the index of any character(s) in a string. I primarily use it for when I need to check if something exists in a string. Do I have a ‘z’ in my name? + +
"Brandon".indexOf('z');
+ +Nope, so Javascript will return a -1. How about a ‘d’? + +
"Brandon".indexOf('d');
+ +Yes, Javascript will return 5 which is the index of the letter ‘d’. + +##### String.prototype.replace(); {#string.prototype.replace();} + +The replace method can replace any character(s) with other character(s). For more complex replacing, look into [Regular Expression](https://developer.mozilla.org/en-US/docs/Web/JavaScript/Guide/Regular_Expressions) and how you can use them in .replace(). Replace the first ‘n’ in my name with an ‘m’. + +

+var modifiedName = "Brandon".replace('n', 'm');
+
+console.log(modifiedName);
+
+ +Logs "Bramdon". + +##### String.prototype.toUpperCase(); {#string.prototype.touppercase();} + +This method returns the string with all the lowercase characters converted to uppercase and can be useful for when you’re checking user input and you don’t want to worry about different cases. + +
"Brandon".toUpperCase();
+ +Returns "BRANDON". + +##### String.prototype.toLowerCase(); {#string.prototype.tolowercase();} + +Same as above but instead of converting lowercase to uppercase, it converts uppercase to lowercase. + +
"Brandon".toLowerCase();
+ +Returns "brandon". + +#### A couple useful escape secquences {#a-couple-useful-escape-secquences} + + * n for newline. + * t for tab character. + +You can also use escape sequnces if you want to add “” or ‘’ to your strings. + +

+var greeting = "Hello "Brandon"";
+
+console.log(greeting);
+
+ +Returns "Hello "Brandon"". + +### Number {#number} + +Any number between -(253 – 1) and (253 – 1). + +#### Number Methods {#number-methods} + +Number methods are useful when trying to represent complex numbers. + +##### Number.prototype.toExponential(); {#number.prototype.toexponential();} + +Returns a string representing a number in exponential notation. + +
77.1234.toExponential(2);
+ +Returns "7.71e+1". + +##### Number.prototype.toFixed(); {#number.prototype.tofixed();} + +Returns a string representing a number fixed to x amount of decimal places. + +
12345.6789.toFixed(1);
+ +Returns "12345.7". + +##### Number.prototype.toPrecision(); {#number.prototype.toprecision();} + +Returns a string representing a number using x amount of significant figures. + +
5.123456.toPrecision(2);
+ +Returns "5.1". + +#### Math properties/methods {#math-properties/methods} + +In Javascript there is a Math object which contains many properties and methods which are useful for mathmatical calculations. + +##### Return Euler’s constant {#return-euler's-constant} + +Math.E which returns ~2.718. + +##### Return the natural log of x {#return-the-natural-log-of-x} + +Math.log(x) + +##### Rise x to the y power {#rise-x-to-the-y-power} + +Math.pow(x,y) + +##### Return a psuedo random number [0,1) {#return-a-psuedo-random-number-[0,1)} + +Math.random() + +##### Round x to the nearest integer {#round-x-to-the-nearest-integer} + +Math.round(x) + +### Boolean {#boolean} + +Booleans are either true or false and are typically used in conditional statements. You can either create them explicitly + +
var alive = true;
+ +or by evaluating a [comparison](https://developer.mozilla.org/en-US/docs/Web/JavaScript/Reference/Operators/Comparison_Operators). + +

+var dead = false;
+var isAlive = !dead;
+
+ +isAlive equals true. + +### Array {#array} + +An array is a list of items. In Javascript these items can be any data type, even arrays themselves. + +
var mixedBag = ['sword', 24, true, [Math.PI, Math.E], 'shield'];
+ +To access an item in an array use [] notation with an index as mentioned over at strings. + +
['sword', 'shield', 'helmet'][1];
+ +Returns 'shield'. to figure out how many items are in the array. + +

+var inventory = ['boots', 'gloves', 'pants', 'shirt'];
+var inventoryAmt = inventory.length;
+
+ +inventoryAmt is 4 since there are 4 items in inventory. + +#### Array Methods {#array-methods} + +##### Array.prototype.push(); {#array.prototype.push();} + +Adds whatever is inside the parenthesis to the end of the array. Great for adding items to a list. For example, test scores. + +
[100,92,95].push(80);
+ +Returns [100,92,95,80]. + +##### Array.prototype.reverse(); {#array.prototype.reverse();} + +Reverses the order of all the items in the array. + +
[1,2,3].reverse();
+ +Returns [3,2,1]. + +##### Array.prototype.concat(); {#array.prototype.concat();} + +Combines two arrays, putting the items from the array in the parenthesis to the end of the main array. This method is a lot faster than grabbing each item by their index and adding them using the .push() method. + +
['a','b','c'].concat([1,2,3]);
+ +Returns ['a','b','c',1,2,3]. + +##### Array.prototype.join(); {#array.prototype.join();} + +Converts the array into a string, with each item seperated by whatever is in the parenthesis. Useful for telling the user the items in their inventory, for example. + +

+var inventory = ['books','apples','pencils'];
+console.log("You have " + inventory.join(", ") + " in your inventory.");
+
+ +Logs "You have books, apples, pencils in your inventory." + +##### Array.prototype.indexOf(); {#array.prototype.indexof();} + +Similar to String.prototype.indexOf(), it returns the index of the item inside the parenthesis. + +
['chicken','pizza','tacos'].indexOf('tacos');
+ +Returns 2. + +### Objects {#objects} + +Objects are like arrays, however they’re easier for establishing the relationship between properties and their values. You can store any data type as a property of an object. + +

+var player = {};
+player.name = "Brandon";
+player.health = Number.POSITIVE_INFINITY;
+console.log(player.name + " has " + player.health + " health.");
+
+ +Logs "Brandon has Infinity health" Yup that sounds about right. + +### Conclusion {#conclusion} + +All of the different data types in Javascript are tools for you to get the job done. When assigning a variable, think to yourself which tool you should use. I had fun doing this lecture. We finished earlier than expected, due to my extra preparations. (Still shuddering over my unpreparedness from last week). We had finished so early in fact, that I went ahead and started teaching next week’s material. Do not worry though, my lovely reader’s only get the most structured of lesson materials. So you’ll have to wait until next week to hear more. 🙂 \ No newline at end of file diff --git a/content/blog/2015-10-11-animatable-visual.md b/content/blog/2015-10-11-animatable-visual.md new file mode 100644 index 0000000..25d16b2 --- /dev/null +++ b/content/blog/2015-10-11-animatable-visual.md @@ -0,0 +1,119 @@ +--- +id: 297 +title: 'Animatable: Visual' +date: 2015-10-11T16:52:36+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=297 +permalink: /2015/10/animatable-visual/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"c1119f67e27a";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:63:"https://medium.com/@brandonrozek/animatable-visual-c1119f67e27a";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"c1119f67e27a";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:63:"https://medium.com/@brandonrozek/animatable-visual-c1119f67e27a";}' +tumblr_post_id: + - "135657496179" + - "135657496179" +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +kind: + - article +--- +Hello everyone! This is part 5 of my series on animation. Today’s post will be short, since we’re only going to talk about color and opacity. + + + +I’ll give a shout-out to , if you are interested in [CSS Animation performance](https://blogs.adobe.com/webplatform/2014/03/18/css-animations-and-transitions-performance/), then check them out to see what triggers a repaint and/or reflow. Take a look at the other posts in this series! + + * Part 1 — [Animatable: Border](https://brandonrozek.com/2015/05/animatable-border/) + * Part 2 — [Animatable: Box Model](https://brandonrozek.com/2015/09/animatable-box-model/) + * Part 3 — [Animatable: Text](https://brandonrozek.com/2015/10/animatable-text/) + * Part 4 — [Animatable: Location](https://brandonrozek.com/2015/10/animatable-location/) + +This post goes with a [Codepen demo](http://codepen.io/brandonrozek/full/rOzeyO/){.broken_link} I made, I’ll reference it later in this post. + +### color {#color} + + * Accepts any [color](https://developer.mozilla.org/en-US/docs/Web/CSS/color_value) value + * Typically inherits it’s color from the parent element + +The color property sets the color of an element’s text content and its decoration. During the animation, the browser sees the colors in their red, green, and blue (rgb) components, then increments/decrements those values until it reaches the color it’s animating to. For example, in the Codepen demo (#1), the color of the text is changing from red or rgb(255, 0, 0) to green or rgb(0, 255, 0). Meaning the red component is going from 255 to 0 and the green component is going from 0 to 255 during the animation. + +
@keyframes color {
+
+  to { color: green; }
+
+}
+
+.color {
+
+  font-size: 2rem;
+
+  color: red;
+
+  text-decoration: underline;
+
+  animation: color 1.5s ease-in 0s infinite alternate;
+
+}
+
+ +### opacity {#opacity} + + * Accepts any number from [0, 1] + * Initial Value: 1 + +Opacity sets the transparency of an element and it’s decendants. Unlike display: none;, when the element is opacity: 0; the element still holds it’s space on the page. In the Codepen demo (#2), you can see the element and it’s children fading out. + +
@keyframes opacity {
+
+  to { opacity: 0; }
+
+}
+
+.opacity {
+
+  height: 5rem;
+
+  width: 5rem;
+
+  background-color: #cd86e4;
+
+  opacity: 1;
+
+  animation: opacity 2s linear 0s infinite alternate;
+
+}
+
+.opacity div {
+
+  margin-left: auto;
+
+  margin-right: auto;
+
+  height: 3rem;
+
+  width: 3rem;
+
+  background-color: lightblue;
+
+}
+
+.opacity div div {
+
+  margin-left: auto;
+
+  margin-right: auto;
+
+  height: 1rem;
+
+  width: 1rem;
+
+  background-color: #00b300;
+
+}
+
+ +### Conclusion {#conclusion} + +I used to work on a chat application called Babbler. In it, I used opacity to fade in the messages as the user recieved them. With all these different types of animations, you can visually show the user what’s going on in your website/application. Doing this series helps me, (as well as you, I hope) recognize all the different properties and possibilities for animation. This is the second to last part of this series, meaning that the next part is the finale. I’m somewhat sad to see this series ending but excited at the same time. Until next time, have fun animating. 🙂 \ No newline at end of file diff --git a/content/blog/2015-10-18-animatable-transform.md b/content/blog/2015-10-18-animatable-transform.md new file mode 100644 index 0000000..13e596e --- /dev/null +++ b/content/blog/2015-10-18-animatable-transform.md @@ -0,0 +1,144 @@ +--- +id: 337 +title: 'Animatable: Transform' +date: 2015-10-18T16:32:37+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=337 +permalink: /2015/10/animatable-transform/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"1eb4fcf6a5df";s:21:"follower_notification";s:3:"yes";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:66:"https://medium.com/@brandonrozek/animatable-transform-1eb4fcf6a5df";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"1eb4fcf6a5df";s:21:"follower_notification";s:3:"yes";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:66:"https://medium.com/@brandonrozek/animatable-transform-1eb4fcf6a5df";}' +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657540174" + - "135657540174" +kind: + - article +--- +This is the last post of the animatable series. The grand finale. Here, we will talk about the transform property. It’s only one property but it comes with a lot of goodies in the form of transform-functions. + + + +This is not a comprehensize list. If you want one of those, please check out MDN. They have a great [resource](https://developer.mozilla.org/en-US/docs/Web/CSS/transform-function). This is the last post of the animatable series, I recommend you check out the other parts too. + + * Part 1 — [Animatable: Border](https://brandonrozek.com/2015/05/animatable-border/) + * Part 2 — [Animatable: Box Model](https://brandonrozek.com/2015/09/animatable-box-model/) + * Part 3 — [Animatable: Text](https://brandonrozek.com/2015/10/animatable-text/) + * Part 4 — [Animatable: Location](https://brandonrozek.com/2015/10/animatable-location/) + * Part 5 — [Animatable: Visual](https://brandonrozek.com/2015/10/animatable-visual/) + +Animatable: Transform goes with a [CodePen demo](http://codepen.io/brandonrozek/full/ojoMyE){.broken_link} I made. Please check it out, as I will be referencing it later on in the post. + +### rotate() {#rotate()} + +The rotate() function moves the element around a fixed point as defined by the [transform-origin](https://developer.mozilla.org/en-US/docs/Web/CSS/transform-origin) property. In the Codepen demo (#1), the star continously rotates 360 degrees. + +
@keyframes rotate {
+
+  to { transform: rotate(360deg);}
+
+}
+
+.rotate {
+
+  width: 6rem;
+
+  height: 6rem;
+
+  background-image: url("https://upload.wikimedia.org/wikipedia/commons/thumb/5/51/Star_full.svg/2000px-Star_full.svg.png");
+
+  background-size: cover;
+
+  transform: none;
+
+  animation: rotate 1s ease 0s infinite;
+}
+
+ +### scale() {#scale()} + +Scale(sx, sy) modifies the size of the element by taking 2 arguments: sx and sy. Where sx is the multiplier that scales the element in the x-direction while sy is the multiplier that scales the element in the y-direction. In the CodePen demo (#2), the little ninja man scales to half his size and back to normal again. + +
@keyframes scale {
+
+  to { transform: scale(.5); }
+
+}
+
+.scale {
+
+  width: 6rem;
+
+  height: 6rem;
+
+  background-image: url("https://upload.wikimedia.org/wikipedia/commons/7/71/Monocromaticman.JPG");
+
+  background-size: contain;
+
+  background-repeat: no-repeat;
+
+  transform: none;
+
+  animation: scale 1s ease 0s infinite alternate;
+}
+
+ +### skew() {#skew()} + +Skew distorts the element by moving each point to a certain angle determined by it’s distance from the origin. In the CodePen demo (#3), the square skews -20 degrees, making it appear as a parallelogram. + +
@keyframes skew {
+
+  to { transform: skew(-20deg); }
+
+}
+
+.skew {
+
+  height: 6rem;
+
+  width: 6rem;
+
+  background-color: lightblue;
+
+  transform: none;
+
+  animation: skew .75s ease 0s infinite alternate;
+}
+
+ +### translate() {#translate()} + +Transform(tx, ty) moves the element as specified by it’s two parameters tx and ty. Tx tells the browser how many units to move it in the x direction while ty tells the browser how many units to move the element in the y direction. In the CodePen demo (#4), the car moves forward 10rem and back again. + +
@keyframes translate {
+
+  to { transform: translate(10rem);}
+
+}
+
+.translate {
+
+  height: 6rem;
+
+  width: 6rem;
+
+  background-image: url("http://res.freestockphotos.biz/pictures/15/15685-illustration-of-a-red-cartoon-car-pv.png");
+
+  background-size: contain;
+
+  background-repeat: no-repeat;
+
+  transform: none;
+
+  animation: translate 1s ease 0s infinite alternate;
+}
+
+ +### Conclusion {#conclusion} + +It is now the end of the Animatable series. I am sad to see this first completed series of mine go. It’s okay though, I’m bound to think of another series to write for you guys in no time. My goal in Animatable, is to show you (and me) what is possible using CSS animations. With this small reference completed, we have a good overview of the different tools available. Now with our new toolbelt, go out and craft meaningful experinces! \ No newline at end of file diff --git a/content/blog/2015-10-18-javascript-conditional-statements.md b/content/blog/2015-10-18-javascript-conditional-statements.md new file mode 100644 index 0000000..8497661 --- /dev/null +++ b/content/blog/2015-10-18-javascript-conditional-statements.md @@ -0,0 +1,101 @@ +--- +id: 344 +title: Javascript Conditional Statements +date: 2015-10-18T18:30:21+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=344 +permalink: /2015/10/javascript-conditional-statements/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"72ac61ee8d04";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:79:"https://medium.com/@brandonrozek/javascript-conditional-statements-72ac61ee8d04";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"72ac61ee8d04";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:79:"https://medium.com/@brandonrozek/javascript-conditional-statements-72ac61ee8d04";}' +dsq_thread_id: + - "4237729275" + - "4237729275" +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657634939" + - "135657634939" +kind: + - article +--- +Javascript, like most other programming languages, include ways to run blocks of code when something meets a condition. Here, I will describe the most common ways to do so. + + + +This post is part of my lecture series for Math I/O. There is no pre-reading for this lecture. + +### If Statement {#if-statement} + +To run a block of code when a condition is true, use an if statement. + +
    if (condition) {
+        doSomething();
+    }
+
+ +You can also run a block of code when a condition is false using the else statement. + +
    if (condition) {
+        doSomething();
+    } else {
+        doSomethingElse();
+    }
+
+ +### Switch statement {#switch-statement} + +If you want to check a variable for **equality** against multiple different cases, use a switch statement. + +
    switch (variable) {
+        case condition1:
+            doSomething();
+            break;
+        case condition2:
+            doSomethingElse();
+            break;
+        default:
+            doSomethingCompletelyDifferent();
+            break;
+    }
+
+ +The default statement runs when the variable doesn’t equal any of the cases. + +### While loop {#while-loop} + +To run a block of code over and over again until a condition is false, use a while loop. + +
    while (condition) {
+        doSomething();
+    }
+
+ +Don’t forget to include something in the loop that will eventually make the condition false, otherwise you run into an infinite loop. (Which is a loop that never stops repeating itself; most likely crashing your browser) + +### For loop {#for-loop} + +If you want to run something a certain amount of times, use a “for" loop. For loops can be broken down into three components: an initiating statement, a condition, and a statement that runs after every loop. + +
    for (var i = 0; i < 5; i++) {
+        doSomething();
+    }
+
+ +Here you have the initiating statement of var i = 0. From there you check, is i less than 5? Yes, so then we doSomething();. After we doSomething();, we add 1 to i. Now i equals 2. Is i still less than 5? Yes, so we doSomething();. Then we add 1 to i again. This loop will keep happening until i is not less than 5. + +### Conclusion {#conclusion} + +Having different control/conditional statements helps keep the state of any application you’re making. Did the user say not to notify them? Then don’t, otherwise (else) notify them. That’s all I have to say for this week. Hope this post helps you get a little more used to this big world called programming. + +
    if (youLikeThisPost) {
+        console.log("Come back next week! :)");
+    } else {
+        console.log("Aww that's okay, you should give me another chance next week :)");
+    }
+
+ +I recommend that you look at different perspectives of the same concepts. WebCheatSheet.com has a similar post to mine, check out what they had to say [here](http://webcheatsheet.com/javascript/if_else_switch.php). \ No newline at end of file diff --git a/content/blog/2015-10-25-functions.md b/content/blog/2015-10-25-functions.md new file mode 100644 index 0000000..713fb45 --- /dev/null +++ b/content/blog/2015-10-25-functions.md @@ -0,0 +1,115 @@ +--- +id: 350 +title: Functions +date: 2015-10-25T13:48:41+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=350 +permalink: /2015/10/functions/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"44583f68d3fa";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:55:"https://medium.com/@brandonrozek/functions-44583f68d3fa";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"44583f68d3fa";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:55:"https://medium.com/@brandonrozek/functions-44583f68d3fa";}' +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657661534" + - "135657661534" +kind: + - article +--- +Ever had a snippet of code that appears multiple times in different places in your program? Whenever you had to change that snippet, you end up playing this game of search and replace. Functions can help. They exist to abstract your code, making it not only easier to change that little snippet, but to read and debug your code as well. + + + +### How to create/execute a function {#how-to-create/execute-a-function} + +To make a function + +
    
+    var doSomething = function() {
+        doStuff;
+    }
+
+ +To call the above function to execute + +

+    doSomething();
+
+ +### Arguments {#arguments} + +You can also add in arguments (parameters that go inside the paraenthesis next to the word function) for the functions to use. + +

+    var add = function(number1, number2) {
+        return number1 + number2;
+    }
+
+ +And when you use the `return` keyword, like the function above. You can store the value in a variable for future use. + +
    
+    var total = add(1, 3);
+
+ +total here will equal `4` + +### Scope {#scope} + +Functions create their own scope, which means that variables created inside the function will only be able available within that function. + +The snippet below will output an error like total is not defined + +

+    var add = function(number1, number2) {
+        var total = number1 + number2;
+    }
+    console.log(total);
+
+ +Below is a correct example of the concept + +

+    //Function below converts km/hr to m/s
+    var convert = function(speed) {
+        var metersPerHour = speed * 1000;
+        var metersPerSecound = metersPerHour / 3600;
+        return metersPerSecond;
+    }
+    var currentSpeed = convert(5);
+
+ +It’s also important to note that functions can use variables outside of it; granted it resides in the same scope. + +Here is an example of a variable that doesn’t reside in the same scope as the function. (The below code will fail) + +

+    var something = function() {
+        var x = 5;
+        var y = 2;
+    }
+    something();
+    var addXandY = function() {
+        console.log(x + y);
+    }
+    addXandY();
+
+ +Below, is an example of where the variable does reside in the same scope as the function. Which allows this snippet to execute properly. + +

+    var x = 5;
+    var addX = function(a) {
+        return a + x;
+    }
+    var sum = addX(6);
+
+ +sum here will equal 11 + +### Conclusion {#conclusion} + +As long as you name them appropriately, functions are useful for abstracting your code, making them easier to understand. This concludes another lecture made for the members over at Math I/O. Until next week 🙂 \ No newline at end of file diff --git a/content/blog/2015-11-14-service-workers.md b/content/blog/2015-11-14-service-workers.md new file mode 100644 index 0000000..75d81d8 --- /dev/null +++ b/content/blog/2015-11-14-service-workers.md @@ -0,0 +1,362 @@ +--- +id: 400 +title: An Offline Experience with Service Workers +date: 2015-11-14T15:47:06+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=400 +permalink: /2015/11/service-workers/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"125e50979ed8";s:21:"follower_notification";s:3:"yes";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:88:"https://medium.com/@brandonrozek/an-offline-experience-with-service-workers-125e50979ed8";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"125e50979ed8";s:21:"follower_notification";s:3:"yes";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:88:"https://medium.com/@brandonrozek/an-offline-experience-with-service-workers-125e50979ed8";}' +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657690564" + - "135657690564" +kind: + - article +--- +I’m excited to say that I’ve written my first service worker for brandonrozek.com. What is a service worker? A service worker provides an extra layer between the client and the server. The exciting part about this is that you can use service workers to deliver an offline experience. (Cached versions of your site, offline pages, etc.) + + + +Service workers are currently supported in Chrome, Opera, and Firefox nightly. You don’t have to worry too much about browser support because the Service Worker spec was written in a [progressively enchanced](http://alistapart.com/article/understandingprogressiveenhancement) way meaning it won’t break your existing site 🙂 + +## Caveats {#caveats} + +You need HTTPS to be able to use service workers on your site. This is mainly for security reasons. Imagine if a third party can control all of the networking requests on your site? If you don’t want to go out and buy a SSL Certificate, there are a couple free ways to go about this. 1) [Cloudflare](https://www.cloudflare.com/) 2) [Let’s Encrypt](https://letsencrypt.org/) Service workers are promise heavy. Promises contain a then clause which runs code asynchronously. If you’re not accustomed to this idea please check out this [post](https://ponyfoo.com/articles/es6-promises-in-depth) by Nicolas Bevacqua. Now onto making the service worker! If you want to skip to the final code scroll down to the bottom. Unless you don’t like my syntax highlighting, then you can check out this [gist](https://gist.github.com/brandonrozek/0cf038df40a913fda655). + +## Register the service worker {#register-the-service-worker} + +Place `service-worker.js` on the root of your site. This is so the service worker can access all the files in the site. Then in your main javascript file, register the service worker. + +

+if (navigator.serviceWorker) {
+  navigator.serviceWorker.register('/serviceworker.js', {
+    scope: '/'
+  });
+}
+
+ +## Install the service worker {#install-the-service-worker} + +The first time the service worker runs, it emits the `install` event. At this time, we can load the visitor’s cache with some resources for when they’re offline. Every so often, I like to change up the theme of the site. So I have version numbers attached to my files. I would also like to invalidate my cache with this version number. So at the top of the file I added + +

+var version = 'v2.0.24:';
+
+ +Now, to specify which files I want the service worker to cache for offline use. I thought my home page and my offline page would be good enough. + +

+var offlineFundamentals = [
+    '/',
+    '/offline/'
+];
+
+ +Since cache.addAll() hasn’t been implemented yet in any of the browsers, and the polyfill implementation didn’t work for my needs. I pieced together my own. + +

+var updateStaticCache = function() {
+    return caches.open(version + 'fundamentals').then(function(cache) {
+        return Promise.all(offlineFundamentals.map(function(value) {
+            var request = new Request(value);
+            var url = new URL(request.url);
+            if (url.origin != location.origin) {
+                request = new Request(value, {mode: 'no-cors'});
+            }
+            return fetch(request).then(function(response) {
+                var cachedCopy = response.clone();
+                return cache.put(request, cachedCopy);
+            });
+        }))
+    })
+};
+
+ +Let’s go through this chunk of code. + + 1. Open the cache called 'v2.0.24:fundamentals' + 2. Go through all of the offlineFundamental‘s URLs + * Does the file I ask for come from the same domain as my site? + * No. Then, make the request ‘no-cors’ (I had difficulty getting my asset files in cors mode. If the cors headers are included in the response, then you can take out this line) + * Fetch the file from the network and then cache it. + +Now we call it when the `install` event is fired. + +

+self.addEventListener("install", function(event) {
+    event.waitUntil(updateStaticCache())
+})
+
+ +With this we now cached all the files in the offlineFundamentals array during the install step. + +## Clear out the old cache {#clear-out-the-old-cache} + +Since we’re caching everything. If you change one of the files, your visitor wouldn’t get the changed file. Wouldn’t it be nice to remove old files from the visitor’s cache? Every time the service worker finishes the install step, it releases an `activate` event. We can use this to look and see if there are any old cache containers on the visitor’s computer. From [Nicolas’ code](https://ponyfoo.com/articles/serviceworker-revolution). Thanks for sharing 🙂 + +

+var clearOldCaches = function() {
+    return caches.keys().then(function(keys) {
+            return Promise.all(
+                      keys
+                        .filter(function (key) {
+                              return key.indexOf(version) != 0;
+                        })
+                        .map(function (key) {
+                              return caches.delete(key);
+                        })
+                );
+        })
+}
+
+ + 1. Check the names of each of the cache containers + 2. If they don’t start with the correct version number + * Delete that cache container + +Call the function when the `activate` event fires. + +

+self.addEventListener("activate", function(event) {
+    event.waitUntil(clearOldCaches())
+});
+
+ +## Intercepting fetch requests {#intercepting-fetch-requests} + +The cool thing about service worker’s is that it can handle file requests. We could cache all files requested for offline use, and if a fetch for a resource failed, then the service worker can look for it in the cache or provide an alternative. This is a large section, so I’m going to attempt to break it down as much as I can. + +### Limit the cache {#limit-the-cache} + +If the visitor started browsing all of the pages on my site, his or her cache would start to get bloated with files. To not burden my visitors, I decided to only keep the latest 25 pages and latest 10 images in the cache. + +

+var limitCache = function(cache, maxItems) {
+    cache.keys().then(function(items) {
+        if (items.length > maxItems) {
+            cache.delete(items[0]);
+        }
+    })
+}
+
+ +We’ll call it later in the code. + +### Fetch from network and cache {#fetch-from-network-and-cache} + +Every time I fetch a file from the network I throw it into a specific cache container. 'pages' for HTML files, 'images' for CSS files, and 'assets' for any other file. This is so I can handle the cache limiting above easier. Defined within the `fetch` event. + +

+var fetchFromNetwork = function(response) {
+        var cacheCopy = response.clone();
+        if (event.request.headers.get('Accept').indexOf('text/html') != -1) {
+            caches.open(version + 'pages').then(function(cache) {
+                cache.put(event.request, cacheCopy).then(function() {
+                    limitCache(cache, 25);
+                })
+            });
+        } else if (event.request.headers.get('Accept').indexOf('image') != -1) {
+            caches.open(version + 'images').then(function(cache) {
+                cache.put(event.request, cacheCopy).then(function() {
+                    limitCache(cache, 10); 
+                });
+            });
+        } else {
+            caches.open(version + 'assets').then(function add(cache) {
+                cache.put(event.request, cacheCopy);
+            });
+        }
+
+        return response;
+    }
+
+ +### When the network fails {#when-the-network-fails} + +There are going to be times where the visitor cannot access the website. Maybe they went in a tunnel while they were riding a train? Or maybe your site went down. I thought it would be nice for my reader’s to be able to look over my blog posts again regardless of an internet connection. So I provide a fall-back. Defined within the `fetch` event. + +

+var fallback = function() {
+        if (event.request.headers.get('Accept').indexOf('text/html') != -1) {
+            return caches.match(event.request).then(function (response) { 
+                return response || caches.match('/offline/');
+            })
+        } else if (event.request.headers.get('Accept').indexOf('image') != -1) {
+            return new Response('<svg width="400" height="300" role="img" aria-labelledby="offline-title" viewBox="0 0 400 300" xmlns="http://www.w3.org/2000/svg"><title id="offline-title">Offline</title><g fill="none" fill-rule="evenodd"><path fill="#D8D8D8" d="M0 0h400v300H0z"/><text fill="#9B9B9B" font-family="Helvetica Neue,Arial,Helvetica,sans-serif" font-size="72" font-weight="bold"><tspan x="93" y="172">offline</tspan></text></g></svg>', { headers: { 'Content-Type': 'image/svg+xml' }});
+        } 
+    }
+
+ + 1. Is the request for a HTML file? + * Show the [offline](https://brandonrozek.com/offline/) page. + 2. Is the request for an image? + * Show a place-holder image (Courtesy of [Jeremy Keith](https://adactio.com/journal/9775)) + +### Handle the request {#handle-the-request} + +First off, I’m only handling GET requests. + +

+if (event.request.method != 'GET') {
+        return;
+}
+
+ +For HTML files, grab the file from the network. If that fails, then look for it in the cache. _Network then cache strategy_ + +

+if (event.request.headers.get('Accept').indexOf('text/html') != -1) {
+            event.respondWith(fetch(event.request).then(fetchFromNetwork, fallback));
+        return;
+        }
+
+ +For non-HTML files, follow this series of steps + + 1. Check the cache + 2. Does a cache exist for this file? + * Yes. Then show it + * No. Then grab it from the network and cache it. + +_Cache then network strategy_ + +

+event.respondWith(
+        caches.match(event.request).then(function(cached) {
+            return cached || fetch(event.request).then(fetchFromNetwork, fallback);
+        })
+    )
+
+ +For different stategy’s, take a look at Jake Archibald’s [offline cookbook](https://jakearchibald.com/2014/offline-cookbook/). + +## Conclusion {#conclusion} + +With all of that, we now have a fully functioning offline-capable website! I wouldn’t be able to implement this myself if it wasn’t for some of the awesome people I mentioned earlier sharing their experience. So share, share, share! With that sentiment, I’ll now share the full code for `service-worker.js` **Update:** There is a new version of this code over at this [blog post](https://brandonrozek.com/2015/11/limiting-cache-service-workers-revisited/). + +

+var version = 'v2.0.24:';
+
+var offlineFundamentals = [
+    '/',
+    '/offline/'
+];
+
+//Add core website files to cache during serviceworker installation
+var updateStaticCache = function() {
+    return caches.open(version + 'fundamentals').then(function(cache) {
+        return Promise.all(offlineFundamentals.map(function(value) {
+            var request = new Request(value);
+            var url = new URL(request.url);
+            if (url.origin != location.origin) {
+                request = new Request(value, {mode: 'no-cors'});
+            }
+            return fetch(request).then(function(response) {
+                var cachedCopy = response.clone();
+                return cache.put(request, cachedCopy);
+            });
+        }))
+    })
+};
+
+//Clear caches with a different version number
+var clearOldCaches = function() {
+    return caches.keys().then(function(keys) {
+            return Promise.all(
+                      keys
+                        .filter(function (key) {
+                              return key.indexOf(version) != 0;
+                        })
+                        .map(function (key) {
+                              return caches.delete(key);
+                        })
+                );
+        })
+}
+
+/*
+    limits the cache
+    If cache has more than maxItems then it removes the first item in the cache
+*/
+var limitCache = function(cache, maxItems) {
+    cache.keys().then(function(items) {
+        if (items.length > maxItems) {
+            cache.delete(items[0]);
+        }
+    })
+}
+
+
+//When the service worker is first added to a computer
+self.addEventListener("install", function(event) {
+    event.waitUntil(updateStaticCache())
+})
+
+//Service worker handles networking
+self.addEventListener("fetch", function(event) {
+
+    //Fetch from network and cache
+    var fetchFromNetwork = function(response) {
+        var cacheCopy = response.clone();
+        if (event.request.headers.get('Accept').indexOf('text/html') != -1) {
+            caches.open(version + 'pages').then(function(cache) {
+                cache.put(event.request, cacheCopy).then(function() {
+                    limitCache(cache, 25);
+                })
+            });
+        } else if (event.request.headers.get('Accept').indexOf('image') != -1) {
+            caches.open(version + 'images').then(function(cache) {
+                cache.put(event.request, cacheCopy).then(function() {
+                    limitCache(cache, 10);
+                });
+            });
+        } else {
+            caches.open(version + 'assets').then(function add(cache) {
+                cache.put(event.request, cacheCopy);
+            });
+        }
+
+        return response;
+    }
+
+    //Fetch from network failed
+    var fallback = function() {
+        if (event.request.headers.get('Accept').indexOf('text/html') != -1) {
+            return caches.match(event.request).then(function (response) { 
+                return response || caches.match('/offline/');
+            })
+        } else if (event.request.headers.get('Accept').indexOf('image') != -1) {
+            return new Response('<svg width="400" height="300" role="img" aria-labelledby="offline-title" viewBox="0 0 400 300" xmlns="http://www.w3.org/2000/svg"><title id="offline-title">Offline</title><g fill="none" fill-rule="evenodd"><path fill="#D8D8D8" d="M0 0h400v300H0z"/><text fill="#9B9B9B" font-family="Helvetica Neue,Arial,Helvetica,sans-serif" font-size="72" font-weight="bold"><tspan x="93" y="172">offline</tspan></text></g></svg>', { headers: { 'Content-Type': 'image/svg+xml' }});
+        }
+    }
+
+    //This service worker won't touch non-get requests
+    if (event.request.method != 'GET') {
+        return;
+    }
+
+    //For HTML requests, look for file in network, then cache if network fails.
+    if (event.request.headers.get('Accept').indexOf('text/html') != -1) {
+            event.respondWith(fetch(event.request).then(fetchFromNetwork, fallback));
+        return;
+        }
+
+    //For non-HTML requests, look for file in cache, then network if no cache exists.
+    event.respondWith(
+        caches.match(event.request).then(function(cached) {
+            return cached || fetch(event.request).then(fetchFromNetwork, fallback);
+        })
+    )
+});
+
+//After the install event
+self.addEventListener("activate", function(event) {
+    event.waitUntil(clearOldCaches())
+});
+
\ No newline at end of file diff --git a/content/blog/2015-11-15-fractions-js.md b/content/blog/2015-11-15-fractions-js.md new file mode 100644 index 0000000..9b0c42a --- /dev/null +++ b/content/blog/2015-11-15-fractions-js.md @@ -0,0 +1,126 @@ +--- +id: 398 +title: Math with Fractions.js +date: 2015-11-15T12:46:14+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=398 +permalink: /2015/11/fractions-js/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"dd3b15d9d3c9";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:68:"https://medium.com/@brandonrozek/math-with-fractions-js-dd3b15d9d3c9";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"dd3b15d9d3c9";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:68:"https://medium.com/@brandonrozek/math-with-fractions-js-dd3b15d9d3c9";}' +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657739439" + - "135657739439" +kind: + - article +--- +Last week I published my first library over on Github called [Fractions.js](https://github.com/brandonrozek/Fractions.js). Fractions.js is a library to help avoid the [mathmatetical errors](http://floating-point-gui.de/) in floating point arithmetic. What do you mean by floating point artihmetic errors? Here is an example: .1 * .2 outputs 0.020000000000000004 even though the correct answer is .02 + + + +## Purpose {#purpose} + +My team and I are currently working on a new game for Math I/O. One of the levels is testing whether the player can add, subtract, multiply, and divide fractions correctly. I didn’t want to implement a solution where we check if the input entered is within a range of the answer. So I asked the team, how do you add, subtract, multiply, and divide fractions in your head? As we were working through it together, I realized that this is a common problem over at Math I/O. So I decided to make a library dedicated to this. + +## How it works {#how-it-works} + +I broke up each fraction into two things, a numerator and a denominator. With these two numbers, I can figure out all of the most common operations. + +### Addition {#addition} + +For addition, if two fractions have the same denominator, then you just need to add the numerators. + + 1/3 + 1/3 = 2/3 + + +If not, then you need to change it to have a common denominator. We can do this by multiply each fractions numerator and denominator by the other fractions denominator. + + 1/2 + 1/3 = (1 * 3)/ (2 * 3) + (1 * 2)/ (2 * 3) = 3/6 + 2/6 = 5/6 + + +### Subtraction {#subtraction} + +Works the same as addition, except the second fraction is subtracted (taken away) from the first. + +### Multiplication {#multiplication} + +To multiply two fractions, just multiply the numerators by each other, and the denominators by each other. + + 2/3 * 1/2 = 2/6 + + +### Division {#division} + +Treated similar to multiplication since dividing a number is the same thing as multiplying by it’s [reciprocal](https://www.mathsisfun.com/reciprocal.html). + + 1 / (1 / 2) = 1 * 2 = 2 + + +### Simplification {#simplification} + +Sometimes with the operations above, it’ll produce fractions in an unsimplified form. To avoid any confusion, I created a simplify function. It was challanging trying to figure out a way to code this. While I was browsing around for an implementation, I knocked into Euclider’s algorithm for finding the greatest common factor. Straight from the [Wikipedia article](https://en.wikipedia.org/wiki/Euclidean_algorithm) (where a is greater than b): + + + function gcd(a, b) + while b ≠ 0 + t := b; + b := a mod b; + a := t; + return a; + + +I can then simplify the fraction by dividing the numerator and denominator by the greatest common factor. + +## The API {#the-api} + +I decided to provide as much flexibility as I can in the API. You have several ways to create a new Fraction. + +

+var oneHalf = new Fraction(1,2);
+var oneHalf = new Fraction(.5);
+var oneHalf = new Fraction("1/2");
+var oneHalf = new Fraction("1", "2")
+
+ +All of these results will return a Fraction with a numerator of 1 and a denominator of 2. You also have two different ways to do the most common operations. + +

+var fiveThirds = Fraction.add("1/3", "4/3");
+var fiveThirds = new Fraction("1/3").add("4/3");
+
+ +The second style came from how jQuery implements it’s library. That way you can chain operations. + +

+new Fraction("1/2").add("2/3").divide("5/6").subtract("7/8").multiply("6/5").toString()
+
+ +Outputs '63/100' This is accomplished in the code through [prototypes](http://javascriptissexy.com/javascript-prototype-in-plain-detailed-language/). + +

+Fraction.add = function(frac1, frac2) {
+    Fraction.correctArgumentLength(2, arguments.length);
+    frac1 = Fraction.toFraction(frac1)
+    frac2 = Fraction.toFraction(frac2)
+
+    var newFrac = frac1;
+    newFrac.numerator = frac1.numerator * frac2.denominator + frac1.denominator * frac2.numerator;
+    newFrac.denominator = frac1.denominator * frac2.denominator;
+    return Fraction.simplify(newFrac);
+}
+Fraction.prototype.add = function(frac) {
+    Fraction.correctArgumentLength(1, arguments.length);
+    return Fraction.change(this, Fraction.add(this, frac));
+}
+
+ +In the code, the add prototype calls the Fraction.add function within it to avoid code duplication. + +## Conclusion {#conclusion} + +After I coded this up, I looked online for different implementations and found [fraction.js](https://github.com/ekg/fraction.js) by [Erik Garrison](http://hypervolu.me/~erik/). It’s important to look at different implementations and see which matches your needs better. This post isn’t meant to go fully into detail of the library. To know what else the library can do, visit the [readme page](https://github.com/brandonrozek/Fractions.js/blob/master/README.md). If you’re curious in how it’s implemented, check out the [code](https://github.com/brandonrozek/Fractions.js/blob/master/Fraction.js). [Email me](mailto:hello@brandonrozek.com) if you have any questions/criticisms 🙂 \ No newline at end of file diff --git a/content/blog/2015-11-30-limiting-cache-service-workers-revisited3.md b/content/blog/2015-11-30-limiting-cache-service-workers-revisited3.md new file mode 100644 index 0000000..1c6d513 --- /dev/null +++ b/content/blog/2015-11-30-limiting-cache-service-workers-revisited3.md @@ -0,0 +1,247 @@ +--- +id: 449 +title: Limiting the Cache in Service Workers Revisited +date: 2015-11-30T00:34:15+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=449 +permalink: /2015/11/limiting-cache-service-workers-revisited3/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"9cc502aae12e";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:93:"https://medium.com/@brandonrozek/limiting-the-cache-in-service-workers-revisited-9cc502aae12e";}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"9cc502aae12e";s:21:"follower_notification";s:2:"no";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:93:"https://medium.com/@brandonrozek/limiting-the-cache-in-service-workers-revisited-9cc502aae12e";}' +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135657767639" + - "135657767639" +tumblr_crosspostr_crosspost: + - 'N' +kind: + - article +--- +Summary: I rewrote how cache limiting works to address a few problems listed later in this post. Check out the [gist](https://gist.github.com/brandonrozek/0cf038df40a913fda655) for the updated code. + + + +I wrote a function in my [previous service worker post](https://brandonrozek.com/2015/11/service-workers/) to help limit the cache. Here’s a reminder of what it looked like. + +

+var limitCache = function(cache, maxItems) {
+	cache.keys().then(function(items) {
+		if (items.length > maxItems) {
+			cache.delete(items[0]);
+		}
+	})
+}
+
+ +### The Problem + +Jeremy Keith updated the service worker on his site and noticed that the images has blown past the amount he allocated for it ([post](https://adactio.com/journal/9844)). Looking back at my service worker, I noticed that mine has the same shortcoming as well. So what happened? Service workers function in an asynchronous manner. Meaning it can be processing not just one, but many fetch events at the same time. This comes into conflict when there are synchronous instructions such as deleting the first item from the cache which Jeremy describes in his follow up [post](https://adactio.com/journal/9888). + +### A Solution + +Jeremy wrote a function to help trim the cache and asked when it would be appropriate to apply it. + +

+var trimCache = function (cacheName, maxItems) {
+    caches.open(cacheName)
+        .then(function (cache) {
+            cache.keys()
+                .then(function (keys) {
+                    if (keys.length > maxItems) {
+                        cache.delete(keys[0])
+                            .then(trimCache(cacheName, maxItems));
+                    }
+                });
+        });
+};
+
+ +And that got me thinking. In what situations is this problem more likely to occur? This particular problem happens when a lot of files are being called asynchronously. This problem doesn’t occur when only one file is being loaded. So when do we load a bunch of files? During page load. During page load, the browser might request css, javascript, images, etc. Which for most [websites](http://royal.pingdom.com/2011/11/21/web-pages-getting-bloated-here-is-why/), is a lot of files. Let’s now move our focus back to the humble script.js. Before, the only role it played with service workers was registering the script. However, if we can get the script to notify the service worker when the page is done loading, then the service worker will know when to trim the cache. + +

+if ('serviceWorker' in navigator) {
+	navigator.serviceWorker.register('https://yourwebsite.com/serviceworker.js', {scope: '/'});
+}
+window.addEventListener("load", function() {
+	if (navigator.serviceWorker.controller != null) {
+		navigator.serviceWorker.controller.postMessage({"command":"trimCache"});
+	}
+});
+
+ +Why if (navigator.serviceWorker.controller != null)? Service Workers don’t take control of the page immediately but on subsequent page loads, Jake Archibald [explains](https://jakearchibald.com/2014/using-serviceworker-today/). When the service worker does have control of the page however, we can use the [postMessage api](https://developer.mozilla.org/en-US/docs/Web/API/Worker/postMessage) to send a message to the service worker. Inside, I provided a json with a “command” to “trimCache”. Since we send the json to the service worker, we need to make sure that it can receive it. + +

+self.addEventListener("message", function(event) {
+	var data = event.data;
+	
+	if (data.command == "trimCache") {
+		trimCache(version + "pages", 25);
+		trimCache(version + "images", 10);
+		trimCache(version + "assets", 30);
+	}
+});
+
+ +Once it receives the command, it goes on to trim all of the caches. + +### Conclusion + +So whenever you download a bunch of files, make sure to run navigator.serviceWorker.controller.postMessage({"command":"trimCache"}); on the main javascript file to trim the cache. A downside to this method is that since Service Workers don’t take control during the first page load, the cache isn’t trimmed until the second page load. If you can find a way to make it so that this event happens in the first page load [tell me](mailto:hello@brandonrozek.com) about it/write a blog post. 🙂 **Update:** To get the service worker to take control of the page immediately call [self.skipWaiting()](https://developer.mozilla.org/en-US/docs/Web/API/ServiceWorkerGlobalScope/skipWaiting) after the install event and [self.clients.claim()](https://developer.mozilla.org/en-US/docs/Web/API/Clients/claim) after the activate event. Current code for our humble service worker: + +

+var version = 'v2.0.24:';
+
+var offlineFundamentals = [
+	'/',
+	'/offline/'
+];
+
+//Add core website files to cache during serviceworker installation
+var updateStaticCache = function() {
+	return caches.open(version + 'fundamentals').then(function(cache) {
+		return Promise.all(offlineFundamentals.map(function(value) {
+			var request = new Request(value);
+			var url = new URL(request.url);
+			if (url.origin != location.origin) {
+				request = new Request(value, {mode: 'no-cors'});
+			}
+			return fetch(request).then(function(response) { 
+				var cachedCopy = response.clone();
+				return cache.put(request, cachedCopy); 
+				
+			});
+		}))
+	})
+};
+
+//Clear caches with a different version number
+var clearOldCaches = function() {
+	return caches.keys().then(function(keys) {
+			return Promise.all(
+          			keys
+            			.filter(function (key) {
+              				return key.indexOf(version) != 0;
+            			})
+            			.map(function (key) {
+              				return caches.delete(key);
+            			})
+        		);
+		})
+}
+
+/*
+	trims the cache
+	If cache has more than maxItems then it removes the excess items starting from the beginning
+*/
+var trimCache = function (cacheName, maxItems) {
+    caches.open(cacheName)
+        .then(function (cache) {
+            cache.keys()
+                .then(function (keys) {
+                    if (keys.length > maxItems) {
+                        cache.delete(keys[0])
+                            .then(trimCache(cacheName, maxItems));
+                    }
+                });
+        });
+};
+
+
+//When the service worker is first added to a computer
+self.addEventListener("install", function(event) {
+	event.waitUntil(updateStaticCache()
+				.then(function() { 
+					return self.skipWaiting(); 
+				})
+			);
+})
+
+self.addEventListener("message", function(event) {
+	var data = event.data;
+	
+	//Send this command whenever many files are downloaded (ex: a page load)
+	if (data.command == "trimCache") {
+		trimCache(version + "pages", 25);
+		trimCache(version + "images", 10);
+		trimCache(version + "assets", 30);
+	}
+});
+
+//Service worker handles networking
+self.addEventListener("fetch", function(event) {
+
+	//Fetch from network and cache
+	var fetchFromNetwork = function(response) {
+		var cacheCopy = response.clone();
+		if (event.request.headers.get('Accept').indexOf('text/html') != -1) {
+			caches.open(version + 'pages').then(function(cache) {
+				cache.put(event.request, cacheCopy);
+			});
+		} else if (event.request.headers.get('Accept').indexOf('image') != -1) {
+			caches.open(version + 'images').then(function(cache) {
+				cache.put(event.request, cacheCopy);
+			});
+		} else {
+			caches.open(version + 'assets').then(function add(cache) {
+				cache.put(event.request, cacheCopy);
+			});
+		}
+
+		return response;
+	}
+
+	//Fetch from network failed
+	var fallback = function() {
+		if (event.request.headers.get('Accept').indexOf('text/html') != -1) {
+			return caches.match(event.request).then(function (response) { 
+				return response || caches.match('/offline/');
+			})
+		} else if (event.request.headers.get('Accept').indexOf('image') != -1) {
+			return new Response('Offlineoffline', { headers: { 'Content-Type': 'image/svg+xml' }});
+		} 
+	}
+	
+	//This service worker won't touch non-get requests
+	if (event.request.method != 'GET') {
+		return;
+	}
+	
+	//For HTML requests, look for file in network, then cache if network fails.
+	if (event.request.headers.get('Accept').indexOf('text/html') != -1) {
+        	event.respondWith(fetch(event.request).then(fetchFromNetwork, fallback));
+		return;
+    	}
+
+	//For non-HTML requests, look for file in cache, then network if no cache exists.
+	event.respondWith(
+		caches.match(event.request).then(function(cached) {
+			return cached || fetch(event.request).then(fetchFromNetwork, fallback);
+		})
+	)	
+});
+
+//After the install event
+self.addEventListener("activate", function(event) {
+	event.waitUntil(clearOldCaches()
+				.then(function() { 
+					return self.clients.claim(); 
+				})
+			);
+});
+
+ +

+if ('serviceWorker' in navigator) {
+	navigator.serviceWorker.register('https://brandonrozek.com/serviceworker.js', {scope: '/'});
+}
+window.addEventListener("load", function() {
+	if (navigator.serviceWorker.controller != null) {
+		navigator.serviceWorker.controller.postMessage({"command":"trimCache"});
+	}
+});
+
\ No newline at end of file diff --git a/content/blog/2015-12-22-playing-with-qr-codes.md b/content/blog/2015-12-22-playing-with-qr-codes.md new file mode 100644 index 0000000..97075ec --- /dev/null +++ b/content/blog/2015-12-22-playing-with-qr-codes.md @@ -0,0 +1,48 @@ +--- +id: 572 +title: Playing with QR Codes +date: 2015-12-22T15:13:44+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=572 +permalink: /2015/12/playing-with-qr-codes/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "135727537264" + - "135727537264" +bridgy_syndication: + - | + + https://twitter.com/B_RozekJournal/status/790337750280970241 +kind: + - article +--- +Looking at Aaron Parecki’s [“Fun with QR Codes”](https://aaronparecki.com/articles/2015/10/05/1/fun-with-qr-codes) inspired me to play with QR Codes myself. Using the tool [QArt Coder](http://research.swtch.com/qr/draw) made by [Russ Cox](https://plus.google.com/116810148281701144465), I made a QR Code with my face in it! + + + +qrcode-large + +### Why QR Codes? + +QR Codes aren’t prevalent in the United States of America. In fact, they’re often viewed by technologists as a [joke](http://picturesofpeoplescanningqrcodes.tumblr.com/). But as [Christina Xu](http://www.christinaxu.org/) points out on her Medium post [“Pictures of Chinese People Scanning QR Codes”](https://medium.com/chrysaora-weekly/pictures-of-chinese-people-scanning-qr-codes-a564047ec58f), it’s not a joke everywhere. In fact, many people actually depend on this humble little QR code to get by in their day. Another story, my family and I go out to eat sometimes. Occasionally, we’ll knock into a Heinz Ketchup bottle. + +
+ Picture of Heinz ketchup bottle with QR Code. + +

+ Picture by Azad Zahoory +

+
My brother would get so excited whenever he saw this. This little ketchup bottle meant that we got to play a + +trivia game. No matter what you think of QR Codes, vanity or not, there are people who use it every day. So have some fun and make yourself a QR Code of your own. You know, just in case 😉 + +### Setting up the QR Code + +First, you need a picture. I used a picture of myself. Then for the QArt Coder site to work correctly, the image needs to be in high-contrast. Meaning, it needs to be mostly black and white. To accomplish this, fire up [Gimp](https://www.gimp.org/) (or your image editor of choice), and hit Color -> Threshold. That will give you a black and white version of the picture where you can then play around with the slider to get it just how you want it. After that, open up [QArt Coder](http://research.swtch.com/qr/draw) and upload the image onto the site. Once that’s accomplished, you might need to play with the QR Size, Image Size, Rotation, and other options. After that, hit “Save this QR Code” and viola! You got yourself three different sizes of QR codes to use. What should you do with the QR Code after you get it? First, brag to your friends about how cool it looks. Then maybe put it on your [business card](https://www.webdesignerdepot.com/2011/07/30-creative-qr-code-business-cards/). If you can think of any other excuses uses of QR Codes [contact me](mailto:hello@brandonrozek.com) 🙂 \ No newline at end of file diff --git a/content/blog/2015-12-27-creating-vcards-from-h-cards.md b/content/blog/2015-12-27-creating-vcards-from-h-cards.md new file mode 100644 index 0000000..cde20c2 --- /dev/null +++ b/content/blog/2015-12-27-creating-vcards-from-h-cards.md @@ -0,0 +1,324 @@ +--- +id: 599 +title: Creating vCards from h-cards +date: 2015-12-27T15:17:12+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=599 +permalink: /2015/12/creating-vcards-from-h-cards/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:74:"https://cdn-images-1.medium.com/fit/c/200/200/1*dmbNkD5D-u45r44go_cf0g.png";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"9eab6bd8e0e4";s:21:"follower_notification";s:3:"yes";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:74:"https://medium.com/@brandonrozek/creating-vcards-from-h-cards-9eab6bd8e0e4";}' +mf2_cite: + - 'a:1:{s:6:"author";a:0:{}}' +tumblr_post_id: + - "136059699334" +kind: + - article +--- +Microformats is semantic HTML used to convey metadata. Using an userscript, I can generate a vCard from the representative h-card of the page. The code for this is on this gist [here.](https://gist.github.com/brandonrozek/e0153b2733e947fa9c87) + + + +### Terminology + +[Microformats](http://microformats.org/wiki/Main_Page) allows search engines, browsers, websites, or people like me to consume content on a site. + +[H-card](http://microformats.org/wiki/h-card) is a type of microformat that serves as a contact card for people and organizations. + +[vCard](https://en.wikipedia.org/wiki/VCard) is the standard for electronic business cards. They’re most likely used in your phone to store contacts. + +Userscript is essentially JavaScript that runs in the [Greasemonkey](http://www.greasespot.net/) extension. + +### What I’ll need + + * Microformat parser + * Way to find the representative h-card + * Way to generate a vCard from an h-card + * The userscript itself + +### Implementation + +To keep everything in small [reusable components](https://en.wikipedia.org/wiki/Modular_programming), I created four different sections. Thankfully, [Glenn Jones](http://glennjones.net/) already wrote a JavaScript microformats parser called [microformat-shiv.](https://github.com/glennjones/microformat-shiv) It’s licensed with [MIT](https://tldrlegal.com/license/mit-license), so we can use it, yay! + +Next, I need to find the representative h-card of the page. Following the [instructions](http://microformats.org/wiki/representative-h-card-parsing) on the microformats wiki, I wrote the following code. + +

+/*
+   representative-h-card - v0.1.0
+   Copyright (c) 2015 Brandon Rozek
+   Licensed MIT 
+*/
+
+/**
+	Finds the representative h-card of the page
+	[http://microformats.org/wiki/representative-h-card-parsing]
+	@returns representative h-card if found, null otherwise
+**/
+var representativeHCard = function(hCards, url) {
+	if (hCards.items.length == 0) {
+		return null;
+	} else if (hCards.items.length == 1 && urlsMatchURL(hCards.items[0], url)) {
+		hCard = hCards;
+		hCard.items = [hCards.items[0]];
+		return hCard
+	} else {
+		for (var i = 0; i < hCards.items.length; i++) {
+			if (urlsMatchURL(hCards.items[i], url) && (uidsMatchURL(hCards.items[i], url) || relMeMatchURL(hCards, url))) {
+				hCard = hCards;
+				hCard.items = [hCards.items[i]];
+				return hCard
+			}
+
+		}
+	}
+	return null;
+}
+
+var urlsMatchURL = function(hCard, url) {
+	var urls = hCard.properties.url;
+	if (typeof(urls) == "object") {
+		for (var i = 0; i < urls.length; i++) {
+			if (new URL(urls[i]).toString() == new URL(url).toString()) {
+				return true;
+			}
+		}
+	}
+	return false;
+}
+var uidsMatchURL = function(hCard, url) {
+	var uids = hCard.properties.uid;
+	if (typeof(uids) == "object") {
+		for (var i = 0; i < uids.length; i++) {
+			if (new URL(uids[i]).toString() == new URL(url).toString()) {
+				return true;
+			}
+		}
+	}
+	return false;
+};
+var relMeMatchURL = function(microformats, url) {
+	var me = microformats.rels.me;
+	if (typeof(me) == "object") {
+		for (var i = 0; i < me.length; i++) {
+			if (new URL(me[i]).toString() == new URL(url).toString()) {
+				return true;
+			}
+		}
+	}
+	return false;
+}
+
+ +Next up, is making the vCard. For this, I had to look at the [vCard 4.0 specification](https://tools.ietf.org/html/rfc6350) to figure out what the property names and values are. Then I browsed around different sites (takes you to a random [Indieweb](https://indiewebcamp.com/) site)  to figure out which properties are the most common. + +The properties I ended up adding to the vCard. + + * name + * photo + * telephone numbers + * URLs + * [IMPPs](https://en.wikipedia.org/wiki/Instant_Messaging_and_Presence_Protocol) (Instant Messaging and Presence Protocol) + * emails + * roles + * categories + * notes + + As I was browsing around, I noticed that a few people would have empty values for certain properties on their h-card. To avoid having this show up on the vCard, I added a filter that takes out empty strings. + +

+/*
+   vCard-from-h-card - v0.1.0
+   Copyright (c) 2015 Brandon Rozek
+   Licensed MIT 
+*/
+var makeVCard = function(hCard) {
+	var vCard = "BEGIN:VCARDnVERSION:4.0n";
+
+	//Add full name
+	var name = hCard.items[0].properties.name;
+	if (typeof(name) == "object") {
+		name.removeEmptyStrings();
+		for (var i = 0; i < name.length; i++) {
+			vCard += "FN: " + name[i] + "n";
+		}
+	}
+
+	//Add photo
+	var photo = hCard.items[0].properties.photo;
+	if (typeof(photo) == "object") {
+		photo.removeEmptyStrings();
+		for (var i = 0; i < photo.length; i++) {
+			vCard += "PHOTO: " + photo[i] + "n";
+		}
+	}
+
+	//Add phone number
+	var tel = hCard.items[0].properties.tel;
+	if (typeof(tel) == "object") {
+		tel.removeEmptyStrings();
+		for (var i = 0; i < tel.length; i++) {
+			try {
+				if (new URL(tel[i]).schema == "sms:") {
+					vCard += "TEL;TYPE=text;VALUE=text: " + new URL(tel[i]).pathname + "n";
+				} else {
+					vCard += "TEL;TYPE=voice;VALUE=text: " + new URL(tel[i]).pathname + "n";
+				}
+			} catch(e) {
+				vCard += "TEL;TYPE=voice;VALUE=text: " + tel[i] + "n";
+			}
+		}
+	}
+
+	//Add URLs
+	var url = hCard.items[0].properties.url;
+	if (typeof(url) == "object") {
+		url.removeEmptyStrings();
+		for (var i = 0; i < url.length; i++) {
+			vCard += "URL: " + url[i] + "n";
+		}
+	}
+
+	var impp = hCard.items[0].properties.impp;
+	//Add IMPP (Instant Messaging and Presence Protocol)
+	if (typeof(impp) == "object") {
+		impp.removeEmptyStrings();
+		for (var i = 0; i < impp.length; i++) {
+			vCard += "IMPP;PREF=" + (i + 1) + ": " + impp[i] + "n";
+		}
+	}
+
+	//Add emails
+	var email = hCard.items[0].properties.email;
+	if (typeof(email) == "object") {
+		email.removeEmptyStrings();
+		for (var i = 0; i < email.length; i++) {
+			try {
+				vCard += "EMAIL: " + new URL(email[i]).pathname + "n";
+			} catch (e) { 
+				vCard += "EMAIL: " + email[i] + "n" 
+			}		
+		}
+	}
+
+	//Add roles
+	var role = hCard.items[0].properties.role;
+	if (typeof(role) == "object") {
+		role.removeEmptyStrings();
+		for (var i = 0; i < role.length; i++) {
+			vCard += "ROLE: " + role[i] + "n";
+		}
+	}
+
+	//Add Organizations
+	var org = hCard.items[0].properties.org;
+	if (typeof(org) == "object") {
+		org.removeEmptyStrings();
+		for (var i = 0; i < org.length; i++) {
+			vCard += "ORG: " + org[i] + "n";
+		}
+	}
+
+	//Add Categories
+	var category = hCard.items[0].properties.category; 
+	if (typeof(category) == "object") {
+		vCard += "CATEGORIES: " + category.removeEmptyStrings().join(",") + "n";
+	}
+
+	//Add notes
+	var note = hCard.items[0].properties.note;
+	if (typeof(note) == "object") {
+		note.removeEmptyStrings();
+		for (var i = 0; i < note.length; i++) {
+			vCard += "NOTE: " + note[i] + "n";
+		}
+	}
+
+	return vCard + "END:VCARD";
+	
+}
+
+Array.prototype.removeEmptyStrings = function() {
+	return this.filter(function(i) { return i !== "" })
+}
+
+
+ +Now for the final part, making the userscript. Inspired by [Ryan Barret](https://snarfed.org/) and his userscript [Let’s Talk,](https://github.com/snarfed/misc/blob/master/userscripts/lets_talk.user.js) this userscript brings all of the above modules together. First it grabs the microformats from the page using microformat-shiv. + +For some reason, when I tried filtering it by ‘h-card’ it froze my computer. So I wrote my own little filter instead. + +After I grab the representative h-card from the page using the little module I wrote, I generated a vCard. With the vCard generated, I set up a little HTML and CSS to display the link in the top left corner of the screen. + +The link is actually a [data uri](https://developer.mozilla.org/en-US/docs/Web/HTTP/data_URIs) that has all of the information of the vCard encoded in it. Depending on your browser, once you click the link you might have to hit CTRL-S to save. + +

+/*
+   show-vCard - v0.1.0
+   Copyright (c) 2015 Brandon Rozek
+   Licensed MIT 
+*/
+var filterMicroformats = function(items, filter) {
+	var newItems = [];
+	for (var i = 0; i < items.items.length; i++) {
+		for (var k = 0; k < items.items[i].type.length; k++) {
+			if (filter.indexOf(items.items[i].type[k]) != -1) {
+				newItems.push(items.items[i]);
+			}
+		}
+	}
+	items.items = newItems;
+	return items;
+}
+var render = function() {
+	var hCards = filterMicroformats(Microformats.get(), ['h-card']);
+	var person = representativeHCard(hCards, location.origin);
+	if (person == null) {
+		return;
+	}
+
+	var node = document.createElement("div");
+	node.setAttribute("class", "lt");
+	
+	var link = "<a href="text/vcf;base64," + btoa(makeVCard(person))+ "" target="_blank">vCard</a>";
+	var style = " 
+			.lt { 
+				position: absolute; 
+				left: 24px; 
+				top: 0; 
+				color: #DDD; 
+				background-color: #FFD700; 
+				z-index: 9999; 
+				border-width: medium 1px 1px; 
+				border-style: none solid solid; 
+				border-color: #DDD #C7A900 #9E8600; 
+				box-shadow: 0px 1px rgba(0, 0, 0, 0.1), 0px 1px 2px rgba(0, 0, 0, 0.1), 0px 1px rgba(255, 255, 255, 0.34) inset; 
+				border-radius: 0px 0px 4px 4px; 
+		        } 
+			.lt a { 
+				padding: .5rem; 
+			 	color: #8f6900; 
+			 	text-shadow: 0px 1px #FFE770; 
+				border: medium none; 
+			} 
+		     ";
+
+	node.innerHTML = link + style;
+	document.body.appendChild(node);	
+}
+document.addEventListener("DOMContentLoaded", function() {
+	render();
+});
+
+ +Sadly, I have no way of controlling the file name when you save it so you’ll have to manually rename it to something more meaningful than a random string of characters. Also remember to add the extension ‘.vcf’ for it to be recognized by some devices. + +### Conclusion + +Fire up your favorite userscript handling tool and add the [script](https://gist.github.com/brandonrozek/e0153b2733e947fa9c87) in! Of course, since it’s pure JavaScript, you can also add it to your own site to serve the same purpose. + +I ran into a small problem loading a contact onto my Android 5.0.2 phone. Apparently, they don’t support vCard 4.0 yet so I had to go into the file and change the line that says “VERSION 4.0” to “VERSION 3.0” which then allowed me to import the file into my contacts. + +As with all the code I write, feel free to comment/criticize. I love hearing feedback so if you spot anything, [contact me](mailto:hello@brandonrozek.com) 🙂 + +Also posted on [IndieNews](http://news.indiewebcamp.com/en){.u-syndication} \ No newline at end of file diff --git a/content/blog/2016-08-16-pass-password-manager.md b/content/blog/2016-08-16-pass-password-manager.md new file mode 100644 index 0000000..d3e8afb --- /dev/null +++ b/content/blog/2016-08-16-pass-password-manager.md @@ -0,0 +1,94 @@ +--- +id: 919 +title: Pass the password manager +date: 2016-08-16T23:37:09+00:00 +author: Brandon Rozek +layout: post +guid: http://brandonrozek.com/?p=919 +permalink: /2016/08/pass-password-manager/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";N;s:21:"follower_notification";s:3:"yes";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:4:"none";s:3:"url";N;}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +tumblr_post_id: + - "149056904199" +bridgy_syndication: + - https://twitter.com/B_RozekJournal/status/790336614866100224 +tumblr_crosspostr_crosspost: + - 'N' +mf2_syndicate-to: + - 'a:1:{i:0;s:4:"none";}' +kind: + - note +--- +Looking over the list of programs installed on my computer, one of my all time favorites is a program called [Pass](https://www.passwordstore.org/). It’s a program available under most Linux distributions, Mac OS X (through [Brew](http://brew.sh/)), [Windows](https://github.com/mbos/Pass4Win), [Android](https://play.google.com/store/apps/details?id=com.zeapo.pwdstore), and [iOS](https://github.com/davidjb/pass-ios#readme). It stores all of the passwords using gpg encryption and stores them as actual files on the hard disk. Meaning if you wanted, you can sync them to all your devices! + +This program assumes a light familiarity with the terminal + + + +## Setup {#setup} + +First if you do not already have a gpg key, [create one](http://wooledge.org/~greg/crypto/node41.html). + +Then in the terminal type in + + pass init youremail@address + +Substituting youremail@address with the email associated with your gpg key. + +This will autmatically create an empty repository under your home folder in a folder labeled `.pass` + +If you are switching from an existing password manager, check to see if on the [Pass homepage](https://www.passwordstore.org/), there doesn’t exist a script to help you out + +## Basic Tasks {#basic-tasks} + +To insert a password into pass + + pass insert password-name + +It will then prompt you to enter the password + +To show passwords you have already inserted + + pass + +To show an individual password + + pass password-name + +But generally I find it handy to have it automatically in my clipboard. You can do that with the -c option + + pass -c password-name + +You can generate new secure passwords using pass. (-c copies the result into your clipboard) + + pass generate -c password-name password-length + +If you don’t want it to output symbols, use the -n option to restrict it to alphanumericals + + pass generate -n -c password-name password-length + +Another command i find handy is the `find` command. Mainly because I have over a 100 passwords in this system and i tend to forget what I named some of them + + pass find search-string + +There are too many commands to list them all, but if you ever want to find out more, check out the manual entry page for `pass` + + man pass + +## Extra: Syncing {#sync} + +I use a nextCloud instance on my server to sync my passwords, but I don’t see a reason why this wouldn’t work with other projects like dropbox, syncthing, or any other sync solution + +Some sync solutions don’t like to sync folders that begin with a ‘.’, my solution around this is to create a symbolic link between that and a folder you wish to link it to + + ln -s /path/to/home/folder/.password-store /path/to/sync/folder/password-store + +Then you just need to make sure to make the same link to all your other computers + +## Conclusion {#conclusion} + +I like Pass for it’s ease of use and for the fact that I’m not tied into any one company for managing my passwords. It’s based on open source tools and the fact I didn’t have to configure a database is a huge plus for me + +If you’re in a need of a password manager (I hope you have more than one password), then give pass a shot. It served me and my many passwords well. \ No newline at end of file diff --git a/content/blog/2017-03-07-knit-document-rstudio.md b/content/blog/2017-03-07-knit-document-rstudio.md new file mode 100644 index 0000000..c96e42d --- /dev/null +++ b/content/blog/2017-03-07-knit-document-rstudio.md @@ -0,0 +1,29 @@ +--- +id: 2090 +title: Knit a Document in RStudio +date: 2017-03-07T04:29:50+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=2090 +permalink: /2017/03/knit-document-rstudio/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +mf2_syndicate-to: + - 'a:1:{i:0;s:4:"none";}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +tumblr_post_id: + - "158095811719" +format: aside +kind: + - note +--- +In case you were wondering how I got all the R code and output for the [“Do females live longer than males?”](https://brandonrozek.com/portfolio/male-vs-female-life-expectancy/) page. There is actually a function in RStudio that allows one to compile a report based on code and it’s output. + + + +First go to File->Knit Document. If this is your first time, then it will install RMarkdown, a dependency this tool needs to compile the report. + +Once that is downloaded, it will let you choose between three different file formats (HTML, PDF, MS Word). For the purposes of blog posts, I like to output it in HTML so I can copy and paste the code. But for personal use, I like using PDFs + +After you select the file format, hit compile, and voila! A nice neat compiled report is created for you. Here is a [pdf](https://brandonrozek.com/wp-content/uploads/2017/03/LifeExpectancy.pdf) example of the report I made. \ No newline at end of file diff --git a/content/blog/2017-03-07-uniformity-math-random.md b/content/blog/2017-03-07-uniformity-math-random.md new file mode 100644 index 0000000..ea76278 --- /dev/null +++ b/content/blog/2017-03-07-uniformity-math-random.md @@ -0,0 +1,132 @@ +--- +id: 2095 +title: Uniformity of Math.random() +date: 2017-03-07T21:50:52+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=2095 +permalink: /2017/03/uniformity-math-random/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +mf2_syndicate-to: + - 'a:1:{i:0;s:4:"none";}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +tumblr_post_id: + - "158123669889" +format: aside +kind: + - note +--- +There are many cases where websites use random number generators to influence some sort of page behavior. One test to ensure the quality of a random number generator is to see if after many cases, the numbers produced follow a uniform distribution. + + + +Today, I will compare Internet Explorer 11, Chrome, and Firefox on a Windows 7 machine and report my results. + +## Hypothesis + +H0: The random numbers outputted follow the uniform distribution + +HA: The random numbers outputted do not follow the uniform distribution + +## Gathering Data + +I wrote a small [website](http://share.zeropointshift.com/files/2017/03/random.html) and obtained my data by getting the CSV outputted when I use IE11, Firefox, and Chrome. + +The website works by producing a random number using Math.random() between 1 and 1000 inclusive and calls the function 1,000,000 times. Storing it’s results in a file + +This website produces a file with all the numbers separated by a comma. We want these commas to be replaced by newlines. To do so, we can run a simple command in the terminal + +

+grep -oE '[0-9]+' Random.csv > Random_corrected.csv
+
+ +Do this with all three files and make sure to keep track of which is which. + +Here are a copy of my files for [Firefox](https://brandonrozek.com/wp-content/uploads/2017/03/Firefox_corrected.csv), [Chrome](https://brandonrozek.com/wp-content/uploads/2017/03/Chrome_corrected-1.csv), and [IE11](https://brandonrozek.com/wp-content/uploads/2017/03/IE11_corrected.csv) + +## Check Conditions + +Since we’re interested in if the random values occur uniformly, we need to perform a Chi-Square test for Goodness of Fit. With every test comes some assumptions + +Counted Data Condition: The data can be converted from quantatative to count data. + +Independence Assumption: One random value does not affect another. + +Expected Cell Frequency Condition: The expected counts are going to be 10000 + +Since all of the conditions are met, we can use the Chi-square test of Goodness of Fit + +## Descriptive Statistics + +For the rest of the article, we will use R for analysis. Looking at the histograms for the three browsers below. The random numbers all appear to occur uniformly + +
rm(list=ls())
+chrome = read.csv("~/Chrome_corrected.csv", header = F)
+firefox = read.csv("~/Firefox_corrected.csv", header = F)
+ie11 = read.csv("~/IE11_corrected.csv", header = F)
+
+ +

+hist(ie11$V1, main = "Distribution of Random Values for IE11", xlab = "Random Value")
+ +![](https://brandonrozek.com/wp-content/uploads/2017/03/ie11hist.png) + +
hist(firefox$V1, main = "Distribution of Random Values for Firefox", xlab = "Random Value")
+ +![](https://brandonrozek.com/wp-content/uploads/2017/03/firefoxhist.png) + +
hist(chrome$V1, main = "Distribution of Random Values for Chrome", xlab = "Random Value")
+ +![](https://brandonrozek.com/wp-content/uploads/2017/03/chromehist.png) + +## Chi-Square Test + +Before we run our test, we need to convert the quantatative data to count data by using the plyr package + +
#Transform to count data
+library(plyr)
+chrome_count = count(chrome)
+firefox_count = count(firefox)
+ie11_count = count(ie11)
+
+ +Run the tests + +

+# Chi-Square Test for Goodness-of-Fit
+chrome_test = chisq.test(chrome_count$freq)
+firefox_test = chisq.test(firefox_count$freq)
+ie11_test = chisq.test(ie11_count$freq)
+
+# Test results
+chrome_test
+ +As you can see in the test results below, we fail to reject the null hypothesis at a 5% significance level because all of the p-values are above 0.05. + + ## + ## Chi-squared test for given probabilities + ## + ## data: chrome_count$freq + ## X-squared = 101.67, df = 99, p-value = 0.4069 + +
firefox_test
+ + ## + ## Chi-squared test for given probabilities + ## + ## data: firefox_count$freq + ## X-squared = 105.15, df = 99, p-value = 0.3172 + +
ie11_test
+ + ## + ## Chi-squared test for given probabilities + ## + ## data: ie11_count$freq + ## X-squared = 78.285, df = 99, p-value = 0.9384 + +## Conclusion + +At a 5% significance level, we fail to obtain enough evidence to suggest that the distribution of random number is not uniform. This is a good thing since it shows us that our random number generators give all numbers an equal chance of being represented. We can use Math.random() with ease of mind. \ No newline at end of file diff --git a/content/blog/2017-03-09-simplifying-expressions-octave.md b/content/blog/2017-03-09-simplifying-expressions-octave.md new file mode 100644 index 0000000..72250f5 --- /dev/null +++ b/content/blog/2017-03-09-simplifying-expressions-octave.md @@ -0,0 +1,59 @@ +--- +id: 2115 +title: Simplifying Expressions with Octave +date: 2017-03-09T02:09:58+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=2115 +permalink: /2017/03/simplifying-expressions-octave/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +mf2_syndicate-to: + - 'a:1:{i:0;s:22:"bridgy-publish_twitter";}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +tumblr_post_id: + - "158172999969" +mf2_syndication: + - 'a:1:{i:0;s:60:"https://twitter.com/B_RozekJournal/status/839659534146801665";}' +format: aside +kind: + - note +--- +Octave is a high level programming language intended for numerical computations. One of the cool features of this is that with symbolic expressions, you can then simplify mathematical expressions. + + + +## Setup + +First install [Octave](https://www.gnu.org/software/octave/) and the [symbolic package](https://octave.sourceforge.io/symbolic/) using the website or your package manager of choice. + +Then in octave type in the following code + + + pkg load symbolic + + +## Usage + +For every variable not defined earlier in your expression, make sure to declare it as a symbolic data type + +
syms x y
+ +Then make an expression + +

+expr = y + sin(x)^2 + cos(x)^2
+
+ +You can then ask Octave to simplify the expression for you + +

+simp_expr = simplify(expr)
+
+ +Displaying it shows it as + +
(sym) y + 1
+ +Which is indeed a simplification using a trig identity 🙂 \ No newline at end of file diff --git a/content/blog/2017-03-14-monte-carlo-pi.md b/content/blog/2017-03-14-monte-carlo-pi.md new file mode 100644 index 0000000..1dcf5b2 --- /dev/null +++ b/content/blog/2017-03-14-monte-carlo-pi.md @@ -0,0 +1,125 @@ +--- +id: 2089 +title: Monte Carlo Pi +date: 2017-03-14T05:31:21+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=2089 +permalink: /2017/03/monte-carlo-pi/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +tumblr_post_id: + - "158383170019" +mf2_syndicate-to: + - 'a:1:{i:0;s:22:"bridgy-publish_twitter";}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +mf2_syndication: + - 'a:1:{i:0;s:60:"https://twitter.com/B_RozekJournal/status/841522141346570244";}' +format: aside +kind: + - note +--- +Using Monte Carlo methods, we can create a simulation that approximates pi. In this post, we will go over the math behind the approximation and the code. + + + +## The Math + +Pi is a mathematical constant consisting of the ratio between the circumfrence of a circle and it’s diameter. + +The circumfrence of the circle is defined to be $$ C = 2\pi r$$ while the diameter of the circle is $$d = 2r$$ + +Take the ratio between the two and you get $$\frac{2\pi r}{2r} = \pi$$ + +Now let us consider the area of a circle. One can derive the area of a circle by taking the integral of the circumfrence with respect to it’s radius $$ A_{circle} = \int{(2\pi r) dr} = \pi r^2 $$ + +Let us simplify the formula more by setting the radius equal to one. $$A_{circle} = \pi$$ + +Now consider only the first quadrant of the circle. Since our circle is centered at the origin and all the points on the circumfrence is equidistant from the center, our area is now $$A_{circle} = \frac{1}{4} \pi$$ + +And bound the quarter-circle in a 1×1 box with an area of $$A_{square} = 1^2 = 1$$ + +Notice that the ratio between the circle and the square is a quarter of pi $$\frac{A\_{circle}}{A\_{square}} = \frac{\frac{1}{4} \pi}{1} = \frac{1}{4} \pi$$ + +## Simulation and Statisitcs + +The formula for a circle centered at the origin with radius one is $$x^2 + y^2 = 1$$ + +Let us focus again on the first quadrent, and do a Monte Carlo simulation to find the area of the quarter-circle + +![](https://brandonrozek.com/wp-content/uploads/2017/03/circlefilled.png) + +We can do this by what is called the dart board method. We generate a random x and y between 0 and 1. If it satisfies the inequality $$x^2 + y^2 \leq 1$$ then it counts as being inside the circle, if not then it lies outside the circle. + +That point will count as an really small area. The point will always be inside the square but may sometimes be inside the circle. Running the simulations a large number of times allows us to add up all the tiny little areas that make up the circle and the square. + +To add up these small areas we need to make an assumption. The assumption is that the variance of all the little Monte Carlo trials are the same. Since we are using a psuedo-random number generator, it is safe to assume it is met. + +This will allow us to perform a pooled empiricle probability on the simulations to sum up the areas. + +Meaning the area of the circle will be the number of times that the inequality was satisfied $$A_{circle} = \# Successes$$ + +And the area of the square will be the number of times the simulation was run, since the random numbers generated will always be between 0 and 1 $$A_{square} = \# Trials$$ + +Recall that taking the ratio of the area of the circle and the area of the square is a fourth of pi. $$\frac{\frac{1}{4} \pi}{1} = \frac{1}{4} \pi$$ + +Multiply this number by 4 and you get the value for pi. + +This tells us that four times the probability that the randomly generated point is in the circle is equal to pi. + +$$\pi = 4 \* (Probability\ of\ being\ inside\ circle) = 4 \* \frac{\# Success}{\# Trials} = 4 * \frac{A\_{circle}}{A\_{square}}$$ + +## Implementation + +For the Monte Carlo simulation I used Java. The BigDecimal implementation was used so that there wouldn’t be any issue with integer size limits + +
/** Calculates Pi
+  * @author Brandon Rozek
+*/
+// Big Integers are used so we don't run into the integer size limit
+import java.math.BigInteger;
+import java.math.BigDecimal;
+class MonteCarloPi {
+        public static void main(String[] args) {
+
+                BigInteger successes = BigInteger.ZERO;
+                BigInteger trials = BigInteger.ZERO;
+
+ +For this simulation, we will run 1,000,000,000 trials + +
 BigInteger numTrials = new BigInteger("1000000000");
+/*
+    Monte Carlo Simulation
+        Generate a random point 0 <= x < 1 and 0 <= y < 1
+        If the generated point satisfies x^2 + x^2 < 1
+           Count as a success
+        Keep track of the number of trials and successes
+*/
+for (; trials.compareTo(numTrials) < 0; trials = trials.add(BigInteger.ONE)) {
+    double randomX = Math.random();
+    double randomY = Math.random();
+    if (Math.pow(randomX, 2) + Math.pow(randomY, 2) < 1) {
+        successes = successes.add(BigInteger.ONE);
+    }
+}
+
+ +And then we finalize it with a quick calculation of pi + +
// (Number of successes) / (Number of trials) * 4 gives the approximation for pi
+BigDecimal pi = new BigDecimal(successes)
+                       .divide(new BigDecimal(trials))
+                       .multiply(new BigDecimal("4"));
+System.out.println("The calculated value of pi is: " + pi);
+}}
+
+ +## Conclusion + +We found an approximation of pi using the Monte Carlo methods! I find that really awesome, however, there are some concerns I have with this approach. + +1) We don’t keep track of double counting. One possible solution for this is increasing the radius and bounding box appropriately so that the probability of double counting is low. + +2) Speed. The more trials you ask it to run, the longer it takes to perform all of the simulations. One possible way around this is to write a parrallel version of this code. That’s possible because of the equal variance that we spoke of earlier. Pooling the successses and trials will still result in a good approximation. \ No newline at end of file diff --git a/content/blog/2017-05-24-viewing-java-applets.md b/content/blog/2017-05-24-viewing-java-applets.md new file mode 100644 index 0000000..7dbe207 --- /dev/null +++ b/content/blog/2017-05-24-viewing-java-applets.md @@ -0,0 +1,74 @@ +--- +id: 2174 +title: Viewing Java Applets +date: 2017-05-24T15:59:45+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=2174 +permalink: /2017/05/viewing-java-applets/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +mf2_syndicate-to: + - 'a:1:{i:0;s:22:"bridgy-publish_twitter";}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +tumblr_post_id: + - "161024360884" +mf2_syndication: + - 'a:1:{i:0;s:60:"https://twitter.com/B_RozekJournal/status/867409810932760576";}' +kind: + - article +--- +When you use an IDE there are many things you can take for granted. A section of an intro level computer science course at my university uses [JGrasp](http://www.jgrasp.org/) to build Java Applets. + +Following around using a normal text editor, I found that I couldn’t just compile and run the code like I have with my java programs in the past. To be able to help around and assist in the course, I need to be able to build and run these applications. The rest of this article describes the process I underwent to be able to use my existing setup to write and build java applets. Of course you can always install JGrasp and have that all built in, but it’s always nice to not have to change your workflow. + + + +When I tried following along, I would receive the following error + + Main method not found in class HelloWorld, please define main method as... + +Which makes sense since I have never defined a main method inside my source code. So how do I go about doing this? + +## Setup + +Java Applets are meant to run on web pages, because of this one needs an html file to host the applet. The following code gives you the bare minimum for setting up the html file. I called it `HelloWorld.html`. + +

+<html>
+    <head><title>Applet Container<title>
+    <body>
+        <applet code='HelloWorld.class' width=400 height=400></applet>
+    </body>
+</html>
+
+ +## Hello World Program + +To get it up and running, I will show a “Hello World” like application for applets. + +

+import javax.swing.JApplet;
+import java.awt.Graphics;
+
+public class HelloWorld extends JApplet {
+    public void paint(Graphics g) {
+        g.drawString("Hello World", 30, 30);
+    }
+} 
+
+ +## Running the Applet + +Now we need to compile the code + +
javac HelloWorld.java
+ +Then run the appletviewer + +
appletviewer HelloWorld.html
+ +## Conclusion + +This tutorial concludes the setup of running a simple Java applet. From here you can look at the different methods in the [Graphics library](https://docs.oracle.com/javase/7/docs/api/java/awt/Graphics.html) and play around 😀 \ No newline at end of file diff --git a/content/blog/2017-06-05-java-swing-components.md b/content/blog/2017-06-05-java-swing-components.md new file mode 100644 index 0000000..eff5468 --- /dev/null +++ b/content/blog/2017-06-05-java-swing-components.md @@ -0,0 +1,205 @@ +--- +id: 2198 +title: Java Swing Components +date: 2017-06-05T23:30:18+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=2198 +permalink: /2017/06/java-swing-components/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +mf2_syndicate-to: + - 'a:1:{i:0;s:4:"none";}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +tumblr_post_id: + - "161484582559" +kind: + - article +--- +This post, over time, will serve as a reference to myself and others of the different UI components available in the Swing library. This post assumes a general familiarity with setting up a basic Swing application and focuses only on the individual components. + + + +### Buttons + +Buttons are created using the JButton component. The constructor takes the text placed inside the button. + +

+JButton stopBtn = new JButton("Stop");
+
+ + + +You can also add images inside a button. To do that you need to get the image and make it into an icon. The following code grabs the image file “smallpanda.jpg” from the current working directory. + +

+Image img = this.getImage(this.getCodeBase(), "smallpanda.jpg");
+ImageIcon imgIcon = new ImageIcon(img);
+JButton feedBtn = new JButton("Feed", imgIcon);
+
+ +Sometimes, you want to change the location of the text in the button. Like say, we want to place the text in the center horizontally and bottom vertically. + +

+feedBtn.setHorizontalTextPosition(JButton.CENTER);
+feedBtn.setVerticalTextPosition(JButton.BOTTOM);
+
+ +Don’t forget to add your buttons to the screen! + +

+this.add(stopBtn);
+this.add(feedBtn);
+
+ + + +### Labels and Textfields + +One of the most common forms of input is a text field, usually distinguished with a label. Those components are called JTextField and JLabel respectively. The constructor for JTextArea can take just the width of the text field, or another common use is to have already inputed text and its width. + +

+    JLabel nameLabel = new JLabel("Enter in your name: ");
+    
+    // Create an input and set the width to be 10px wide
+    JTextField nameInput = new JTextField(10);
+    //Override nameInput with a field already contains the text "Brandon"
+    //And is 10px wide
+    nameInput = new JTextField("Brandon", 10);
+    
+    this.add(nameLabel);
+    this.add(nameInput);
+
+ + + +### Checkboxes + +Checkboxes are commonly used when giving the possibility for multiple answers. Such as, check all of the foods that you like. + +

+    JCheckBox pizza = new JCheckBox("Pizza");
+    JCheckBox noodles = new JCheckBox("Noodles");
+    JCheckBox rice = new JCheckBox("Rice");
+    this.add(pizza);
+    this.add(noodles);
+    this.add(rice);
+
+ + + +You can even replace the default look of the checkbox with an image. To do this, you need to make image icons for both when it’s checked and when it’s unchecked. + +

+Image checkedImage = this.getImage(this.getCodeBase(), "checked.png");
+Image uncheckedImage = this.getImage(this.getCodeBase(), "unchecked.png");
+
+ImageIcon checkedIcon = new ImageIcon(checkedImage);
+ImageIcon uncheckedIcon = new ImageIcon(uncheckedImage);
+
+JCheckBox checkbox = new JCheckBox("Check Me", uncheckedIcon);
+checkbox.setSelectedIcon(checkedIcon);
+
+this.add(checkbox);
+
+ + + + +### Text Areas + +Text Areas are different from text fields in which it is made to be able to hold multiple lines of text. It’s called JTextArea and its construction takes a width and height as it’s arguments. + +

+JTextArea textarea = new JTextArea(10, 10);
+
+ +By default, when the someone inputs more text than the size can hold, it will automatically grow with the text inputted. To override this behaviour and instead introuduce scroll bars. One must define a ScrollPane and put the TextArea inside of it by using it as the scroll pane’s argument for its constructor. + +

+JScrollPane scrollPane = new JScrollPane(textarea);
+
+ + + +### Radio Buttons + +Radio buttons are used for when you only want one out of many different options to be selected. For this, one needs to define a button group that houses the radio buttons for the user to choose from. This can be achieved with ButtonGroup and JRadioButton respectively. + +

+// Make the radio buttons
+JRadioButton radio1 = new JRadioButton("Pies");
+JRadioButton radio2 = new JRadioButton("Cakes");
+JRadioButton radio3 = new JRadioButton("Cookies");
+
+// Put the radio buttons in a group
+Button Group desserts = new ButtonGroup();
+desserts.add(radio1);
+desserts.add(radio2);
+desserts.add(radio3);
+
+// Add the radio buttons to the screen
+this.add(radio1);
+this.add(radio2);
+this.add(radio3);
+
+ + + +### JList + +To display a list of items that are clickable by the user, you can use a `JList`. JLists require a model that stores the list implementation, we’ll use `DefaultListModel` to achieve this purpose. + +

+DefaultListModel model = new DefaultListModel();
+JList list = new JList(model);
+
+ +To add scrolling capabilities, remember to add it to a scroll pane + +

+JScollPane sp = new JScrollPane(list);
+
+ +You can set the number of items you wish to see in the list. The example below, allows us to see three items in the list. + +

+list.setVisibleRowCount(3);
+
+ +There are a variety of ways to add items to the list. If a number is specified that tells it to place it at the index specified. Starting from the top at zero, to the button. + +

+model.addElement("Apples")
+model.addElement("Cherries");
+model.addElement("Bananas");
+// Adds 'Oranges' to the top
+model.add(0, "Oranges");
+
+ +Sometimes, you want to only let the user select one item. At the end, don’t forget to add the component to the screen! + +

+list.setSelectionMode(ListSelectionModel.SINGLE_SELECTION);
+this.add(sp);
+
+ + + +### JComboBox + +To create a dropdown list of different options, consider using a JComboBox. + +

+JComboBox cb = new JComboBox();
+cb.addItem("Select Food Option");
+cb.addItem("Pizza");
+cb.addItem("Burger");
+cb.addItem("Hot Dog");
+cb.addItem("Steak");
+// Add it to the screen
+this.add(cb);
+
+ + \ No newline at end of file diff --git a/content/blog/2017-06-05-using-system-themes-java-swing.md b/content/blog/2017-06-05-using-system-themes-java-swing.md new file mode 100644 index 0000000..b96b3e4 --- /dev/null +++ b/content/blog/2017-06-05-using-system-themes-java-swing.md @@ -0,0 +1,45 @@ +--- +id: 2192 +title: Using System Themes In Java Swing +date: 2017-06-05T20:36:22+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=2192 +permalink: /2017/06/using-system-themes-java-swing/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +mf2_syndicate-to: + - 'a:1:{i:0;s:4:"none";}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +tumblr_post_id: + - "161478693279" +mf2_syndication: + - 'a:1:{i:0;s:60:"https://twitter.com/B_RozekJournal/status/871828083459936257";}' +kind: + - article +--- +The default theme for Java Swing components is a cross-platform theme called “Metal”. I use the Adapta theme for GTK on Linux and this theme does not match at all what my other GUI applications look like. So here, I will describe a simple way to utlize already existent system themes in Java Swing applications. + + + +### Solution + +In the init method of your java application, place the following code. + +

+try {
+    UIManager.setLookAndFeel(UIManager
+                               .getSystemLookAndFeelClassName());
+} catch(Exception e) {}
+
+ +Here the application will attempt to look up the system theme and set that as the default styles for the Swing components. If the lookup fails, then it will default back to the metal theme. + +For more information, check out this page from [Oracle](http://docs.oracle.com/javase/tutorial/uiswing/lookandfeel/plaf.html). + +### Discussion + +If it is so easy to set up applications that look native to each desktop environment, why not have that by default? With the cross platform metal theme, you can ensure that the style of your application is the same across all the operating systems. In this fashion, you don’t need to worry about spacing between components and have full control of the “look and feel” of your application. + +Since I am used to development for the web, I don’t have strong motivation to have an application look the same on all platforms. I prefer the application to match the system theme and look like it was built for the platform that I am on. One loses partial control on the presentation of your application across different desktop environmnets, but with a strong layout, it is possible to make it look organized and integrated. \ No newline at end of file diff --git a/content/blog/2017-08-28-escape-sequences-java.md b/content/blog/2017-08-28-escape-sequences-java.md new file mode 100644 index 0000000..a631270 --- /dev/null +++ b/content/blog/2017-08-28-escape-sequences-java.md @@ -0,0 +1,96 @@ +--- +id: 2236 +title: Escape Sequences in Java +date: 2017-08-28T17:12:00+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=2236 +permalink: /2017/08/escape-sequences-java/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +mf2_syndicate-to: + - 'a:1:{i:0;s:4:"none";}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +tumblr_post_id: + - "164716848139" +tumblr_crosspostr_crosspost: + - 'N' +kind: + - note +--- +Sometimes you want to format your outputs. This is a quick cheatsheet containing the differerent escape sequences + +  + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ Character + + Escape Sequence +
+ Newline + + \n +
+ Tab + + \t +
+ Backspace + + \b +
+ Double Quote            + + \” +
+ Single Quote + + \’ +
+ Backslash + + \\ +
\ No newline at end of file diff --git a/content/blog/2017-08-28-obtaining-command-line-input-java.md b/content/blog/2017-08-28-obtaining-command-line-input-java.md new file mode 100644 index 0000000..e32fd5c --- /dev/null +++ b/content/blog/2017-08-28-obtaining-command-line-input-java.md @@ -0,0 +1,136 @@ +--- +id: 2241 +title: Obtaining Command Line Input in Java +date: 2017-08-28T17:37:59+00:00 +author: Brandon Rozek +layout: post +guid: https://brandonrozek.com/?p=2241 +permalink: /2017/08/obtaining-command-line-input-java/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";N;s:10:"author_url";N;s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";N;s:2:"id";N;s:21:"follower_notification";N;s:7:"license";N;s:14:"publication_id";N;s:6:"status";N;s:3:"url";N;}' +mf2_syndicate-to: + - 'a:1:{i:0;s:4:"none";}' +mf2_cite: + - 'a:4:{s:9:"published";s:25:"0000-01-01T00:00:00+00:00";s:7:"updated";s:25:"0000-01-01T00:00:00+00:00";s:8:"category";a:1:{i:0;s:0:"";}s:6:"author";a:0:{}}' +tumblr_post_id: + - "164717769554" +mf2_mp-syndicate-to: + - 'a:1:{i:0;s:4:"none";}' +kind: + - note +--- +To obtain console input for your program you can use the Scanner class + +First import the relevant library + +

+import java.util.Scanner;
+
+ +Then create a variable to hold the Scanner object + +

+Scanner input;
+input = new Scanner(System.in);
+
+ +Inside the parenthesis, the Scanner binds to the System input which is by default the console + +The new varible input now has the ability to obtain input from the console. To do so, use any of the following methods + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ Method + + What it Returns +
+ next() + + The next space seperated string from the console +
+ nextInt() + + An integer if it exists from the console +
+ nextDouble()              + + A double if it exists from the console +
+ nextFloat() + + A float if it exists from the console +
+ nextLine() + + A string up to the next newline character from the console +
+ hasNext() + + Returns true if there is another token +
+ close() + + Unbinds the Scanner from the console +
+ +Here is an example program where we get the user’s first name + +

+import java.util.Scanner;
+
+public class GetName {
+  public static void main(String[] args) {
+    Scanner input = new Scanner(System.in);
+    System.out.print("Please enter your name: ");
+    String firstName = input.next();
+    System.out.println("Your first name is " + firstName); 
+  }
+}
+
\ No newline at end of file diff --git a/content/blog/2018-01-22-identifying-misspelled-words-dataset-hunspell.md b/content/blog/2018-01-22-identifying-misspelled-words-dataset-hunspell.md new file mode 100644 index 0000000..f2a6990 --- /dev/null +++ b/content/blog/2018-01-22-identifying-misspelled-words-dataset-hunspell.md @@ -0,0 +1,177 @@ +--- +id: 2250 +title: Identifying Misspelled Words in your Dataset with Hunspell +date: 2018-01-22T05:17:16+00:00 +author: rozek_admin +layout: post +guid: https://brandonrozek.com/?p=2250 +permalink: /2018/01/identifying-misspelled-words-dataset-hunspell/ +medium_post: + - 'O:11:"Medium_Post":11:{s:16:"author_image_url";s:75:"https://cdn-images-1.medium.com/fit/c/200/200/1*06lotWcLMUnKZTN6-Th3IQ.jpeg";s:10:"author_url";s:32:"https://medium.com/@brandonrozek";s:11:"byline_name";N;s:12:"byline_email";N;s:10:"cross_link";s:2:"no";s:2:"id";s:12:"c0ccd543b7e6";s:21:"follower_notification";s:3:"yes";s:7:"license";s:19:"all-rights-reserved";s:14:"publication_id";s:2:"-1";s:6:"status";s:6:"public";s:3:"url";s:104:"https://medium.com/@brandonrozek/identifying-misspelled-words-in-your-dataset-with-hunspell-c0ccd543b7e6";}' +mf2_mp-syndicate-to: + - 'a:1:{i:0;s:22:"bridgy-publish_twitter";}' +tumblr_post_id: + - "169988632939" +mf2_syndication: + - 'a:1:{i:0;s:60:"https://twitter.com/B_RozekJournal/status/955308388384235521";}' +kind: + - article +--- +This article is based on one written by [Markus Konrad](https://datascience.blog.wzb.eu/author/markus_konrad/) at this link https://datascience.blog.wzb.eu/2016/07/13/autocorrecting-misspelled-words-in-python-using-hunspell/ + +I assume in this article that you have hunspell and it's integration with python installed. If not, please refer to the article mention above and follow the prerequisite steps. + +This article is inspired from the need to correct misspelled words in the [Dress Attributes Dataset](https://archive.ics.uci.edu/ml/datasets/Dresses_Attribute_Sales). I'll share with you my initial pitfall, and what I ended up doing instead. + +### Background Information + +Misspelled words are common when dealing with survey data or data where humans type in the responses manually. In the Dress Attributes Dataset this is apparent when looking at the sleeve lengths of the different dresses. + +
dresses_data['SleeveLength'].value_counts()
+
+ +| Word | Frequency | +| -------------- | --------- | +| sleevless | 223 | +| full | 97 | +| short | 96 | +| halfsleeve | 35 | +| threequarter | 17 | +| thressqatar | 10 | +| sleeveless | 5 | +| sleeevless | 3 | +| capsleeves | 3 | +| cap-sleeves | 2 | +| half | 1 | +| Petal | 1 | +| urndowncollor | 1 | +| turndowncollor | 1 | +| sleveless | 1 | +| butterfly | 1 | +| threequater | 1 |
+ +Ouch, so many misspelled words. This is when my brain is racking up all the ways I can automate this problem away. Hence my stumbling upon Markus' post. + +### Automagically Correcting Data + +First, I decided to completely ignore what Markus warns in his post and automatically correct all the words in that column. + +To begin the code, let's import and create an instance of the spellchecker: + +
from hunspell import HunSpell
+spellchecker = HunSpell('/usr/share/hunspell/en_US.dic', '/usr/share/hunspell/en_US.aff')
+
+ +I modified his `correct_words` function so that it only corrects one word and so I can `apply` it along the `SleeveLength` column. + +
def correct_word(checker, word, add_to_dict=[]):
+    "Takes in a hunspell object and a word and corrects the word if needed"   
+    # Add custom words to the dictionary
+    for w in add_to_dict:
+        checker.add(w)
+
+    corrected = ""
+    # Check to see if it's a string
+    if isinstance(word, str):
+        # Check the spelling
+        ok = checker.spell(word)
+        if not ok:
+            # Grab suggestions for misspelled word
+            suggestions = checker.suggest(word)
+            if suggestions:
+                # Grab the best suggestion
+                best = suggestions[0]
+                corrected = best
+            else:
+                # There are no suggestions for misspelled word, return the original
+                corrected = word 
+        else:
+            # Word is spelled correctly
+            corrected = word
+    else:
+        ## Not a string. Return original
+        corrected = word
+    return corrected
+
+ +Now let's apply the function over the `SleeveLength` column of the dataset: + +
dresses_data['SleeveLength'] = dresses_data['SleeveLength'].apply(
+    lambda x: correct_word(spellchecker, x))
+
+ +Doing so creates the following series:
+ +| Word | Frequency | +| -------------- | --------- | +| sleeveless | 232 | +| full | 97 | +| short | 96 | +| half sleeve | 35 | +| three quarter | 17 | +| throatiness | 10 | +| cap sleeves | 3 | +| cap-sleeves | 2 | +| Petal | 1 | +| butterfly | 1 | +| turndowncollor | 1 | +| half | 1 | +| landownership | 1 | +| forequarter | 1 |
+ +As you might be able to tell, this process didn't go as intended. `landownership` isn't even a length of a sleeve! + +### Reporting Misspelled Items and Allowing User Intervention + +This is when I have to remember, technology isn't perfect. Instead we should rely on ourselves to identify what the word should be correctly spelled as. + +Keeping that in mind, I modified the function again to take in a list of the data, and return a dictionary that has the misspelled words as the keys and suggestions as the values represented as a list. + +
def list_word_suggestions(checker, words, echo = True, add_to_dict=[]):
+    "Takes in a list of words and returns a dictionary with mispellt words as keys and suggestions as a list. Also prints it out"
+    # add custom words to the dictionary
+    for w in add_to_dict:
+        checker.add(w)
+    
+    suggestions = {}
+    for word in words:
+        if isinstance(word, str):
+            ok = checker.spell(word)
+            if not ok and word not in suggestions:
+                suggestions[word] = checker.suggest(word)
+                if not suggestions[word] and echo:
+                    print(word + ": No suggestions")
+                elif echo:
+                    print(word + ": " + "[", ", ".join(repr(i) for i in suggestions[word]), "]")
+    return suggestions
+
+ +With that, I can use the function on my data. To do so, I convert the pandas values to a list and pass it to the function: + +
s = list_word_suggestions(spellchecker, dresses_data['SleeveLength'].values.tolist())
+
+ +These are the suggestions it produces: + +
sleevless: [ 'sleeveless', 'sleepless', 'sleeves', 'sleekness', 'sleeve', 'lossless' ]
+threequarter: [ 'three quarter', 'three-quarter', 'forequarter' ]
+halfsleeve: ['half sleeve', 'half-sleeve', 'sleeveless' ]
+turndowncollor: No suggestions
+threequater: [ 'forequarter' ]
+capsleeves: [ 'cap sleeves', 'cap-sleeves', 'capsules' ]
+sleeevless: [ 'sleeveless', 'sleepless', 'sleeves', 'sleekness', 'sleeve' ]
+urndowncollor: [ 'landownership' ]
+thressqatar: [ 'throatiness' ]
+sleveless: [ 'sleeveless', 'levelness', 'valveless', 'loveless', 'sleepless' ]
+
+ +From here, you can analyze the output and do the replacements yourself: + +
dresses_data['SleeveLength'].replace('sleevless', 'sleeveless', inplace = True)
+
+ +### What's the Benefit? + +This is where you ask "What's the difference if it doesn't automatically fix my data?" + +When you have large datasets, it can be hard to individually identify which items are misspelled. Using this method will allow you to have a list of all the items that are misspelled which can let you deal with it in a systematic way. \ No newline at end of file diff --git a/content/blog/DebuggingAndPerformance.md b/content/blog/DebuggingAndPerformance.md new file mode 100644 index 0000000..b98ee88 --- /dev/null +++ b/content/blog/DebuggingAndPerformance.md @@ -0,0 +1,86 @@ +--- +title: "Debugging and Performance" +date: 2019-06-15T10:59:30-04:00 +draft: false +--- + +I've come to like the GNU Debugger (GDB) and the `perf` tool recently. This post will be a short summary of the various interesting commands you can use. + +## GNU Debugger + +To attach gbd to an existing process do the following + +```bash +gdb -p pid_of_process +``` + +Otherwise you can start a new application + +```bash +gdb name_of_executable +``` + +Once it loads it will bring you into it's own `REPL` environment. Usually once this comes up I find it useful to add breakpoints to the program. You can either do it by function name or by line number. + +```bash +(gdb) break FunctionName +``` + +```bash +(gdb) break code.cpp:81 +``` + +If you just started a new application you can begin running the program with whatever arguments you wish + +```bash +(gdb) run -arg1 -arg2 +``` + +If you have attached to a process then you can continue its execution. + +```bash +(gdb) continue +``` + +### Breakpoints + +If you have set a breakpoint, it will stop the processes' execution when it lands on the breakpoint. From here, we can take a look at what's on the stack, print variables, and do whatever other debugging we wish. + +**Print variables on stack:** + +```bash +(gdb) info locals +``` + +**Print a specific variable:** + +```bash +(gdb) print variable_name +``` + +**Show backtrace:** + +```bash +(gdb) bt +``` + +**Continue on with program execution:** + +```bash +(gdb) continue +``` + +## Perf + +I haven't played with `perf` as much but one thing I found that was cool was the `perf top` command. This command gives you samples of which function calls keeps the program the most busy. + +To attach to a process and show samples: + +```bash +perf top -p pid -K +``` + + + + + diff --git a/content/blog/_index.md b/content/blog/_index.md new file mode 100644 index 0000000..9bff67d --- /dev/null +++ b/content/blog/_index.md @@ -0,0 +1,3 @@ +--- +title: Blog +--- diff --git a/content/blog/abstractdef.md b/content/blog/abstractdef.md new file mode 100644 index 0000000..84a5172 --- /dev/null +++ b/content/blog/abstractdef.md @@ -0,0 +1,77 @@ +--- +title: "Useful Abstract Definitions" +date: 2019-10-27T23:49:57-04:00 +draft: false +--- + +## Chapter 17 + +By a **ring** we mean a set $A$ with operations called addition and multiplication which satisfy the following axioms: + +- $A$ with addition alone is an abelian group +- Multiplication is associative +- Multiplication is distributive over addition + +Since $\langle A, + \rangle$ is an abelian group, there is in $A$ a neutral element for addition. This is called the **zero** element. Also, every element has an additive inverse called its **negative**. + +If multiplication in a ring $A$ is commutative then we say that $A$ is a **commutative ring**. + +If a ring $A$ has a neutral element for multiplication then we say that the neutral element is the **unity** of $A$. + +If $A$ is a ring with unity, there may be elements in $A$ which have a multiplicative inverse. Such elements are said to be **invertible**. + +If $A$ is a commutative ring with unity in which every nonzero element is invertible, then $A$ is called a **field**. + +In any ring, a nonzero element $a$ is called a **divisor of zero** if there is a nonzero element $b$ in a ring such that the product $ab$ or $ba$ is equal to zero. + +An **integral domain** is defined to be a commutative ring with unity that has the cancellation property. Another way of saying this is that an integral domain is a commutative ring with unity and has no zero divisors. + +## Chapter 18 + +Let $A$ be a ring, and $B$ be a nonempty subset of $A$. $B$ is called a **subring** if it satisfies the following properties: + +- Closed with respect to addition +- Closed with respect to negatives +- Closed with respect to multiplication + +Let $B$ be a subring of $A$. We call $B$ an **ideal** of $A$ if $xb, bx \in B$ for all $b \in B$ and $x \in A$. + +The **principle ideal generated by $a$**, denoted $\langle a \rangle$ is the subring defined by fixing an element $a$ in a subring $B$ of $A$ and multiplying all elements of $A$ by $a$. +$$ +\langle a \rangle = \{ xa : x \in A \} +$$ +A **homomorphism** from a ring $A$ to a ring $B$ is a function $f : A \to B$ satisfying the identities: +$$ +f(x_1 + x_2 ) = f(x_1) + f(x_2) \\ +f(x_1x_2) = f(x_1)f(x_2) +$$ +If there is a homomorphism from $A$ onto $B$, we call $B$ a **homomorphic image** of $A$. + +If $f$ is a homomorphism from a ring $A$ to a ring $B$, the **kernel** of $f$ is the set of all the elements of $A$ which are carried by $f$ onto the zero element of $B$. In symbols, the kernel of $f$ is the set +$$ +K = \{x \in A: f(x) = 0\} +$$ +If $A$ and $b$ are rings, an **isomorphism** from $A$ to $B$ is a homomorphism which is a one-to-one correspondence from $A$ to $B$. In other words, it is injective and surjective homomorphism. + +If there is an isomorphism from $A$ to $B$ we say that $A$ is **isomorphic** to $B$, and this fact is expressed by writing $A \cong B$. + +## Chapter 19 + +Let $A$ be a ring, and $J$ an ideal of $A$. For any element $a \in A$, the symbol $J + a$ denotes the set of all sums $j + a$ as $a$ remains fixed and $j$ ranges over $J$. That is, +$$ +J + a = \{j + a : j \in J\} +$$ +$J + a$ is called a **coset** of $J$ in $A$. + +Now think of the set which contains all cosets of $J$ in $A$. This set is conventionally denoted by $A / J$ and reads $A$ mod $J$. Then, $A / J$ with coset addition and multiplication is a ring. + +An ideal $J$ of a commutative ring is said to be a **prime ideal** if for any two elements $a$ and $b$ in the ring, +$$ +ab \in J \implies a \in J \text{ or } b \in J +$$ +Theorem: If $J$ is a prime ideal of a community ring with unity $A$, then the quotient ring $A / J$ is an integral domain. + +An ideal $J$ of $A$ with $J \ne A$ is called a **maximal ideal** if there exists no proper ideal $K$ of $A$ such that $J \subseteq K$ with $J \ne K$. + +Theorem: If $A$ is a commutative ring with unity, then $J$ is a maximal ideal of $A$ iff $A/J$ is a field. + diff --git a/content/blog/adding-fonts.md b/content/blog/adding-fonts.md new file mode 100644 index 0000000..88fd008 --- /dev/null +++ b/content/blog/adding-fonts.md @@ -0,0 +1,13 @@ +--- +title: "Adding Fonts" +date: 2019-05-27T12:15:25-04:00 +draft: false +--- + +**Warning: This blog post partially applies to Ubuntu-based operating systems** + +I wanted to add a font to an image on GIMP. Now I wanted to make it so that the font is available system-wide in case I ever needed it again. + +Following this [blog post from It's FOSS](https://itsfoss.com/install-fonts-ubuntu/) I decided to make a `.fonts` folder in my home directory. After that you can download various font's from [Font Squirrel](https://www.fontsquirrel.com/), [dafont](https://www.dafont.com), [Google Fonts](https://fonts.google.com/), and others and drop the `.otf` or `.ttf` files into the `.fonts` folder. + +Then to finally achieve my goal, I made sure I added `/home/user/.fonts` folder to my fonts as outlined on the [GIMP documentation](https://docs.gimp.org/2.10/en/gimp-using-fonts.html) \ No newline at end of file diff --git a/content/blog/albuquerque.md b/content/blog/albuquerque.md new file mode 100644 index 0000000..57ca1c2 --- /dev/null +++ b/content/blog/albuquerque.md @@ -0,0 +1,105 @@ +--- +id: 2234 +title: Albuquerque Real Estate Multiple Regression model +date: 2017-07-12T01:07:39+00:00 +author: Brandon Rozek +layout: revision +guid: https://brandonrozek.com/2017/07/2227-revision-v1/ +permalink: /2017/07/2227-revision-v1/ +--- +### Introduction + +Albuquerque, New Mexico is a city of thriving culture. The population has grown drastically within the past several years and is a hotspot for New Mexico. Albuquerque’s one-of-a-kind southwestern culture is all around the city, from the quaint shops, Pueblo and Spanish inspired architecture and world famous cuisine, to the music and art of the city. Being the largest city in the state, it has a wide variety of homes across the entire city whether it be within the actual city of Albuquerque ore in the outskirts. Many people flock to the city for the weather. It is a mildly dry climate with roughly 310 days of solid sunshine each year, making it a literal hotspot for people who enjoy the outdoors and warm weather. The city has little to no natural disasters that threaten everyday life, make it a safe place to settle. In the city of Albuquerque, there is a wide variety of living communities throughout the area. As mentioned above, there are different diverse communities. The housing availability is vast as well. The housing market in this region is vast. Because there is little to no potential for natural disasters it causes the market to grow due to less of a liability for increased damage from weather. Albuquerque, has one of the lowest costs of living than anywhere else in the country which makes it a great place to invest in the housing market. The goal of this project is to figure out details of real estate, specifically in the city of Albuquerque, New Mexico. In the dataset given, the predictors available are square footage, age of home, number of features, amount in taxes, and several binary variables. Those binary variables being whether or not the home was of a custom design, is located in a corner location, or if it is located in the northeast quadrant of the city. + +### Descriptive Statistics + +Our dataset features a representative sample of 117 homes in Albuquerque, New Mexico. From this dataset, we can describe the key patterns that arise and build an intuition for what is to come in our inferential statistics section. It is important to build this intuition since it helps when generalizing to a population. + +#### Distribution of Data + +To understand the boxplot of interactions shown by Figure 1, we first need to establish what each of the indices or numbers under the x-axis represent. The first index discloses whether or not the home is located in the northeast quadrant of Albuquerque, New Mexico. The second 1index tells us whether or not the home had a custom design. And finally, the third index indicates whether or not the home is located in the corner of an intersection. From the boxplot of interactions, we can see that homes with a custom design tend to have a higher price than homes that don’t. There are no other patterns from this figure that we can readily pick up in terms of how the different combination of factors affect a home’s price. Figure 2 consists of multiple boxplots each comparing the price distribution of the different levels in all the categorical variables. From this we can reconfirm that having a custom design leads to a higher price distribution. We also see that the Northeast quadrant has a larger variation in price. There does not seem to be any significant difference in the price of homes depending on if it’s located on a corner. Finally, the more features a home has, the larger the variation in prices become. Figure 3 shows a scatterplot matrix of our data. From the matrix we can see the possibility of a linear correlation between price and square footage, as well as, price and tax. There is no evidence, however, of linear correlation between price and the age of the home. This suggests that perhaps age will not become a significant factor in our model. Figure 4 contains histograms of the different quantitative variables. As shown in the figure, the histograms are all right skewed. This shows that the majority of homes are in the lower price range while there are a few homes in the upper price region that might skew our model. Figure 5 shows the distribution of the data in terms of the categorical variables. It is interesting to note that the number of features falls in a gaussian like curve which is unimodal and symmetric at about 4 features. There are more homes that do not have a custom design and do not lie on a corner than ones that do. In this dataset, there are also more homes in the northeast quadrant than homes that are not. Figure 6 shows the distribution of taxes to be right skewed as well. + +#### Effect/Interaction Plots + +In the following section we will consider the effect of different categorical variables on the price of homes in Albuquerque and the other variables. The effect plots are used primarily to build an intuition on an individual variable’s effect on the price of a home. Interaction plots, however, analyze the influence of a variable on another’s effect on the price of a home. If the lines in an interaction plot intersect, it tells us that a categorical variable has a significant influence on another’s effect on the price of a home. The main effect plots in Figure 7 shows us the mean price of a home in relation to the different levels for each of the factors in the dataset. Similar to what was discovered in the boxplot figures, having a custom design increases the price of a home drastically compared to the increase of the price of a home by other factors. Having a home in a non-corner location slightly decreases the value of a home on average. Finally, it is shown in the Feature Effect plot that increases in the number of features increases the price of a home. An interesting thing to note is how in the case of 8 features, the average price of a home decreases. Figures 8, 9, and 10 show the interaction plots of different categorical variable combinations. In Figures 8 and 9, the lines do not intersect, therefore we can conclude that being in the northeast bears no influence on how custom design influences the price of the home and being in the northeast also bears no influence on how the corner location affect on the price. Figure 10, however, shows an interaction between corner location and custom design. This suggests that corner location has an influence on how custom design effects the price. + +#### Missing Data + +In the dataset provided, 44% of the homes are missing some data. Missing data, like outliers, are not to be ignored. To deal with missing data, one needs to know the implications of missing data on the analysis. From there, we can think of several techniques to deal with the absence of the data. One of the most important implications to check is to see if the data is missing at random. If the data is not missing at random, then it taints the representability of the sample, making it harder to generalize to a population. In the dataset provided there are two variables that contain missing data. Figure 11 shows how 42% of the data is missing the age variable and 9% of the data is missing the Tax variable. Looking at the right side of Figure 11, we can see the pattern of missing data in our set. 35% of the data in our set is only missing the age variable, 7% of our data is missing the age and tax variable, and only 2% of our data is missing the tax variable alone. Figure 12 shows us the missing data with respect to quantitative variables such as price, square footage, and tax. As seen in the figure, the missing data is spread equally throughout the distribution. Figure 13 shows us the missing data with respect to the categorical variables in our dataset. As seen in the figure, the proportion of missing data in the binary variables are about the same for each level. When looking at the number of features, however, there is a higher proportion of data missing in the homes with fewer features than in the homes with more features. Looking at the scatterplot matrix of missing values in Figure 14, we can see that the missing values in red are spread out evenly through the observed values in blue. Missing data with respect to age was not considered since the majority of the missing data comes from the age variable. + +### Inferential Statistics + +Now that we’ve described the sample, we can now look forward to generalizing our suspicions to the population. In this section, we define the hypotheses of interest in our model and then consider different techniques that lead up to the final model and analysis. +Hypotheses The main hypothesis of interest is if the model is significant. +➢ H​ 0​ : There is no linear association between the price of homes in Albuquerque, New Mexico and any of the following: square footage, age of the home, tax, number of features, corner location, northeast location, or custom design. +➢ H​ A​ : There is a linear association between the price of homes in Albuquerque, New Mexico and at least one of the following predictors: square footage, age of the home, tax, number of features, corner location, northeast location, or custom design. Afterwards, we consider if square footage, age, tax, number of features, corner location, northeast location, or custom design are significant predictors in the model individually. + +#### Ignore Missing Data Technique + +One of the first regression models we considered is if we ignore all of the missing data. Since 44% of our data have missing values, this drops our degrees of freedom significantly to 61. This technique also doesn’t utilize all of the data, which is prefered so that it doesn’t affect the coefficients of our model. Running the stepwise algorithm to maximize the AIC, we obtain the following model +PRICE = 97.92321 + 0.33638(SQFT) + 0.52308(TAX) + 177.18519(CUST1) − 77.82234(COR1) +Where the p-value of the model is less than 2.2e-16. At a 5% significance level, there is a linear association between the price of the home and at least one of the following predictors: square footage, tax, custom design, or corner location. Looking at the individual t-tests for predictor significance, square footage, tax, and custom design all have a p-value around or less than 0.01 which rejects the null hypotheses of those predictors. This tells us that square footage, tax, and custom design are all significant predictors in our model. However, corner location only have a p-value of 0.09, which at a 5% significant level, fails to reject the null hypothesis. Corner location is not a significant predictor in our model. The residual standard error in this model is $155,400 which is about 15% of the mean price value of a home. The adjusted R​ 2 value is 0.8523, which means that about 85% of the variation in the prices are accounted for in the variation of the model. Not all of the conditions are met for this model and since we ignore a good chunk of the data, this model is not fully appropriate for our usage. In our next attempt, we will increase the number of observations that we include in our analysis. + +#### Remove Age Column Technique + +##### Justification of Removal of Age Variable + +Most of the data missing is in the age variable. Age is also not a significant predictor in the model made in the previous section, therefore, our next idea was to remove the age variable from the dataset. It is important, however, to establish that the age data is truly missing at random and removing it won’t significantly affect the analysis. We do this by removing the only other variable that has missing data (tax) from the dataset. Looking at Figures 17 and 18, it did not change significantly the distribution of missing data with respect to the different variables. This lets us comfortably remove the age column from our dataset. From here, we then repeat the Ignore Missing Data technique. This time since only 9% of the data is missing, our degrees of freedom in this analysis increases from 61 to 102. Having a greater degrees of freedom allows us to have more statistical power in our analysis. + +##### Variable Selection and Test Results + +Running through the stepwise algorithm to maximize AIC, we get the following model +PRICE = 175.16603 + 0.67707(TAX) + 156.81481(CUST1) + 0.20760(SQFT) − 83.40126(COR1) +The p-value of this model is less than 2.2e-16, which at a 5% significance level, leads us to reject the null hypothesis and state that price has a linear association between at least one of the predictors in the model. Looking at the t-tests for predictor significance, all of the p-values are less than 0.05, which leads us to reject all the null hypotheses, and state that all of the predictors in this model: tax, custom design, square footage, and corner location are significant. The residual standard error in this model is $162,300 which is slightly higher from the $155,400 in the previous model. Though the proportion that this residual standard error is of the mean of the price set is the same at 15%. The adjusted R​ 2 value is 0.8213, which means that 82% of the variation in the prices are accounted for by the variation in the model. This dropped from the previous 85% value from the +previous model. The residual standard error and adjusted R​ 2 values indicate that this model is worse in terms of its predictive ability. This model, however, takes more of the data into account, which makes it more accurate when considering the data as a whole and not the subsetted data that arrives from removing the null entries. In this model, we still lose about 9% of our data. In our next model, we will consider a technique that allows us to use the entire dataset. + +#### Multiple Imputation + +To take the entire dataset into account we need to decide how to handle the missing values. Multiple imputation is a technique that randomly samples from the existing distribution to take place of the missing data multiple times. The benefits of multiple imputation is that it preserves the mean and variance of the data. For multiple imputation to work, the data must be missing at +random. In the missing data section, we described how the missing data is spread equally with respect to the different variables. This allows us to say that the Missing at Random condition is met. + +##### Variable Selection and Test Results + +Running the stepwise algorithm to maximize the AIC value, we get the following model +PRICE = 138.09421 + 0.65373(TAX) + 0.23709(SQFT) + 124.31776(CUST2) − 6 7.17475(COR2) +From the F-Test, we can reject the null hypothesis at a 5% significance level due to the fact that the p-value is less than 2.2e-16. This means that there is a linear association between price and one of the predictors: tax, square footage, custom design, and corner office. All of the T-Tests for predictor significance aside from COR2 have a p-value of less than 0.05. Meaning, we reject the appropriate null hypotheses and state that tax, square footage, and custom design are significant predictors. The residual standard error is $167,700 with 112 degrees of freedom. This value corresponds to 16% of the mean price of a home. The adjusted R​ 2 value is 0.8056, which means that about 81% of the variation in the prices is accounted for by this model. The residual standard error and adjusted R​ 2 values are again worse than the previous model. However, since this model uses the entire dataset, we can say that this is a more representative sample of the data than the previous models. To lower the amount of error in this model, we considered removing the outliers. In this model there are six outliers as shown in Figure 19. Since they are significantly far from the middle 50% of the price distribution, we removed them in the following section to better make a model that describes the main portion of the data. + +#### Multiple Imputation without Outliers + +Removing the outliers from the model and running the stepwise algorithm to maximize AIC, we obtain +PRICE = 76.47917 + 0.64130(TAX) + 0.27290(SQFT) + 77.58816(CUST2) +6For the F-Statistic, the p-value is less than 2.2e-16. At a 5% significance level, we reject the null hypothesis and state that there is a linear association between price and at least one of the following: tax, square footage, or custom design. The p-values of the T-Tests for predictor significance tells us that at a 5% significant level. all of the predictors are significant since all of the p-values are less than 0.05. The residual standard error of this model is $112,700 which is 11% of the mean of the dataset. +The adjusted R​ 2 value is 0.8901, which means that 89% of the variation in the prices is accounted for by the variation of the model. In this model, the residual standard error is lower and the adjusted R​ 2 value is higher than the previous models. This tells us that it is a better fit for the data without the outliers. Looking at the outlier effect on the coefficients, we can see that without the outliers the term relating to the corner location goes away from the model. That then significantly changes the +coefficients of CUST2 and the y-intercept. + +##### Checking the Conditions for Inference + +Before we conclude with the analysis, we must first check the conditions for inference to see if the technique is appropriate for our data. +Independence Assumption: +A house’s selling price can depend on another’s so this condition is not met. +Randomization Condition: +The dataset is comprised of a random sample of records of resale of homes which satisfies the +randomization condition. +Straight Enough Condition: +The scatterplot matrix in Figure 20 shows that for the predictors square footage and tax that the +scatterplot is straight enough and doesn’t have any bends or curves. +Equal Variance Assumption: +The residual analysis in Figure 21 shows that the outliers are not spread equally on the +scatterplot. Therefore, the equal variance assumption is not met. +Nearly Normal Condition: +The QQ-Plot in Figure 21 shows that the residuals follow a unimodal and symmetric distribution. +Taking out the outliers in the model also did not introduce any new outliers in the boxplot. +Missing At Random Condition: +7The discussion in the descriptive statistics section about the missing data tells us that the data +is missing evenly with respect to the different variables. Therefore, it is safe to assume that the +data is missing at random +Multicollinearity Condition: +All of the VIF values are lower than 10, therefore this condition is met. + +The conditions for inference are not fully met due to the equal variance assumption. This means that our model will be more inaccurate for some price range of homes than others. Looking at our residual analysis, it appears that the inaccuracies happen when the price of the home is higher. There weren’t many outliers in the dataset (6 out of 117 or 5%) so removing these outliers makes the model more representative to the majority of the houses in the market. Since this model is intended to be used when analyzing prices of homes in the area, it is better not to include the outliers that most people don’t intend to buy. Since the error term is unimodal and symmetric, we can be at ease that there isn’t any other confounding factor in our model. Overall, this is a good model to use for inference and prediction as long as one doesn’t use it to describe the outliers. + +### Conclusion + +The multiple imputation model without outliers is the best model outlined in this paper for describing the price of housing in this region. The formula is re-expressed here +PRICE = 76.47917 + 0.64130(TAX) + 0.27290(SQFT) + 77.58816(CUST2) +This states that for every dollar of tax spent on the home, the home increases on average by $64 given the other parameters stay constant. The same concept applies to square footage and custom design. For every square foot added to the home, the value of it increases on average by $27. Having a home with a custom design increases the value of the home by $7700. This model is more reliable the lower the price of the home is. When it comes to high cost homes, the error produced by the model increases. From this model, we conclude that property tax, square footage, and whether or not a home is built from a custom design are the most significant factors in the price of a home in Albuquerque, New Mexico. \ No newline at end of file diff --git a/content/blog/archivingsites.md b/content/blog/archivingsites.md new file mode 100644 index 0000000..14e9a5e --- /dev/null +++ b/content/blog/archivingsites.md @@ -0,0 +1,17 @@ +--- +title: "Archiving Sites" +date: 2019-08-02T22:42:16-04:00 +draft: false +--- + +I have several old Wordpress sites that are now only alive for archival purposes. I've been trying to migrate off of Wordpress since I don't like having yet another system to manage. Luckily for archival type sites, I don't need the whole backend of Wordpress since I don't actually need any CRUD functionality. (Well I need the R part) + +Solution... wget comes to the [rescue](https://stackoverflow.com/questions/538865/how-do-you-archive-an-entire-website-for-offline-viewing#538878) + +Thanks to user [chuckg](https://stackoverflow.com/users/63193/chuckg), I now know you can run `wget -m -k -K -E https://url/of/web/site` to get a full offline copy of a website. + +[Joel Gillman](https://stackoverflow.com/users/916604/jgillman) expanded out the command to `wget --mirror --convert-links --backup-converted --adjust-extension https://url/of/web/site` + +There are other solutions in that stack overflow post, but something about the simplicity of `wget` appealed to me. + +[Check out this now Wordpress free site of mine!](https://sentenceworthy.com) \ No newline at end of file diff --git a/content/blog/aspell.md b/content/blog/aspell.md new file mode 100644 index 0000000..85bf963 --- /dev/null +++ b/content/blog/aspell.md @@ -0,0 +1,8 @@ +--- +title: "aspell" +date: 2019-12-10T22:20:48-05:00 +draft: false +images: [] +--- + +When I was working on my honors thesis, I realized that I needed a way to spell check the file. After a quick search, I stumbled upon `aspell` which is a `curses` based tool to provide an interactive way for dealing with misspellings. Try it out when you have the chance! \ No newline at end of file diff --git a/content/blog/bashflags.md b/content/blog/bashflags.md new file mode 100644 index 0000000..24b8351 --- /dev/null +++ b/content/blog/bashflags.md @@ -0,0 +1,32 @@ +--- +title: "Bash Flags" +date: 2019-08-06T16:55:47-04:00 +draft: false +--- + +I was creating a bash script and was looking around for a solution for parsing command line arguments. [This StackOverflow post](https://stackoverflow.com/questions/192249/how-do-i-parse-command-line-arguments-in-bash) has a variety of different solutions available. I want to describe my favorite of these posts. + +[Inanc Gumus](https://stackoverflow.com/users/115363/inanc-gumus) proposed the following: + +```bash +#!/bin/bash + +while [[ "$#" -gt 0 ]]; do case $1 in + -d|--deploy) deploy="$2"; shift;; + -u|--uglify) uglify=1;; + *) echo "Unknown parameter passed: $1"; exit 1;; +esac; shift; done + +echo "Should deploy? $deploy" +echo "Should uglify? $uglify" +``` + +Let me quickly describe what it does. While the number of arguments left to process is greater than zero.... + +- Check to see if the argument matches any of the flags + - If it does... + - If the flag requires an additional argument grab it. Then discard an argument. + - If it doesn't. Error out. + - Then get rid of an argument. + +At the end of the while loop, you would've evaluated all the arguments! \ No newline at end of file diff --git a/content/blog/bashprocesses.md b/content/blog/bashprocesses.md new file mode 100644 index 0000000..d39feb1 --- /dev/null +++ b/content/blog/bashprocesses.md @@ -0,0 +1,28 @@ +--- +title: "Handling Background Processes in Bash" +date: 2019-06-17T19:50:30-04:00 +draft: false +--- + +For multi-process applications, I want to be able to start it up using the `bash` command processor and be able to stop all the processes just by hitting `CTRL-C`. + +As a quick reminder, to have a task run in the background you need to add a `&` at the end of the line. + +```bash +execute_app & +``` + +Previously, I was grabbing the PID of this background process, trapping the interrupt signal and taking the time to send the interrupt signal to all of the background processes. + +You can get the child pid by referencing the variable `$!` after sending a process to the background. + +Now I just use `setsid` to set the process group of the background processes to be the same as the bash process itself. The following demo script here will show the capability. + +```bash +#!/bin/bash +setsid sleep 5 & +setsid sleep 10 & +wait +``` + +This script will send two processes to the background and will wait until all the processes are finished. Hitting `CTRL-C` during execution will send the interrupt signal to all of the processes achieving my goal. diff --git a/content/blog/blogworkflow.md b/content/blog/blogworkflow.md new file mode 100644 index 0000000..bae3b34 --- /dev/null +++ b/content/blog/blogworkflow.md @@ -0,0 +1,31 @@ +--- +title: "Blog Workflow" +date: 2019-10-28T00:16:44-04:00 +draft: false +--- + +You may be curious on how I create content for this blog. There's pros and cons to my approach. One pro is that it's relatively easy for me to crank something out and upload it to my site. The downside is that it's not as easily customizable. + + + +I use Hugo as my static site generator. It works with Markdown files. I begin every blog post by typing + +```bash +hugo new blog/title.md +``` + +This creates a file called `title.md` in `content/blog` with front-matter yaml information such as the title and the datetime that I created the post. + +I then use my favorite Markdown editor `typora` to open up the file in the background. + +```bash +typora content/blog/title.md & +``` + +Write some great words down, compile the website, then sync it to my site! + +```bash +hugo +rsync -Paz --delete public/ brandonrozek.com:/path/to/site/folder +``` + diff --git a/content/blog/borgbackup.md b/content/blog/borgbackup.md new file mode 100644 index 0000000..11eed8d --- /dev/null +++ b/content/blog/borgbackup.md @@ -0,0 +1,55 @@ +--- +title: "Borg Backup" +date: 2019-05-21T22:35:31-04:00 +draft: false +--- + +I started using [Borg Backup](https://www.borgbackup.org/) in order to efficiently and securely do my backups. I did some research before choosing this solution as I required three things: + +- Compression +- Encryption +- Deduplication + +Each point is important on their own. Ideally I would be able to put this onto a cloud solution. Due to this I would want compression and deduplication to keep my costs down and encryption in order to maintain privacy. + +Luckily Borg does all of these things and more! It's also easily available on the AUR and the Ubuntu repositories. + +## Getting Started + +This will be a short post just describing the basic usage of the tool. I haven't fully implemented this tool yet so forgive me if this doesn't match your exact use case. This is also a great way for me to document the basic commands for myself as well. + +First to initialize a borg repo encrypted with a password at `repolocation`: + +```bash +borg init --encryption=repokey repolocation +``` + +Then to create a backup in the repo with key `backup1`: + +```bash +borg create --stats --progress --compression lzma repolocation::backup1 folderToBackup +``` + +You can actually replace the compression algorithm if wanted, here is a short description from their [website](https://borgbackup.readthedocs.io/en/stable/): + +- lz4 (super fast, low compression) +- zstd (wide range from high speed and low compression to high compression and lower speed) +- zlib (medium speed and compression) +- lzma (low speed, high compression) + +To list what backups you have in the repo: + +```bash +borg list repolocation +``` + +To mount and unmount the repository + +```bash +borg mount repolocation mountlocation +``` + +```bash +borg umount mountlocation +``` + diff --git a/content/blog/chirp.md b/content/blog/chirp.md new file mode 100644 index 0000000..ce15ae5 --- /dev/null +++ b/content/blog/chirp.md @@ -0,0 +1,28 @@ +--- +title: "Chirp" +date: 2019-09-27T22:46:52-04:00 +draft: false +--- + +In the land of Ham Radio, you can program your radio with a very popular open source software called `chirp`. For Ubuntu users to install it, it is recommended you use the PPA to keep up to date with radio software... + +```bash +sudo apt-add-repository ppa:dansmith/chirp-snapshots +sudo apt update && sudo apt install chirp-daily +``` + +Once you're in, it is recommended that you download the configuration currently set on your radio and store it somewhere safe. You never know when you'll want the Stock configuration again... + +The way the Software works is that you can store a certain amount of channels into your radio. For the Baofeng F8-HP, 128 channels can be stored. The software gives you a table to manage them. The software is nice since you can cut and paste entries around. + +When you're importing frequencies from various sources, pay attention to what entry numbers you're importing to. Otherwise you might overwrite another import you've made. I recommend adding the following types of frequencies to your radio... + +- Repeaters: Can be added by using RepeaterBook + - I used proximity search. It takes a zip code and the radius in miles of what you want to import. +- Local frequencies: You need a prenium account from Radio Reference in order to obtain these. + - Though honestly, a premium account is $15 for half a year. Not bad if you just go in once and download a bunch of frequencies for your area. Depending on where you live, your area might not have frequencies update all the time... + - Imagine being stuck in traffic and getting to know what's happening around you.... +- National Calling Frequencies +- MURS/FRS/GMRS frequencies +- Marine/Railroad frequencies (if you have space) + diff --git a/content/blog/collabpandocbeamer.md b/content/blog/collabpandocbeamer.md new file mode 100644 index 0000000..71f0067 --- /dev/null +++ b/content/blog/collabpandocbeamer.md @@ -0,0 +1,15 @@ +--- +title: "Collaborating on Beamer Pandoc Slides" +date: 2019-11-22T14:49:19-05:00 +draft: false +--- + +Recently I've been making slides using Pandoc with Beamer. However, I came across the issue where I needed to collaborate with someone using already existing slides written in Markdown. + +Sadly, I don't think this person (and most people for that matter) wants to edit slides in Markdown and use Pandoc. So I needed to convert this into another source material. My original plan was to convert this into a Powerpoint and put it into Google Slides. When I went to convert it using Pandoc, it stripped my math typing and theme. Unfortunately, that wasn't going to work for me. + +The solution I ultimately ended using was the following. +1. Convert the Markdown into Latex +2. Upload the latex document into Overleaf +3. Use the share feature in Overleaf + diff --git a/content/blog/colormanipulation.md b/content/blog/colormanipulation.md new file mode 100644 index 0000000..731c1c2 --- /dev/null +++ b/content/blog/colormanipulation.md @@ -0,0 +1,47 @@ +--- +title: "Color Manipulation with Sass" +date: 2019-05-21T23:10:06-04:00 +draft: false +--- + +There are many times that I need to slightly mess with a color. The easiest way I found to do it is to use one of the many color functions in the program `Sass`. [Sass](https://sass-lang.com/) is a CSS preprocessor, meaning that it has it's own syntax and it compiles down to CSS. I remember using this before CSS variables became a thing and that was one of the main driving points of Sass. + +Since I don't work in Web Development anymore, I don't actually have Sass installed on my computer but instead go to [SassMeister.com](https://www.sassmeister.com/) to do my color manipulations. ThoughtBot already wrote a really nice [post](https://thoughtbot.com/blog/controlling-color-with-sass-color-functions) describing all the different color functions, but I'll quickly describe what I do to mess with colors. + +## Quick Color Manipulation + +Now you do need to write special scss syntax in order for this to work, but luckily most of it you can just copy paste and change what you want. For example, to get Sass to make red 10% lighter you would do the following: + +```scss +p { + color: lighten(red, 10%); +} +``` + +Sass will then output the following: + +```css +p { + color: #ff3333; +} +``` + +And BAM just like that you got the hex code for a lighter version of red. You can also get all crazy and nest statements into each other which is usually what I do when I play with these colors. + +If you rather have the RGBA version of this you can do the following: + +```scss +p { + color: rgba(lighten(red, 10%), 0.5); +} +``` + +And it will output: + +```css +p { + color: rgba(255, 51, 51, 0.5); +} +``` + +So in summary, all you need is to replace the section after `color:` and you're all set for manipulating colors! Check out the [ThoughtBot Post above](https://thoughtbot.com/blog/controlling-color-with-sass-color-functions) in order to see all the variety of functions included with Sass such as saturating, hue-shifting, and much more. \ No newline at end of file diff --git a/content/blog/composesystemd.md b/content/blog/composesystemd.md new file mode 100644 index 0000000..4247e5f --- /dev/null +++ b/content/blog/composesystemd.md @@ -0,0 +1,46 @@ +--- +title: "Ensuring Docker Compose Startup with Systemd" +date: 2019-12-16T20:57:36-05:00 +draft: false +images: [] +--- + +I've been having trouble getting some docker containers such as `nginx` to start automatically on bootup, even with the `restart: always` flag. + +To compensate, I wrote a small systemd script and enabled it on startup. + +`/etc/systemd/system/docker-compose.service` + +```ini +[Unit] +Description=Docker Compose Application Service +Requires=docker.service +After=docker.service + +[Service] +Type=oneshot +User=brandonrozek +Group=brandonrozek +RemainAfterExit=yes +WorkingDirectory=/home/brandonrozek/docker/ +ExecStart=/usr/bin/docker-compose up -d +ExecStop=/usr/bin/docker-compose down +TimeoutStartSec=0 + +[Install] +WantedBy=multi-user.target + +``` + +To enable on startup + +```bash +sudo systemctl enable docker-compose +``` + +To start now + +```bash +sudo systemctl start docker-compose +``` + diff --git a/content/blog/copytoram.md b/content/blog/copytoram.md new file mode 100644 index 0000000..3af8f93 --- /dev/null +++ b/content/blog/copytoram.md @@ -0,0 +1,13 @@ +--- +title: "Copy to RAM Please" +date: 2019-08-02T22:37:12-04:00 +draft: false +--- + +I bought a 1U server recently, and I forgot to purchase a SSD to actually hold data. Since I couldn't hold my excitement to play with the server, I decided to load an operating system entirely into RAM and never turn it off for the meantime. + +I browsed [List of Linux Distributoins that run from RAM](https://en.wikipedia.org/wiki/List_of_Linux_distributions_that_run_from_RAM) and found [Slax](https://www.slax.org/) a [debian](https://www.debian.org/) derivative. + +It's not what I would use for my daily driver but in terms of doing this task its perfect. It loads up quickly and lets me perform nice basic user functions. It's also based on debian so I have a whole repository of packages available I can install. + +Now by default, if you're on a USB it'll try to run in a persistent mode, just press ESC in the boot splash to have the option to copy to ram. \ No newline at end of file diff --git a/content/blog/coqgroups.md b/content/blog/coqgroups.md new file mode 100644 index 0000000..8ba48dc --- /dev/null +++ b/content/blog/coqgroups.md @@ -0,0 +1,6 @@ +--- +title: "Group Theory in Coq" +date: 2019-05-21T22:17:00-04:00 +draft: true +--- + diff --git a/content/blog/coredns.md b/content/blog/coredns.md new file mode 100644 index 0000000..9ef792c --- /dev/null +++ b/content/blog/coredns.md @@ -0,0 +1,90 @@ +--- +title: "coredns" +date: 2019-12-13T02:00:29-05:00 +draft: false +images: [] +--- + +Domain names are the easiest way for a reverse proxy to split up services in a homelab. Since I'm going full docker-compose in my homelab, I decided to use `coredns`. + +The server I'm hosting my services on runs Ubuntu 18.04 at the time of writing. This verison of Ubuntu comes packaged with their own DNS resolver `systemd-resolved` which runs on port 53. Therefore in order to stop this, we need to edit `/etc/systemd/resolved.conf`: + +```ini +DNS=127.0.0.1 +FallbackDNS= +Domains=~. +DNSStubListener=no +``` +You might be wondering about the `~.` option in Domains. From the [Arch Wiki](https://wiki.archlinux.org/index.php/Systemd-resolved), "Without the `Domains=~.` option, systemd-resolved might use the per-link DNS servers." + +You also need to remove the already existing `/etc/resolv.conf` file. +```bash +sudo rm /etc/resolv.conf +``` + +Now to setup `coredns` I used the following docker-compose snippet: +```yaml +coredns: + image: coredns/coredns + command: -conf coredns-config/Corefile + ports: + - 53:53/udp + volumes: + - /Volumes/coredns/coredns-config:/coredns-config/ +``` +Noticed that I mounted the configuration directory in a volume. `coredns` is managed by a configuration file. This would be located under `/Volumes/coredns/coredns-config/Corefile` in the host system. + +Let's say we own the domain example.com and want subdomains of that to point to different to our server. To do that, we need to define a zonefile for that domain name. We will save that under `/Volumes/coredns/coredns-config/homelab.db` in our host system. Every other domain we will either pass to a public DNS server like Google's `8.8.8.8` or you can even use a PiHole. + +Example Corefile: +``` +example.com:53 { + file /coredns-config/homelab.db + log + errors +} + +.:53 { + log + errors + forward . 8.8.8.8 + cache +} +``` +I do recommend that whatever domain you do use for your homelab is one you own. Otherwise you might name conflict with a public service that you would want to access in the future. + +The `cache` directive will cache results from the other DNS provider for quicker delivery at a later point. + +The zonefile `homelab.db` could look like the following: +``` +$TTL 3600 +$ORIGIN example.com. +@ IN SOA ns.example.com. contact.example.com. ( + 2019121301 ; serial + 1d ; refresh + 2h ; retry + 4w ; expire + 1h ; nxdomain ttl + ) + IN NS ns.example.com. +@ IN A 192.168.1.10 +* IN A 192.168.1.10 +@ IN A 10.10.100.10 +* IN A 10.10.100.10 +``` + +In the zone file, `@` means whatever the value of `$ORIGIN` is and `*` is a wildcard meaning any subdomain. You can assign a local LAN address first and then a VPN ip address if you have one set up to access services remotely. + +The serial number needs only to be unique across SOA entries, and is conventionally the date and hour in which the entry was modified. + +I have this setup since all my services are on one physical machine. If you want to split it up through many different machines, specify it by adding the subdomains in place of the `*` or `@`. + +After the `Corefile` and `homelab.db` are made, the DNS server is all ready to be up and running. Just execute `docker-compose up -d coredns` and the DNS server will start happily responding to requests. + +A good way to verify it works is to request an `A` record from your site and an external site. + +```bash +dig @serverip example.com A +dig @serverip google.com A +``` + diff --git a/content/blog/cryptogames.md b/content/blog/cryptogames.md new file mode 100644 index 0000000..ce93e10 --- /dev/null +++ b/content/blog/cryptogames.md @@ -0,0 +1,101 @@ +--- +title: "Cryptographic Games" +date: 2020-01-13T21:35:09-05:00 +draft: false +images: [] +--- + +When analyzing cryptographic algorithms, we characterize the strength of the crypto-system by analyzing what happens in various crypto games. Below are a couple examples of crypto games used in literature. + +Actors typically involved in crypto games: + +| Actor | Role | +| ---------- | ---------------------------------------------------------- | +| Oracle | Encrypts a given message. | +| Challenger | Sets up the game between the oracle and adversary. | +| Adversary | Sends messages to the oracle and makes a guess at the end. | + + + +## Left-Right Game + +Here we will have two oracle's `left` and `right` both with a random key $k$. + +The challenger will create a random bit $b$ which is either $0$ or $1$. + +If the bit is $0$, then the adversary will send messages to `left`. Otherwise, the adversary will send messages to `right`. + +After a certain number of interactions the adversary needs to guess which oracle it is talking to. + +We define the adversary's advantage by the distance the probability is away from $\frac{1}{2}$. +$$ +advantage = |p - \frac{1}{2}| +$$ +Why the absolute value? Well if we only guess correctly $10\%$ of the time, then we just need to invert our guess to be correct $90\%$ of the time. + +``` +Generate key for both oracles +Generate random bit b +while game not done: + advesary generates message m + if b = 0: + send m to left oracle + receive c from left oracle + else: + send m to right oracle + receive c from right oracle +Adversary guesses whether b = 0 or 1 +``` + +## Real-Random Game + +This game is very similar to the last one except one of the oracle's only produces random bitstrings. + +An oracle is initialized with a random key $k$ and the challenger creates a random bit $b$. + +If $b = 0$, then the adversary will send messages to the oracle with the proper encryption function and will receive ciphertexts. Otherwise, the adversary will send messages to the random bitstring generator. + +At the end of the game, the adversary needs to guess whether its talking to a proper oracle or a random bitstring generator. + +The same metric `adversary's advantage` is used to characterize the strength of a crypto-system as the last one. + +``` +Generate key for both oracles +Generate random bit b +while game not done: + advesary generates message m + if b = 0: + send m to proper oracle + receive c from proper oracle + else: + send m to random oracle + receive random bitstring c from random oracle +Adversary guesses whether b = 0 or 1 +``` + +## Random Function - Random Permutation Trick + +One trick that we can use in proofs is to say that two procedures are the same up to a certain point when it diverges. + +Let us define $f$ to be some function that given a bitstring $X$ produces a random bitstring $Y$. + +Now, $image(f)$ is initially undefined since we don't know which bitstrings will be randomly generated. + +However, as we calculate $Y$ we will store it to build up $image(f)$. + +At some point, we'll generate $Y$ that already exists in $image(f)$. In that moment we will split based off of whether the procedure is a random function or random permutation. + +If random function, then just return the same $Y$ and end the procedure. Otherwise, return a random bitstring outside of the $range(f)$ and end the procedure. + +``` +Initialize function f with range(f) empty +Generate different random bitstring X +While f(X) not in range(f): + Add f(X) to range(f) + Generate different random bitstring X +If random function: + return f(X) +Else: + return random bitstring Y not in range(f) +``` + diff --git a/content/blog/ctf.md b/content/blog/ctf.md new file mode 100644 index 0000000..d2d5420 --- /dev/null +++ b/content/blog/ctf.md @@ -0,0 +1,31 @@ +--- +title: "Capture The Flag" +date: 2019-05-22T21:25:22-04:00 +draft: false +--- + +There is an event in Computer Security called "Capture The Flag". The purpose is to test the skills of security engineers and students through a variety of tasks in order to get a pass phrase which is called a flag. I noticed that Dr. Andrew Marshall wanted to set up this event at the University of Mary Washington for a while, so I and a few others decided to help make this a reality for him. + +**I didn't know you studied security?** Well honestly I don't. But that doesn't stop me from learning and creating cool challenges. + +## Challenges I Implemented + +In this post, I'll describe the various challenges I've implemented. I won't give the full problem description or answer just in case the problems get recycled in later years. + +### Web Archive Search + +In this problem I describe a discussion that an alumni and the student has. The alumni has trouble remembering a certain detail of an event held on campus. Key words and descriptions are given about the event and it is the job of the student to find the detail that the alumni wants. + +The juicy part of this problem is that the event is no longer on the current version of the university website. This means that ideally the student would go to the [Web Archive](http://web.archive.org/) to search and find for the information. + +*Funny enough, one contestant found the information by reading a really old publication from the time period described.* + +### Audio Recording + +In this challenge, I recorded a flag in an audio recording and distorted it using various tools in audacity. The idea is that you would get the audio clip and not be able to hear what the flag is and then have to import it into an audio editor of choice and manipulate it until the flag is clear. + +*Sadly no one was able to complete this challenge.* I think I made it too hard by voicing individual characters instead of doing a phrase. This would make ambiguous letters like "B" and "P" barely distinguishable from each other. + +### Hidden Text + +This challenge involves hiding text in the web page through some means. Hidden Text was meant to be one of the easiest problems to ease people onto the competition. You can easily solve this type of challenge by opening up the web inspector tool. \ No newline at end of file diff --git a/content/blog/custom-python-repl.md b/content/blog/custom-python-repl.md new file mode 100644 index 0000000..62c369b --- /dev/null +++ b/content/blog/custom-python-repl.md @@ -0,0 +1,32 @@ +--- +title: "Custom Python REPL" +date: 2019-10-27T23:43:12-04:00 +draft: false +--- + +Are you tired of importing the same libraries and setting up the same variables? Why not just create your own custom REPL? Now of course, we're not going to do it from scratch, but instead utilize what Python already gives us. + +Key Ingridient: + +```bash +python -i prompt.py +``` + +This tells Python to run prompt.py and then take you into an interactive prompt. + +Now let's populate `prompt.py` + +```python +#!/bin/env python +import favorite_libraries + +print("Welcome to your own custom REPL!") +print("Type help('function_name') to get a more detailed description on some of your own custom functions!") + +def help(function_name): + if function_name is "help": + print("Your very own help tool!") + else: + print("Sorry we don't have a help written for that yet :(") +``` + diff --git a/content/blog/digialmodes.md b/content/blog/digialmodes.md new file mode 100644 index 0000000..bae96c2 --- /dev/null +++ b/content/blog/digialmodes.md @@ -0,0 +1,78 @@ +--- +title: "Getting started with Digital Modes in Linux" +date: 2019-09-04T09:52:21-04:00 +draft: false +--- + +This blog post is going to describe what steps I took to be able to decode signals using digital modes. Hardware wise, you will either need a RTL-SDR receiver or a transceiver radio with a cable plugging into the computer's soundcard. + +## Software Required + +- Gqrx (depends on GNU Radio) + + - This is if you are trying to work with RTL-SDR + - It acts as a AM/FM/CW/etc demodulator for the data sent by the equipment + +- Fldigi + + - This is what decodes the protocol used to package the data + - It acts as a modem and provides capability to transmit data using a transceiver + +- Pavucontrol + + - This connects both Gqrx and Fldigi if using RTL-SDR + +As you can see, if you are only using a transceiver then you can skip the parts mentioning Gqrx and Pavucontrol + +## Process + +### Gqrx + +When you first open up Gqrx, it'll ask you to configure the device. I have the RTL2832U, so if you have the same tool... + +Select the profile partially labeled RTL2832U. If you want to look at frequencies between 0 and 28MHz then add to the device string "direct_samp=3". Otherwise don't add that string. + +You can keep the rest of the settings the same. + +### Fldigi + +When you first open up Fldigi, it'll ask you for our operator info. + +| Field | description | +| ----------------- | ----------------------------------------- | +| Station Callsign | Your callsign | +| Station QTH | City, State | +| Station Locator | Your grid code. (Can look this up on QRZ) | +| Operator Callsign | Your callsign | +| Operator Name | Your name | +| Antenna | Your antenna type | + +In Audio->Devices, make sure you select the physical device if you're using a transceiver, otherwise select PulseAudio. + +You can keep the rest of the settings as the default. + +### Pavucontrol + +Finally to link the two, run the following lines in bash to create a sink in order to push the audio from Gqrx to Fldigi. + +```bash +pacmd load-module module-null-sink sink_name=MyLoopback +pacmd update-sink-proplist MyLoopback device.description=MyLoopback +pacmd load-module module-loopback sink=MyLoopback +``` + +Now open up `pavucontrol`. On the Playback tab, change the output device of GQRX to be "MyLoopback" + +On the Recording tab, change the input of fldigi to "Monitor of Null Output" + +## Conclusion + +Now the software is sufficiently setup to be able to receive and decode signals. Best of luck finding things out there! + +## Beginner Pitfalls + +Since I'm also a beginner, I will share what I got stuck on and how you can avoid it. + +Make sure that you know the appropriate mode to demodulate the signal. I've had luck getting information from https://www.sigidwiki.com/wiki/Signal_Identification_Guide + +-> This needs to be configured on both Gqrx and Fldigi \ No newline at end of file diff --git a/content/blog/discoveringhamradio.md b/content/blog/discoveringhamradio.md new file mode 100644 index 0000000..ee0591c --- /dev/null +++ b/content/blog/discoveringhamradio.md @@ -0,0 +1,13 @@ +--- +title: "Discovering Ham Radio" +date: 2019-07-01T22:06:23-04:00 +draft: false +--- + +I feel like Ham Radio has been hiding in the background as I move through life. I knew someone that kept a Ham radio in his car, Noah talks about it frequently on his [podcast](http://www.asknoahshow.com/), and it seemed like the next step after [playing with](https://github.com/brandon-rozek/radiotuner) [software defined radio](https://www.amazon.com/RTL-SDR-Blog-RTL2832U-Software-Telescopic/dp/B011HVUEME/ref=sr_1_3). + +One of the things that I think pushed me over to wanting to get my Technician's license is the discovery of [digital data modes](http://www.arrl.org/digital-data-modes). Hams even have their own [email](https://www.winlink.org/)! + +Why is this more interesting than Internet? Well Ham Radio doesn't need any physical infrastructure setup (other than your radio and maybe some repeaters) to get you connected to other people. In fact, Hams often [volunteer](http://www.arrl.org/public-service) in natural disasters when the phone systems are down. + +This convinced to buy a [study guide](https://www.amazon.com/ARRL-Radio-License-Manual-Spiral/dp/1625950829/ref=sr_1_6) and start preparing to take my technicians test this summer. If you're interested in Ham Radio, please contact me at my email on my home page :) diff --git a/content/blog/docker-image-bash.md b/content/blog/docker-image-bash.md new file mode 100644 index 0000000..0a01784 --- /dev/null +++ b/content/blog/docker-image-bash.md @@ -0,0 +1,48 @@ +--- +title: "Advanced Docker Image Construction with Bash" +date: 2019-12-26T21:01:37-05:00 +draft: false +images: [] +--- + +On current versions of Docker, you can't mount volumes during image construction. This poses an issue for me as I don't want to replicate gigabytes of data already existing on my disk when it won't appear on the final build. Therefore, instead of building an image with a traditional Dockerfile, we're going to use a bash script on a running base image container and export the filesystem to create the image from. + +So first run the base image with the mounts that you want + +```bash +docker run -v /mnt:/mnt -td --name containername baseimage /bin/bash +``` + +Then copy whatever `setup` script you have and execute it on the running container + +```bash +docker cp setup containername:/setup +docker exec -it containername /setup +``` + +Once the setup script finalizes, we can export the container filesystem into a file called `image.tar` + +```bash +docker export --output="image.tar" containername +``` + +Once we've exported the filesystem, we can get rid of the existing container + +```bash +docker stop containername && docker rm containername +``` + +Now create a `Dockerfile` with the following: + +```dockerfile +FROM scratch +ADD image.tar / +CMD ["bin/bash"] +``` + +Now you can create the image by building the Dockerfile + +```bash +docker build -t finalimagename . +``` + diff --git a/content/blog/externalmediaformats.md b/content/blog/externalmediaformats.md new file mode 100644 index 0000000..fd41045 --- /dev/null +++ b/content/blog/externalmediaformats.md @@ -0,0 +1,18 @@ +--- +title: "External Media Formats" +date: 2019-05-22T22:03:38-04:00 +draft: false +--- + +I received an external SSD recently and I decided that it would be a great place to offload some of my backups. Before I got started, I became curious as to what filesystem to put on the SSD. After some research, it seems that if I want to be able to access it using Windows I am actually quite limited. In fact only three make sense: + +- FAT32 +- exFAT +- NTFS + +Now FAT32 is a legacy filesystem, Windows 95 type of legacy. So let's rule that one out. exFAT is supposed to be based on FAT32 but increases the file size limits significantly. It is also known for being very slim and as such does not having journaling support. NTFS is the filesystem that Windows 10 uses for default for it's installation. That file system supports journaling. + +I ended up going with NTFS due to its journaling support. Why is journaling important to me? Well this helps keep the file system internally consistent. The details are outside the scope of this post, but [Wikipedia has a nice entry](https://en.wikipedia.org/wiki/Journaling_file_system) about it. + +Well as it turns out, the drive that I was going to use already was formatted as NTFS. Though for sake of completeness, I will say that you can format drives with tools like `parted`, `gparted`, and `partitionmanager`. Just make sure that the drive you're formatting is what you think it is! + diff --git a/content/blog/fmradiotuner.md b/content/blog/fmradiotuner.md new file mode 100644 index 0000000..fbedf78 --- /dev/null +++ b/content/blog/fmradiotuner.md @@ -0,0 +1,26 @@ +--- +title: "FM Radio Tuner" +date: 2019-05-21T22:08:54-04:00 +draft: true +--- + +I recently bought a [RTL-SDR Receiver](https://www.amazon.com/RTL-SDR-Blog-RTL2832U-Software-Telescopic/dp/B011HVUEME/ref=sr_1_3) off of Amazon to get started with [Software Defined Radio](https://en.wikipedia.org/wiki/Software-defined_radio). To start off, I thought that it would be great if I can write a fm receiver. + +To begin you will need to install `gnuradio` and follow the following [instructions](https://osmocom.org/projects/rtl-sdr/wiki/Rtl-sdr). + +## GNURadio + + + + + +## QT + + + + + +## Modifying GNURadio Python Script + + + diff --git a/content/blog/gitlabcicd.md b/content/blog/gitlabcicd.md new file mode 100644 index 0000000..dba7ccc --- /dev/null +++ b/content/blog/gitlabcicd.md @@ -0,0 +1,9 @@ +--- +title: "Gitlab CI/CD" +date: 2019-07-01T21:36:56-04:00 +draft: false +--- + +One of the greatest benefits I believe of integrating Gitlab's CI/CD into your workload is code linting and building. This immediately eliminates the easy mistakes that developers make and wastes less people's time. + +I'm working towards getting the build setup just right in one of the projects I'm currently working. However, in the meantime, Gitlab supports running it's CI/CD jobs under the `shell executor`. I would like to go to the default Docker route in the future once I figure out all of the dependencies of the project I'm building. \ No newline at end of file diff --git a/content/blog/gitlens.md b/content/blog/gitlens.md new file mode 100644 index 0000000..3991a88 --- /dev/null +++ b/content/blog/gitlens.md @@ -0,0 +1,12 @@ +--- + +title: "Git Lens" +date: 2019-10-27T23:38:45-04:00 +draft: false +--- + +Git Lens is a great Visual Studio code extension. It annotates the line your cursor is on with the commit it came from. Extreemely useful for determining the reason that line of code is written or even who wrote it. + +Images from the github page. (If they still exist when you read this) + +![Current Line Blame](https://raw.githubusercontent.com/eamodio/vscode-gitlens/master/images/docs/current-line-blame.png)![Git Code Lens](https://raw.githubusercontent.com/eamodio/vscode-gitlens/master/images/docs/code-lens.png) \ No newline at end of file diff --git a/content/blog/groupssimplified.md b/content/blog/groupssimplified.md new file mode 100644 index 0000000..31cbfa6 --- /dev/null +++ b/content/blog/groupssimplified.md @@ -0,0 +1,38 @@ +--- +title: "Groups Simplified" +date: 2019-12-10T21:40:00-05:00 +draft: false +images: [] +--- + +This post is inspired by the book "Term Rewriting & All That" by Franz Baader and Tobias Nipkow. + +Let us have a set $G$ together with a binary operation $*$. We will use multiplicative notation throughout meaning $ab = a * b$. Let $x, y, z \in G$. If $\langle G , * \rangle$ has the following properties: + +1. $(x y)z = x (y z)$ +2. $ex = x$ +3. $x^{-1} x = e$ + +for some fixed $e \in G$, then we say that $\langle G, * \rangle$ is a group. In class, we needed to show that $xe = x$ and $xx^{-1} = e$. However, these can be derived by the prior properties. + +### Prove $xx^{-1} = e$ +\begin{align*} +e &= (xx^{-1})^{-1}(x x^{-1}) \\\\ +&= (xx^{-1})^{-1} (x (ex^{-1})) \\\\ +&= (xx^{-1})^{-1} (x ((x^{-1} x) x^{-1})) \text{ ----- (A)} \\\\ +&= (x x^{-1})^{-1} (x (x^{-1} x)x^{-1}) \\\\ +&= (x x^{-1})^{-1}((x x^{-1})xx^{-1}) \\\\ +&= (x x^{-1})^{-1} ((xx^{-1}) (x x^{-1})) \\\\ +&= ((x x^{-1})^{-1}(x x^{-1})) (x x^{-1}) \\\\ +&= e(xx^{-1}) \\\\ +&= xx^{-1} +\end{align*} +### Prove $xe = x$ + +Once we showed $xx^{-1} = e$, the proof of $xe = e$ is simple. +\begin{align*} +x &= ex \\\\ +&= (xx^{-1})x \\\\ +&= x(x^{-1}x) \\\\ +&= xe +\end{align*} diff --git a/content/blog/haskellrealsequences.md b/content/blog/haskellrealsequences.md new file mode 100644 index 0000000..950b89d --- /dev/null +++ b/content/blog/haskellrealsequences.md @@ -0,0 +1,49 @@ +--- +title: "Real Analysis Sequences in Haskell" +date: 2019-05-21T22:18:21-04:00 +draft: false +--- + +In Real Analysis it is useful to look at terms of a sequence. One of the best ways I've found to do this is in believe it or not Haskell. This is mainly for these two reasons + +- Support for infinite data structures + +- Built-in Data Type to keep fractional precision + +## Code + +Let's get started, first let us define a sequence by the following: +$$ +f(1) = 1, f(2) = 2, f(n) = \frac{1}{2}(f(n - 2) + f(n - 1)) +$$ +That is equivalent to the following haskell code: + +```haskell +f :: Integral a => a -> Ratio a +f 1 = 1 +f 2 = 2 +f n = 0.5 * (f (n - 2) + f (n - 1)) +``` + +Now to generate the sequence we just need to map $f$ onto the natural numbers. + +```haskell +nsequence = map f [1..] +``` + +If you want to look at specific subsequences, such as even or odd: + +```haskell +odd_generator n = 2 * n - 1 +odds = map odd_generator [1..] + +even_generator n = 2 * n +evens = map odd_generator [1..] +``` + +To look at the differences between each term: + +```haskell +diff x = map (\(a, b) -> a - b) $ zip (tail x) (init x) +``` + diff --git a/content/blog/limitbandwidth.md b/content/blog/limitbandwidth.md new file mode 100644 index 0000000..9900477 --- /dev/null +++ b/content/blog/limitbandwidth.md @@ -0,0 +1,37 @@ +--- +title: "Limit Bandwidth through Terminal" +date: 2020-01-15T19:51:45-05:00 +draft: false +images: [] +--- + +Have you ever wondered how an application or a system would operate under low bandwidth environments? Luckily `wondershaper` is a tool to help with just that! + +```bash +sudo apt install wondershaper +``` + +To get started, first find out the network `interface` that you want to throttle. + +```bash +ip addr show +``` + +To show the state of the interface, + +```bash +sudo wondershaper [interface] +``` + +To set the bandwidth, + +```bash +sudo wondershaper [interface] [downlink] [uplink] +``` +where downlink and uplink are defined in kilobits per second. + +To clear the rules, + +```bash +sudo wondershaper clear [interface] +``` \ No newline at end of file diff --git a/content/blog/linuxdesktopicons.md b/content/blog/linuxdesktopicons.md new file mode 100644 index 0000000..88f8960 --- /dev/null +++ b/content/blog/linuxdesktopicons.md @@ -0,0 +1,21 @@ +--- +title: "Linux Desktop Icons" +date: 2019-06-03T21:05:37-04:00 +draft: false +--- + +I get asked a decent number of times how to add desktop icons on Linux. Luckily it's incredibly easy. [It's a `freedesktop` standard](http://standards.freedesktop.org/desktop-entry-spec/latest/). + +In fact the simplest file would follow the format: + +```yaml +[Desktop Entry] +Name=Application Name +Exec=/path/to/executable -randomFlag +Icon=/optional/path/to/icon +Terminal=false +Type=Application +``` + +Once you have this saved to `yourapplication.desktop` move it to either `/usr/share/applications` if you want it system-wide or `/home/user/.local/share/applications` if you want it just for your `user`. + diff --git a/content/blog/livedoc.md b/content/blog/livedoc.md new file mode 100644 index 0000000..9601a8e --- /dev/null +++ b/content/blog/livedoc.md @@ -0,0 +1,21 @@ +--- +title: "Live Documentation" +date: 2019-09-27T23:07:19-04:00 +draft: false +--- + +This blog post is mostly for one of my teams in which I use Jupyter Notebooks for documentation. Perhaps after reading this post, you the reader can understand why it might be beneficial to use Jupyter Notebooks as a form of documentation. + +## Why? + +So why Jupyter Notebooks? + +- Follows the literate programming approach. You can write text explaining a feature and then immediately show code and it's result. +- It's modifiable. If your user wants to play around with the documentation, the environment is set up for them to do so. +- It's exportable. Let's say another user doesn't want to bother setting it up. Well it's super simple to just export the notebook as a PDF and send that to them instead. + +## Setting up + +Jupyter Notebooks are part of the [Project Jupyter](https://jupyter.org/) suite of products. You can install it via a `pip` package, but it is more commonly installed via the [Anaconda Distribution](https://www.anaconda.com/) + +Once you have that installed, run `jupyter lab` in the directory that you wish to execute code from. You might need to be in the `bash` shell for this to work since the installer modifies those environmental variables. \ No newline at end of file diff --git a/content/blog/localrepoiso.md b/content/blog/localrepoiso.md new file mode 100644 index 0000000..6a5ddeb --- /dev/null +++ b/content/blog/localrepoiso.md @@ -0,0 +1,29 @@ +--- +title: "Local Repo From Live Installer" +date: 2019-08-30T20:26:53-04:00 +draft: false +--- + +I'm going to share my experience setting up a local repo from a CentOS live CD. These instructions should work similarly in REHL. + +When working with off-network systems, it is often useful to have the base packages on the system after the installation process. Luckily the base packages are commonly included in the ISO installer. + +First I'm going to assume that you've mounted the ISO at `/mnt`. + +```bash +sudo mkdir -p /repos/local +sudo rsync -Paz /mnt/Packages /repos/local/Packages +sudo rsync -Paz /mnt/repodata /repos/local/repodata +``` + +Then create the file `/etc/yum.repos.d/local.repo` + +```yaml +[local] +name=Local Repo +baseurl=file:///repos/local/ +gpgcheck=0 +enabled=1 +``` + +Now you're all set to go with the packages on the Live CD! \ No newline at end of file diff --git a/content/blog/lxdtmpfs.md b/content/blog/lxdtmpfs.md new file mode 100644 index 0000000..dc9de48 --- /dev/null +++ b/content/blog/lxdtmpfs.md @@ -0,0 +1,102 @@ +--- +title: "LXD on tmpfs" +date: 2019-12-31T22:35:21-05:00 +draft: false +images: [] +--- + +Container images are designed to be as small as possible. Wouldn't it be cool if we can hold entire containers in RAM? This post outlines how to accomplish this using LXD. It turns out that it is a lot easier to setup custom storage pools on LXD than with Docker. + +## Setting up tmpfs + +`tmpfs` is a temporary filesystem that resides in memory. To get started, first create a directory that you want to mount with `tmpfs` + +```bash +mkdir /tmp/ramdisk +``` + +To only do this temporarily, then you can run the following command + +```bash +sudo mount -t tmpfs -o size=4G myramdisk /tmp/ramdisk +``` + +You can replace `4G` with any size less than your current RAM size. + +To set it up permanently, you will have to edit `/etc/fstab` + +``` +myramdisk /tmp/ramdisk tmpfs defaults,size=3G,x-gvfs-show 0 0 +``` + +## Setting up LXD + +LXD is a lightweight container hypervisor in Linux. To install and setup, please follow the beginning sections of https://linuxcontainers.org/lxd/getting-started-cli/ + +Once you've setup the initial configuration with `lxd init`, we can create a new storage pool using our newly created `tmpfs` + +```bash +lxc storage create tmplabel dir source=/tmp/ramdisk +``` + +We can then create a container that will use this storage pool + +```bash +lxc launch ubuntu:18.04 mycontainer -s tmplabel +``` + +In the last command, the `-s` flag indicates which storage pool we want to use. + +With this, our entire container filesystem lives in RAM! + +## (Optional) Setting up mounts + +One downside to putting the entire filesystem in RAM is that it isn't persistent across reboots. You can think of the container then as ephemeral and setup mountpoints to the host in order to save important configuration information. + +If the mount point is configured to be world writable or you only need it to be readonly, then this is very simple to setup! + +```bash +lxc config device add mycontainer dirlabel disk source=/path/on/host path=/path/on/container +``` + +This is because files in the container are marked as `nobody:nogroup`. If you want to be able to write to the mounted directory that's not setup to be world-writable then there's extra steps we need to take. + +Most of the following information is taken from: https://tribaal.io/nicer-mounting-home-in-lxd.html + +Let's say that you want LXD to be able to write to a folder that you own. First we need to allow LXD to remap your user ID. + +```bash +echo "root:$UID:1" | sudo tee -a /etc/subuid /etc/subgid +``` + +We only need to do this once per host system. + +The Ubuntu container has a user called `ubuntu` with UID 1000. We can remap that userid, otherwise you would have to create another user on the container to remap. + +If you create another user, make sure you get its id for the next command: + +```bash +# In the container +id -u username +``` + +For the rest of this tutorial, we will assume that you have a user named ubuntu with UID 1000. + +Once LXD is able to remap your user id, you can tell it to do so for the container of interest. + +```bash +lxc config set mycontainer raw.idmap "both $UID 1000" +``` + +Now to setup the mount + +```bash +lxc config device add myubuntu homedir disk source=$HOME path=/home/ubuntu +``` + +Restart the container and now the `ubuntu` user will be able to write to the mount! + +```bash +lxc restart mycontainer +``` + diff --git a/content/blog/male-vs-female-life-expectancy2052-revision-v1-Male-vs-Female-Life-Expectancy.md b/content/blog/male-vs-female-life-expectancy2052-revision-v1-Male-vs-Female-Life-Expectancy.md new file mode 100644 index 0000000..747b121 --- /dev/null +++ b/content/blog/male-vs-female-life-expectancy2052-revision-v1-Male-vs-Female-Life-Expectancy.md @@ -0,0 +1,208 @@ +--- +id: 2169 +title: Male vs Female Life Expectancy +date: 2017-03-16T14:12:40+00:00 +author: rozek_admin +layout: revision +guid: https://brandonrozek.com/2017/03/2052-revision-v1/ +permalink: /2017/03/2052-revision-v1/ +--- +![](https://brandonrozek.com/wp-content/uploads/2017/03/LifeExpectancyBoxplot.png) + +## Do females live longer than males? + +It is well known that females live longer than males, but does that statement hold statistically? Matthew Martinez and I set out to find out. + + + +## Population and the hypothesis + +Our population of concern is citizens of the United States. We found a dataset on [WorldLifeExpectancy](http://www.worldlifeexpectancy.com/) listing by county the average life expectancy for both males and females. With this we form our null and alternative hypothesis + +H0: The average life expectancy for both males and females are the same in the United States + +HA: The average female life expectancy is higher than the average male life expectancy in the United States + +## Data preparation + +Since the website gives us an overlook at all of the counties in the United States we want to take a small sample of that so we can perform statistics. Using the entire dataset will result in looking at population parameters which doesn’t leave room for inference. + +A random number was chosen to pick the state and then the county. This was done a total of 101 times. The CSV file is located [here](https://brandonrozek.com/wp-content/uploads/2017/03/LifeExpectancy.csv) for convenience. + +## R Programming + +For the rest of this article, we will use R for analysis. This article will focus more on the analysis, however, than the R code. + +Read the CSV file into R + +
rm(list=ls())
+
+# Read in file
+LifeExpectancy = read.csv("~/LifeExpectancy.csv")
+maleExpectancy = LifeExpectancy$Life.Expectancy.Male
+femaleExpectancy = LifeExpectancy$Life.Expectancy.Female
+
+ +## Summary Statistics + +Before we begin our inferential statistics, it is a good idea to look at what we have in our sample. It will give us a good feeling for what we’re working with and help us answer some questions involving the assumptions in parametric tests. + +We’re interested in the minimum, mean, maximum, and interquartile range of the data + +

+# Summary statistics
+male_row = c(min(maleExpectancy), mean(maleExpectancy), max(maleExpectancy), IQR(maleExpectancy))
+female_row = c(min(femaleExpectancy), mean(femaleExpectancy), max(femaleExpectancy), IQR(femaleExpectancy))
+summary = rbind(male_row, female_row)
+colnames(summary) = c("Min", "Mean", "Max", "IQR")
+rownames(summary) = c("Male", "Female")
+
+ +Looking at the table below, we can see that the average male lives to be around 69 years old in our sample while the average female lives to be about 71 years old. One interesting thing to note is how small the variation is between all the counties life expectancy that we sampled. + +
summary
+##         Min   Mean  Max   IQR
+## Male   69.0 74.952 80.9 2.775
+## Female 76.1 80.416 84.1 2.350
+ +## Inferential Statistics + +From here on out, we will perform a hypothesis test on the two hypothesis stated earlier in the text. + +Since our data is quantitative in nature, we will attempt to perform a two sample t-test + +### Check for Assumptions + +Performing a t-test comes with several assumptions we need to check before confidently reporting our results. + +Independence Condition: One county’s life span does not affect the lifespan of another. + +Independent groups assumption: The lifespan of a male does not directly impact a lifespan of a female. + +Nearly Normal Condition: We need to check the histograms to see if they’re unimodal and symmetric and check to see if any outliers exist + +The male life expectancy distribution appears to be unimodal and symmetric. + +
# Check for normality
+hist(maleExpectancy, main = "Male Life Expectancy", xlab = "Age")
+ + + +Same with the female life expectancy distribution + +
hist(femaleExpectancy, main = "Female Life Expectancy", xlab = "Age")
+ + + +Looking at the boxplot, we can see that the IQR of the female life expectancy is higher than the one of the males. The hypothesis test will show us if this is of significant difference. On the male’s side there are two outliers. This violates the Nearly Normal Condition so we must proceed with caution in our test. + +
boxplot(maleExpectancy, femaleExpectancy, names = c("Male Life Expectancy", "Female Life
+                                                        Expectancy"), ylab = "Age")
+ + + +Since the nearly normal condition was not met, we do not meet the assumptions necessary to perform a t-test. However, since the condition was violated by an outlier, let us perform a t-test with the outlier and without the outlier and compare the results. + +### Calculate the Test Statistic + +Let us conduct a two sample t-test with the alternative hypothesis being that the female average life expectancy is greater than that of the males + +Running the test below shoes us a p-value of less than 0.001. This tells us that the probability of obtaining a sample as extreme as the one obtained is close to zero. Therefore at a significance level of 5%, we reject the null hypothesis and state that there is strong evidence to suggest that females have a greater life expectancy that that of males. + +
# Test alternative hypothesis
+t.test(femaleExpectancy, maleExpectancy, alternative='g')
+ +
## 
+##  Welch Two Sample t-test
+## 
+## data:  femaleExpectancy and maleExpectancy
+## t = 18.858, df = 182.48, p-value < 2.2e-16
+## alternative hypothesis: true difference in means is greater than 0
+## 95 percent confidence interval:
+##  4.984992      Inf
+## sample estimates:
+## mean of x mean of y 
+##    80.416    74.952
+ +In fact, we are 95% confident that the difference between the average female life expectancy and the average male life expectancy in the United States is between 5 and 6 years. Females live on average 5-6 years longer than males in the United States. + +# Find confidence interval<br /> +t.test(femaleExpectancy, maleExpectancy) + +
## 
+##  Welch Two Sample t-test
+## 
+## data:  femaleExpectancy and maleExpectancy
+## t = 18.858, df = 182.48, p-value < 2.2e-16
+## alternative hypothesis: true difference in means is not equal to 0
+## 95 percent confidence interval:
+##  4.892333 6.035667
+## sample estimates:
+## mean of x mean of y 
+##    80.416    74.952
+ +### Outlier Analysis + +We cannot forget that we had outliers in our dataset. This might affect the results of our test. The point of outlier analysis is to see if such changes are significant. + +First let us remove the outliers in R + +
# Remove outliers
+maleExpectancy2 = maleExpectancy[!maleExpectancy %in% boxplot.stats(maleExpectancy)$out]
+
+ +Then let us check the histogram and boxplots to see if the nearly normal condition is now met. + +Looking at the boxplot, there are no more outliers present + +

+# Check graphs again
+boxplot(maleExpectancy2, ylab = "Age", main = "Male Life Expectancy w/o Outliers")
+ + + +The histogram still appears to be unimodal and symmetric + +
hist(maleExpectancy2, xlab = "Age", main = "Male Life Expectancy w/o Outliers")
+ + + +Without the outliers present, the nearly normal condition is now met. We can perform the t-test. + +We can see that the hypothesis test returns the same results as before, this tells us that the outliers did not have a significant impact on our test results + +
# Test new alternative
+t.test(femaleExpectancy, maleExpectancy2, alternative='g')
+ +
## 
+##  Welch Two Sample t-test
+## 
+## data:  femaleExpectancy and maleExpectancy2
+## t = 19.471, df = 184.03, p-value < 2.2e-16
+## alternative hypothesis: true difference in means is greater than 0
+## 95 percent confidence interval:
+##  5.000048      Inf
+## sample estimates:
+## mean of x mean of y 
+##  80.41600  74.95204
+ +Redoing the confidence intervals, we can see that it did not change greatly + +
# Find new confidence interval
+t.test(femaleExpectancy, maleExpectancy2)
+ +
## 
+##  Welch Two Sample t-test
+## 
+## data:  femaleExpectancy and maleExpectancy2
+## t = 19.471, df = 184.03, p-value < 2.2e-16
+## alternative hypothesis: true difference in means is not equal to 0
+## 95 percent confidence interval:
+##  4.910317 6.017601
+## sample estimates:
+## mean of x mean of y 
+##  80.41600  74.95204
+ +## Conclusion + +By running the tests and checking the effects of the outliers in the dataset and seeing that the results did not change, we can safely conclude that our interpretations stated before are correct. There is enough evidence to suggest that females in the United States live on average longer than males. We are 95% confident that they live longer than males by 5 to 6 years. \ No newline at end of file diff --git a/content/blog/manpandoc.md b/content/blog/manpandoc.md new file mode 100644 index 0000000..27f7341 --- /dev/null +++ b/content/blog/manpandoc.md @@ -0,0 +1,58 @@ +--- +title: "Man Pages with Pandoc" +date: 2019-11-07T21:42:08-05:00 +draft: false +--- + +[Ethan Martin](https://emar10.dev) recently showed off the Pandoc tool to me. In case you don't know, Pandoc is a swiss-army knife of markup languages. It allows you to easily convert from one markup language to another. + +This got me thinking my love for Markdown as the lowest common denominator for my notes. I can write markdown files for my website, for presentations, and output it into PDF and Word. Of course you don't get to have the fine control as you do with Latex, but with document classes, you can at least theme it any way you like! + +Now to focus this blog post, I do want to share one really cool feature I found out about Pandoc. It can create man pages. I thought of this as a great way to create documentation for a software project. I'll give you an example to kick things off. + +Note: The content is stolen from the `git` man page. + +```markdown +--- +title: git +section: 1 +header: Git Manual +--- + +# NAME + git - the stupid content tracker + +# SYNOPSIS + git `[--version] [--help]` + +# DESCRIPTION + Git is a fast, scalable, distributed revision control system with an unusually rich command set that provides both high-level operations and full access to internals. + + See **gittutorial**(7) to get started, then see **giteveryday**(7) for a useful minimum set of commands. The **Git User’s Manual**[1] has a more in-depth introduction. + + After you mastered the basic concepts, you can come back to this page to learn what commands Git offers. You can learn more about individual Git commands with "git help command". **gitcli**(7) manual page gives you an overview of the command-line command syntax. + + A formatted and hyperlinked copy of the latest Git documentation can be viewed at **https://git.github.io/htmldocs/git.html**. + +# OPTIONS + --version + Prints the Git suite version that the git program came from. + + --help + Prints the synopsis and a list of the most commonly used commands. If the option --all or -a is given then all available commands are printed. If a Git command is named this option will bring up the manual page for that command. + + Other options are available to control how the manual page is displayed. See git-help(1) for more information, because git --help ... is converted internally into git help .... +``` + +Then execute + +```bash +pandoc -s -t man -o git.1 git.md +``` + +Here's what the command means: "Run `pandoc` on standalone mode converting `git.md` into a man page called `git.1`" + +To see the results run `man ./git.1` + +![1573183066061](/files/images/1573183066061.png) + diff --git a/content/blog/memoryerrorsgo.md b/content/blog/memoryerrorsgo.md new file mode 100644 index 0000000..72beb7c --- /dev/null +++ b/content/blog/memoryerrorsgo.md @@ -0,0 +1,20 @@ +--- +title: "Memory Errors in Go" +date: 2019-08-02T22:35:53-04:00 +draft: false +--- + +I enjoy playing with Valgrind. Sometimes I view it as a game to get rid of memory errors. When I wrote a go script, I noticed that I received a lot of memory errors. I decided to double check by writing a simple hello world program in Go. + +```go +package main +import "fmt" +func main() { + fmt.Println("Hello World") +} +``` +Running this then gives me a bunch of memory errors of the form `Invalid read of size 4`. + +Now this doesn't mean that the program is leaky. Valgrind does confirm that no leaks are possible. It then begs the question, does this type of memory error even matter? + +To avoid thinking about that I decided to play with [Rust](https://rust-lang.org) instead. \ No newline at end of file diff --git a/content/blog/mergerfs.md b/content/blog/mergerfs.md new file mode 100644 index 0000000..8745a3c --- /dev/null +++ b/content/blog/mergerfs.md @@ -0,0 +1,44 @@ +--- +title: "MergerFS" +date: 2020-01-14T23:10:17-05:00 +draft: false +images: [] +--- + +[MergerFS](https://github.com/trapexit/mergerfs) is a great filesystem for an expandable storage system in a homelab. Mostly since it allows you to add disks one at a time without having to, for example, resilver a ZFS pool. MergerFS won't be as efficient as a filesystem that stripes your data across disks, but in the case of a disk failure the disks unaffected will still have part of the data. + +[Plenty](https://blog.linuxserver.io/2017/06/24/the-perfect-media-server-2017/) of other [people](https://www.teknophiles.com/2018/02/19/disk-pooling-in-linux-with-mergerfs/) described MergerFS, so I'll keep this post simple. + +First install MergerFS, + +```bash +sudo apt install mergerfs +``` + +The way I have my drives in my homelab setup is to have `/mnt/data/N` where `N` is the number of the drive. + +Examples: `/mnt/data/1`, `/mnt/data/2`, `/mnt/data/3` + +This is mainly so that I can use wildcards to capture all the drives at once. + +Temporary mounting solution: + +```bash +sudo mergerfs -o defaults,allow_other,use_ino,fsname=data /mnt/data/\* $HOME/data +``` + +Permanent solution (Edit `/etc/fstab`) + +```bash +/mnt/data/* /home/user/data fuse.mergerfs defaults,allow_other,use_ino,fsname=data 0 0 +``` + +Quick summary of options passed + +| Option | Description | +| ----------- | ------------------------------------------------------------ | +| defaults | Shortcut for atomic_o_trunc, auto_cache, big_writes, default_permissions, splice_move, splice_read, splice_write | +| allow_other | Allows users beside the mergerfs owner to view the filesystem. | +| use_ino | MergerFS supplies inodes instead of libfuse | +| fsname | Name of the mount as shown in `df` and other tools | + diff --git a/content/blog/missingdata.md b/content/blog/missingdata.md new file mode 100644 index 0000000..afb020b --- /dev/null +++ b/content/blog/missingdata.md @@ -0,0 +1,14 @@ +--- +title: "Considerations with Missing Data" +date: 2019-05-22T23:18:45-04:00 +draft: true +--- + +Write something about "Missing Completely at Random" (MCAR) and maybe talk about a couple R packages for visualizing this.. + + + +Oh and also techniques for imputing + +- multiple imputation with chained equations +- random forest \ No newline at end of file diff --git a/content/blog/networkthroughput.md b/content/blog/networkthroughput.md new file mode 100644 index 0000000..e968925 --- /dev/null +++ b/content/blog/networkthroughput.md @@ -0,0 +1,27 @@ +--- +title: "Network Throughput Testing" +date: 2019-08-30T20:11:26-04:00 +draft: false +--- + +I ended up upgrading the wiring in my place to CAT7 recently and I wanted to see if there was a noticeable performance difference to my previous cabling. This blog post won't be a product comparison, but instead I'll show how you can do network throughput testing at your own location. + +There is a great package called `iperf`. It's in most repositories under Linux, and binaries for Windows and macOS exist as well. + +For a more in depth tutorial [check out this post from Linode](https://www.linode.com/docs/networking/diagnostics/install-iperf-to-diagnose-network-speed-in-linux/). + +*For the 5 second spiel...* + +One one machine, start the server + +```bash +iperf -s +``` + +On another machine connect to the server and begin testing the connection + +```bash +iperf -c 192.168.0.2 +``` + +You can also use the `-t` flag to specify the number of seconds you want to run the test for. diff --git a/content/blog/ngrok.md b/content/blog/ngrok.md new file mode 100644 index 0000000..fc42645 --- /dev/null +++ b/content/blog/ngrok.md @@ -0,0 +1,24 @@ +--- +title: "Ngrok" +date: 2019-11-20T20:56:19-05:00 +draft: false +--- + +Let's say you want to spin up a quick demo for a client and you don't want to use a VPS, and they can't access your laptop through the network. + +The easiest way I've known for the past few years to allow another person to access a specific port on your machine is through [ngrok](https://ngrok.com/). Ngrok is nice because not only do they offer a free plan, but they also offer paid plans. This means that you can trust that it'll at least be in business for a little while longer ;) + +## The Process + +You'll need to sign up for an account first. I was then going to write about some of the following steps, but `ngrok` has a really nice quad chart when you login + +![steps](/files/images/0932485094325.png) + +Just note that in step (3) you will actually have a random sequence of characters after `authtoken`. + +Something else you might want to know is how to enable TLS support, luckily that's a simple command line argument. + +```bash +ngrok http -bind-tls=true port +``` + diff --git a/content/blog/notimplemented.md b/content/blog/notimplemented.md new file mode 100644 index 0000000..a2f6454 --- /dev/null +++ b/content/blog/notimplemented.md @@ -0,0 +1,16 @@ +--- +title: "NotImplemented" +date: 2019-10-27T23:35:17-04:00 +draft: false +--- + +Let's say you overwrite the `__mul__` operator in a class in Python, but you don't want the function to be called for all kinds of input. You can specify the type by just returning `NotImplemented` for types you don't want. + +```python +class A: + def __mul__(self, x): + if not isinstance(x, A): + return NotImplemented + return someOperation() +``` + diff --git a/content/blog/ohmyzsh.md b/content/blog/ohmyzsh.md new file mode 100644 index 0000000..c7488e4 --- /dev/null +++ b/content/blog/ohmyzsh.md @@ -0,0 +1,45 @@ +--- +title: "Oh My Zsh" +date: 2019-07-21T08:45:03-04:00 +draft: false +--- + +Zsh is an extension of the sh that contains a lot more features than the default bash shell installed on most systems. + +For example, one of my new favorite features is being able to type in part of a command in your history and using the up-arrow to find it. + +For example: + +```bash +vim test.hi +``` + +Then typing `vim` and up-arrow will expand it to `vim test.hi`. Super handy when you have to type of long commands frequently. + +*Oh My Zsh* is a community project that superpowers zsh which allows you to easily add plugins and themes. The theme I'm currently using is [powerlevel10k](https://github.com/romkatv/powerlevel10k#oh-my-zsh) which is a custom theme. + +The list of plugins I have is: + +- git +- colored-man-pages +- colorize +- command-not-found +- cp +- rsync +- screen +- ssh-agent +- web-search +- docker +- node +- npm +- nvm +- gem +- ruby +- pip +- python +- pyenv +- virtualenv +- debian +- systemd +- sudo +- zsh-syntax-highlighting \ No newline at end of file diff --git a/content/blog/proofdef.md b/content/blog/proofdef.md new file mode 100644 index 0000000..2a863db --- /dev/null +++ b/content/blog/proofdef.md @@ -0,0 +1,17 @@ +--- +title: "Theorem Proving Definitions" +date: 2019-12-29T11:21:07-05:00 +draft: false +images: [] +--- + +When I look into a new field, sometimes I get confused by the whole new set of vocab terms I need to encounter. This post will serve to keep me straight with the terms involved in theorem proving. + +| Word | Definition | +| ------------ | ------------------------------------------------------------ | +| Modus Ponens | If $P$ implies $Q$ and $P$ is asserted to be true, then $Q$ must be true. | +| Complete | If every formula having the property can be derived using the system. (i.e The system does not miss a result) | +| Decidable | An effective method exists for deriving the correct answer in a finite time. | +| Sound | Every formula that can be proved in the system is logically valid with respect to the semantics of the system. (i.e The system does not produce a wrong result) | + +Hopefully, I'll come back and add more terms as I get confused. \ No newline at end of file diff --git a/content/blog/pythonpathhacks.md b/content/blog/pythonpathhacks.md new file mode 100644 index 0000000..baa9659 --- /dev/null +++ b/content/blog/pythonpathhacks.md @@ -0,0 +1,31 @@ +--- +title: "Python Path Hacks" +date: 2020-01-13T22:26:16-05:00 +draft: false +images: [] +--- + +There are two quick ways to hack together custom imports in Python. One is by using the `PYTHONPATH` environmental variable, and the other way is by using the `sys` module in Python. + +## Method 1: `PYTHONPATH` + +Before you call `python` set the environmental variable. + +```bash +PYTHONPATH=$PYTHONPATH:/other/path +``` + +Then you can call `python`. + +## Method 2: `sys` + +In the beginning of your Python script add the following code. + +```python +import sys +sys.path.append('/other/path') +``` + +## Remarks + +Of course this isn't the best way to add custom libraries to your Python scripts. Ideally, we would use `pip` to manage our dependencies. Perhaps a future blog post will cover this! \ No newline at end of file diff --git a/content/blog/pythonsymmetricgroups.md b/content/blog/pythonsymmetricgroups.md new file mode 100644 index 0000000..dc4db75 --- /dev/null +++ b/content/blog/pythonsymmetricgroups.md @@ -0,0 +1,109 @@ +--- +title: "Symmetric Groups in Python" +date: 2019-05-22T20:02:21-04:00 +draft: false +--- + +**Warning:** This post is meant for someone whose familiar with concepts of Abstract Algebra. + +## Refresher + +### Definitions + +An **operation** on a set is a calculation that maps one element in a set onto another element of the set. + +A **group** in mathematics is a set and an operation that follows the three properties: + +- There exists an identity element. +- The operation is associative. +- For every element, there exists an inverse of that element in the set. + +**Symmetric Groups** are groups whose elements are all bijections from the set onto itself and operation which is composition of functions. + +### Example + +Let's look at the group $\mathbb{Z}_3$. Here is an example of an element of its symmetric group. +$$ +\begin{pmatrix} +0 & 1 & 2 \\ +1 & 2 & 0 +\end{pmatrix} +$$ +This element maps $0 \rightarrow 1$, $1 \rightarrow 2$, and $2 \rightarrow 0$. + +A good way to check if something similar to the above is an element of a symmetric group is pay attention to the second row. Make sure that it only contains the elements of the set you care about (ex: $\mathbb{Z}_3$) and that there are no repeats. + +Let's look at an example of composing two elements from this symmetric group. +$$ +\begin{pmatrix} +0 & 1 & 2 \\ +1 & 2 & 0 +\end{pmatrix} +\circ +\begin{pmatrix} +0 & 1 & 2 \\ +0 & 2 & 1 \\ +\end{pmatrix} += +\begin{pmatrix} +0 & 1 & 2 \\ +1 & 0 & 2 \\ +\end{pmatrix} +$$ +The main thing to remember here is that you must compose from right to left. + +$0 \rightarrow 0$ and then $0 \rightarrow 1$, so ultimately $0 \rightarrow 1$. + +$1 \rightarrow 2$ and $2 \rightarrow 0$, so ultimately $1 \rightarrow 0$. + +$2 \rightarrow 1$ and $1 \rightarrow 2$, so ultimately $2 \rightarrow 2$. + +### Finding Inverses + +Finding the inverse is simple, since all you need to do is flip the two rows and sort it again. +$$ +\begin{pmatrix} +0 & 1 & 2 \\ +1 & 2 & 0 +\end{pmatrix}^{-1} = +\begin{pmatrix} +1 & 2 & 0 \\ +0 & 1 & 2 +\end{pmatrix} = +\begin{pmatrix} +0 & 1 & 2 \\ +2 & 0 & 1 +\end{pmatrix} +$$ + + ### Code Implementation + +For Abstract Algebra homework, there was a lot of compositions of these symmetric elements. Sadly, I get pretty lazy doing these by hand for many hours. So like any Computer Scientist, I created a simple script in Python to help me compute these. + +The code is located in [this gist](https://gist.github.com/Brandon-Rozek/adf9e1e64e2fbfcd3f8d3bc5da9322bf). + +#### Basic Usage + +`SymmetricElement` takes in the second row of the matrices we were playing with. You can find the inverse with `element.inverse()` and you can compose two symmetric elements together with the `*` operation. + +```python +SymmetricElement(1,2,3) +# array([[1., 2., 3.], +# [1., 2., 3.]]) +``` + +```python +SymmetricElement(1,2,3) * SymmetricElement(2,1,3) +#array([[1., 2., 3.], +# [2., 1., 3.]]) + +``` + +```python +SymmetricElement(1,2,3).inverse() +#array([[1., 2., 3.], +# [1., 2., 3.]]) +``` + + + diff --git a/content/blog/pythontyping.md b/content/blog/pythontyping.md new file mode 100644 index 0000000..e566c1e --- /dev/null +++ b/content/blog/pythontyping.md @@ -0,0 +1,14 @@ +--- +title: "Python Typing" +date: 2019-10-28T00:12:34-04:00 +draft: false +--- + +There's a typing module built right into Python that you can use on your applications. Sobolevn write a great [blog post](https://sobolevn.me/2019/01/simple-dependent-types-in-python) about it. One thing that threw me off at first is that if you add type annotations and then run python like you normally would, it would act as if the annotations weren't there. + +Why use type annotations then? + +1. It enhances your internal docs. VS Code and other editors pick this up and show it to the user in their IDE. +2. You can use `mypy` to perform type checking for you. + +I go back and forth with type checking in Python, but I do think that forcing yourself to follow type safety makes you a better programmer. \ No newline at end of file diff --git a/content/blog/quickstoragesetup.md b/content/blog/quickstoragesetup.md new file mode 100644 index 0000000..8b81411 --- /dev/null +++ b/content/blog/quickstoragesetup.md @@ -0,0 +1,71 @@ +--- +title: "Quickly Setting up a Storage Device" +date: 2020-01-12T21:43:26-05:00 +draft: false +images: [] +--- + +This post exists mostly to aid myself for when I buy new drives for my home server. It's a quick and easy way to create an ext4 filesystem over the entire drive. + +To go through this post, you'll need to know the name of your drive. + +```bash +sudo fdisk -l +``` + +or + +```bash +lsblk +``` + +The drive is most likely one of the larger devices with no partitions set. It'll likely be of the format `/dev/sdX`. + +To begin, we'll have to set the label. Here we'll use `gpt`. + +```bash +sudo parted /dev/sdX mklabel gpt +``` + +Then we can create a primary partition formatted with ext4 covering the entire device. + +```bash +sudo parted -a opt /dev/sdX mkpart primary ext4 0% 100% +``` + +Now we can let `ext4` format the drive, + +```bash +sudo mkfs.ext4 /dev/sdX +``` + +I like to set up my mount points to be `/mnt/data/N` where N is the number of the drive I'm working with. + +```bash +sudo mkdir /mnt/data/N +``` + +To temporarily mount it, just to make sure it works you can run + +```bash +sudo mount /dev/sdX /mnt/data/N +``` + +You can unmount it with `umount` + +```bash +sudo umount /dev/sdX +``` + +When you're ready to make it permanent, we'll have to edit the `/etc/fstab` file. We should note the drive by its UUID so that it's not dependent on the slot the hard drive sits in. You can find it by running this command + +```bash +lsblk -o UUID /dev/sdX1 +``` + +Now you can append your `/etc/fstab` with the following: + +```bash +UUID=uuid-here /mnt/data/N ext4 defaults 0 0 +``` + diff --git a/content/blog/robustdd.md b/content/blog/robustdd.md new file mode 100644 index 0000000..b8038ef --- /dev/null +++ b/content/blog/robustdd.md @@ -0,0 +1,33 @@ +--- +title: "Robustdd" +date: 2019-09-27T22:45:56-04:00 +draft: false +--- + +This blog post is going to assume that we're writing to `/dev/sdX`. Please change this to whatever disk you're actually trying to write to. I bear no responsibility if you accidentally write to your OS drives. + +Make sure the disk you wish to write to is unmounted. + +```bash +sudo umount /dev/sdX +``` + +For good measure check `lsblk`.... + +Then perform the writing operation + +```bash +sudo dd bs=4M if=/path/to/distro.iso of=/dev/sdX conv=fdatasync status=progress +``` + +`fdatasync` will wait until the data is physically written into the drive before finishing. + +Once that operation is done we can check to see if it is performed properly. This step will only work for ISOs that have prepared a file similar to `md5sum.txt` that Ubuntu provides.... + +```bash +sudo mount /dev/sdX /mnt +cd /mnt +md5sum -c md5sum.txt +``` + +Hopefully you'll see all `OK` and we're good to go! diff --git a/content/blog/rsa.md b/content/blog/rsa.md new file mode 100644 index 0000000..4f3ec5a --- /dev/null +++ b/content/blog/rsa.md @@ -0,0 +1,72 @@ +--- +title: RSA Cryptography +date: 2019-12-10T22:15:21-05:00 +draft: false +images: [] +--- + +# Introduction + +Why do we need Cryptography? Well let's say Bob is purchasing things from Alice over the internet. He wants to give Alice his credit card details to complete his transaction, but he feels uncomfortable with the thought that others can possibly read it as well. RSA is a cryptosystem that underlies HTTPS, and this gives Bob a sense of security that only Alice can see his message. + +The journey of RSA starts in 1976 when Whitfield Diffie and Martin Hellman published a framework describing an asymmetric public-private key cryptosystem through four key steps: + +1. Key Generation +2. Key Distribution +3. Encryption with one-way function (using a public key) +4. Decryption (using a private key) + +They left the one-way function undefined, making it an open problem for the community. Ron **R**ivest, Adi **S**hamir, and Leonard **A**dleman at MIT took up this challenge. Rivest and Shamir were Computer Scientists trying to come up with this function while Adleman was the mathematician tasked with finding flaws in their discoveries. After working together to develop the RSA cryptosystem in 1977, Rivest, Shamir, and Adleman went on to found the organization RSA Data Security in 1982. + +# RSA Algorithm + +In this section, we'll look at the RSA algorithm through the lens of the four steps listed in the previous section. + +#### Key Generation + +Alice needs to generate public and private keys through the following method: + +1. Choose two distinct prime integers $p$ and $q$. +2. Compute $n = pq$. The integer $n$ will be later released as part of the *public key*. +3. Calculate $\phi(n)$ which by the Euler's Totient Product of Primes property is $(p - 1)(q - 1)$. +4. Choose $e \in \mathbb{Z}$ such that $e$ and $\phi(n)$ are relatively prime. The integer $e$ will also be released as part of the *public key*. +5. Calculate $d$, the multiplicative inverse of $e$ modulo $\phi(n)$. The integer $d$ will be kept secret as the *private key*. + +#### Key Distribution + +For Bob to send a message to Alice, he will need to know Alice's public key $n$ and $e$. Bob, however, does not need to know Alice's prime integers $p$ and $q$ that divide $n$. Nor does he need to know the private key $d$. + +#### Encryption + +Let $m \in \mathbb{Z}_n$ be the message that Bob wants to send. Bob calculates this number from his message using an agreed-upon reversible algorithm. The ciphertext or encrypted block $c$ is computed by, $c \equiv m^e$ (mod $n$). Bob then sends the ciphertext to Alice. + +#### Decryption + +Alice receives this ciphertext $c$ from Bob and then can recover the original message $m$ by computing $c^d$ modulo $n$. How is this possible? Well recall that $c^d \equiv (m^e)^d$. Then, $c^d \equiv m^{ed}$ by exponent rules. Recall that $e$ and $d$ are multiplicative inverses modulo $\phi(n)$. Therefore by definition, $ed = 1 + \phi(m)t$ for some $t \in \mathbb{Z}$. Then, + +\begin{align*} +c^d &\equiv m^{1 + \phi(n)t} \\\\ + &\equiv m(m^{\phi(n)})^t +\end{align*} + +Well since $n$ is prime, by Euler's Theorem $m^{\phi(n)} \equiv 1$ modulo $n$. Thus, $c^d \equiv m \cdot 1^t \equiv m$ modulo $n$. Through this short proof, we can see that Alice successfully retrieves Bob's message $m$ just by raising the ciphertext $c$ to the power of the private key $d$. + +## Example + +Let's run through a short example of this algorithm with small integers. Let $p = 3, q = 5$. Then $n = pq = 15$. We then calculate $\phi(n) = \phi(p)\phi(q) = 2(4) = 8$. An integer $e$ that is relatively prime to $\phi(n)$ is $11$. Finally we compute the inverse of $e$ modulo $\phi(n)$. + +\begin{align*} +11d &\equiv 1 \text{ (mod $8$) } \\\\ +11d &\equiv 33 \text{ (mod $8$)} \\\\ +d &\equiv 3 \text{ (mod $8$)} +\end{align*} + + +Alice then gives Bob the integers $n = 15$ and $e = 11$. Bob can then encode his message (say $m = 12$) by raising $m$ to the power of $e$. Thus, $c = m^e = 12^{11} = 743008370688 \equiv 3$ modulo 15. Alice can then recover $m = 12$ by raising $c = 3$ to the power of her private key $d$. $m \equiv c^d \equiv 3^3 \equiv 27 \equiv 12$ modulo $15$. + + +# Discussion + +Well if it's this simple to calculate, why is it secure? It is actually extremely difficult to factor a large prime number $n$. If $n$ can be factored into $p$ and $q$, then it is easy to compute $d \equiv e^{-1}$ modulo $\phi(pq)$. It is also really hard to efficiently solve for $m$ in the congruence $c \equiv m^e$ modulo $n$. RSA Laboratories on March 1991 issued a challenge tasking the public to calculate prime factors of $n$ (called RSA numbers) of increasing digits. They offered a cash prize of up to \$200,000 for solving RSA-2048 which is a 617 digit long number. As of the time of the presentation, the largest factored RSA number was RSA-768 (768 bits or 232 decimal digits) which was calculated over the span of two years. As of the time of this writing, towards the end of this year (2019) the largest known factored RSA number is actually RSA-240 (795 bits or 240 decimal digits). Currently the National Institute of Standards and Technology (NIST) recommends the use of 2048-bit keys for use in RSA. So for the time being, our communications are safe. + + diff --git a/content/blog/rsynckey.md b/content/blog/rsynckey.md new file mode 100644 index 0000000..9b9127c --- /dev/null +++ b/content/blog/rsynckey.md @@ -0,0 +1,28 @@ +--- +title: "Rsync with a Different Key" +date: 2019-07-06T09:20:05-04:00 +draft: false +--- + +To use Rsync with a different key, follow the command structure below. + +```bash +rsync -e "ssh -i $HOME/.ssh/key" user@hostname:/from/dir/ /to/dir/ +``` + +Though for syncing my local website to my VPS, I usually like having more options with my rsync command + +```bash +rsync -Paz --delete -e "ssh -i $HOME/.ssh/key" user@hostname:/from/dir/ /to/dir/ +``` + +Quick option definitions (from man page) + +| Option | Description | +| -------------- | ------------------------------------------------------------ | +| -e | Allows you to override the default shell used as the transport for rsync. Command line options are permitted after the command name. | +| -a, --archive | This is equivalent to -rlptgoD. It is a quick way of saying you want recursion and want to preserve almost everything (with -H being a notable omission). The only exception to the above equivalence is when --files-from is specified, in which case -r is not implied.
Note that -a does not preserve hardlinks, because finding multiply-linked files is expensive. You must separately specify -H. | +| -P | Equivalent to --partial --progress. Its purpose is to make it much easier to specify these two options for a long transfer that may be interrupted. | +| -z, --compress | Compress file data during the transfer | +| --delete | Delete extraneous files from dest dirs | + diff --git a/content/blog/scrcpy.md b/content/blog/scrcpy.md new file mode 100644 index 0000000..7f24d5b --- /dev/null +++ b/content/blog/scrcpy.md @@ -0,0 +1,27 @@ +--- +title: "Scrcpy" +date: 2020-01-09T21:36:30-05:00 +draft: false +images: [] +--- + +With [Scrcpy](https://github.com/Genymobile/scrcpy) you can control an Android device remotely! + +![1578623897330](/files/images/1578623897330.png) + +The `README` on the Github page has all the information you need though it boils down to a few simple steps. + +1. Install `scrcpy`. +```bash +sudo snap install scrcpy +``` +2. [Enable adb debugging](https://developer.android.com/studio/command-line/adb.html#Enabling) on your device +3. (Optional for remote capability) Enable adb over TCP/IP on your device +```bash +adb tcpip 5555 +``` +4. (Optional Continued) Connect to the device + ```bash + adb connect DEVICE_IP:5555 + ``` + 5. Run `scrcpy` \ No newline at end of file diff --git a/content/blog/screwuppresentations.md b/content/blog/screwuppresentations.md new file mode 100644 index 0000000..f2136c0 --- /dev/null +++ b/content/blog/screwuppresentations.md @@ -0,0 +1,124 @@ +--- +title: "Notes on '13 Ways Designers Screw Up Client Presentations'" +date: 2019-05-21T22:20:14-04:00 +draft: false +--- + +I watched a great talk by [Mike Monteiro](http://mikemonteiro.com/) recently called [13 Ways Designers Screw Up Client Presentations](https://www.youtube.com/watch?v=IXXKqwrEql4). You should really watch the talk but this post is just a quick summary of the points he got across in the presentation. + +## Intro + +You need to sell your work! Great work is worth nothing if you can't persuade the client it is good. + +Don't leave the selling to other people. That is your job. Every decision you make is backed by some data or experience. If you're not there, then you lose context and won't be there for feedback. + +On to the mistakes.... + +## 1. You are not there to be the client's friend + +You are there to solve the client's goal. Happiness is the side-effect of good design, not a goal. + +You are there to convince the client not to go down avenues that run counter to their goals. That's what they hired you for. You need to present yourself as the expert that they believed they hired. + +For example, your doctor needs to tell you if you have a cracked tooth. Do you think that they would hide this information from you because it might hurt your feelings? No, because it is their job to tell you this information. + +## 2. Not getting off your ass + +It should be obvious when you enter the room, who is in charge of the presentation. + +Confidence isn't about you feeling better, it is about your client feeling better. + +## 3. Starting with an apology + +Every time you apologize for something you are freaking the client out. No matter how much you hoped to present at the presentation, by the time you get to that room, you have the perfect amount of stuff. + +If you don't feel like the work is up to spec, cancel the presentation. Do not have a presentation of work you cannot stand behind. It is better to cancel than waste people's time. You can get away with this exactly once during a project. + +Your client probably works for somebody higher up, the minute you start apologizing to them, they imagine themselves apologizing to their boss! + +## 4. Not Setting the Stage Properly + +You have gathered busy people together, they probably have other things they can be doing, so let them know what this presentation is for. + +Let them know why they are a necessary and important part of this conversation. + +You need to address these two things at the beginning of the presentation + +1. Why are we here? + 1. Let them know what their roles are, why they are here, what you are going to show, and what you need from them. +2. When can we leave? + 1. Let them know what it takes for the goal of the meeting to be met. The minute you get it, the meeting is over. Never give a client time to unmake a decision, especially a decision in your favor. + +Once you have gotten what you need, keep quiet. Everything you do beyond that threatens to undo the victory you just got. + +## 5. Giving the Real Estate Tour + +You don't sell a house by talking about the sheetrock. You sell it by getting a buyer to picture themselves in the neighborhood, by picturing the kids in the playground, etc. + +You sell the benefits of the work, and you sell how the work matches the project goals. + +Every decision on that page should be made with the benefit of data and good research, but people make decisions based on stories. + +## 6. Taking Notes + +Find somebody else to take the notes. You are giving the presentation. + +## 7. Reading a Script + +You need to convince the client that you are excited about the product. + +"Without promotion something terrible happens.... Nothing" - PT. Barnum + +## 8. Getting Defensive + +You are not your work, and your work is not you. + +Your work is a product made to meet a client's goals. The client is free to criticize the work and is free to tell you whether they believe it has met the goals or not. You are free to present evidence to the contrary but not get hurt by the criticism. + +When the client starts critiquing the work listen to what they're saying, don't feel like you have to defend everything they're saying right then and there. You also don't have to promise them anything then and there, sometimes it's best to sit on it for a while. + +When a client is giving you feedback it is a great time to keep your mouth shut. + +## 9. Mentioning Typefaces + +Clients don't care about typefaces. You don't really want their input on this. Clients are uncomfortable in your field. The more you dive into these things, the more uncomfortable they're going to get. And it's going to look like you're inviting them to do your job for them. + +Stop asking for permission to do a job you were hired for. + +Their comfort zone is their business needs, which is great since you are never going to be an expert on their domain. Talk about your work in terms of their business and needs. + +## 10. Talking about how hard you worked + +You're not getting a grade on effort. + +If you do the work right, it will look like it was effortless. + +## 11. Reacting to questions as change requests + +"Why is this blue?" + +"Oh I can change it." + +Sometimes the client just has a question! They're just looking for your reasoning. + +## 12. Not guiding the feedback loop + +Most clients have no idea what kind of feedback you are looking for. They are not trained in your work. Anything that helps you do your job is part of your job. Know what you want before calling the presentation. + +Some suggestions: + +1. How well does this reflect your brand? +2. How well does this reflect your users' needs as we discussed in the research? +3. How well does this reflect your ad strategy? + +They're not going to give it to you unless you explicitly ask for it. + +## 13. Asking "Do you like it?" + +If it had a like button on it would you push it? + +All the work you and your team did went down the drain! The client is no longer looking at you as an expert. + +Every decision on the project has been made with the benefit of expertise and data and you just uttered the most subjective phrase. + +If you want to make your client's happy, make them successful. \ No newline at end of file diff --git a/content/blog/shutdownafterjob.md b/content/blog/shutdownafterjob.md new file mode 100644 index 0000000..4899a8f --- /dev/null +++ b/content/blog/shutdownafterjob.md @@ -0,0 +1,22 @@ +--- +title: "Shutdown After Job" +date: 2019-08-30T20:43:56-04:00 +draft: false +--- + +I'm back to running longer jobs as part of my research. If I run a task overnight, I want to conserve energy and not keep it running after I finish. I suppose this would also apply to cloud billing, you want it to do the job and then stop. + +This technique will require you to have sudo privileges on the machine. + +1. Change user to root. + +```bash +sudo su +``` + +2. Run job as regular user, write output to file, and then poweroff. + +```bash +su -u user task > output.txt && chown user:user output.txt && poweroff +``` + diff --git a/content/blog/simulators.md b/content/blog/simulators.md new file mode 100644 index 0000000..a3958e6 --- /dev/null +++ b/content/blog/simulators.md @@ -0,0 +1,15 @@ +--- +title: "Simulators" +date: 2019-07-01T22:22:29-04:00 +draft: false +--- + +Part of my job involves integrating multiple different sensors together to make a cohesive product. One thing that I appreciate about my current team, is the rich set of tooling built around the project. I am definitely learning a lot from this project. One thing I wanted to share was the use of *simulators*. + +Now since we're working with sensor data, it doesn't always make sense to need to be connected to a whole system. There's also the additional hassle of dealing with safety and working outside. So in order to do some programming and still be at ease that we didn't break anything, we make heavy use of simulators. + +Example: Have a GPS hooked up to your system? Well with a tool you can make waypoints and generate a file which you then feed in as a fake GPS device! + +Now when I say fake device, I don't mean I'm actually emulating the device on the machine. It's easier to have your device interfacers publish to the local network and have your other parts of the application subscribe to it. So in this case, you will just need to produce those messages directly. + +So in conclusion, I think this pattern will work well for my personal projects. It helps keep your code modular and easily testable! diff --git a/content/blog/sshconfig.md b/content/blog/sshconfig.md new file mode 100644 index 0000000..b1cf506 --- /dev/null +++ b/content/blog/sshconfig.md @@ -0,0 +1,16 @@ +--- +title: "SSH Config" +date: 2019-09-27T22:46:39-04:00 +draft: false +--- + +Have you ever gone through the hassle of having multiple public/private keys for accessing your remote servers? Before recently, I used to specify the identity file in all my transactions `ssh -I ~/.ssh/private_key user@host` but no longer! I discovered you can add the following to your `~/.ssh/config` to specify which key you want to use! + +``` +Host someaddress + Hostname someaddress + user usernameonserver + IdentityFile ~/.ssh/private_key +``` + +Of course you can add multiple of these entries in that file so that you can `ssh` without having to worry about explicitly using keys. \ No newline at end of file diff --git a/content/blog/sshlocalportforwarding.md b/content/blog/sshlocalportforwarding.md new file mode 100644 index 0000000..9bf4c2d --- /dev/null +++ b/content/blog/sshlocalportforwarding.md @@ -0,0 +1,19 @@ +--- +title: "SSH Local Port Forwarding" +date: 2019-08-06T16:50:00-04:00 +draft: false +--- + +There are some services that I don't want to run all the time which makes me not want to open a port for it. One good example of this is [Jupyter Notebooks](https://jupyter.org/). Therefore, what I sometimes do is run it locally and forward the port so that another machine can access it. + +Example command: + +```bash +ssh -L 8888:localhost:8888 -N 192.168.0.2 +``` + +The `-L` flag allows you to specify the `localsocket:host:remotesocket`. + +`-N` makes it so that it doesn't execute any additional commands + +Then finally you put the address of the machine you wish to connect to. diff --git a/content/blog/systemdstartup.md b/content/blog/systemdstartup.md new file mode 100644 index 0000000..3a783b4 --- /dev/null +++ b/content/blog/systemdstartup.md @@ -0,0 +1,23 @@ +--- +title: "Analyzing Startup Times with Systemd" +date: 2019-12-26T22:52:59-05:00 +draft: false +images: [] +--- + +Startup times feeling slow? Check to see if there are any uneeded services slowing you down! + +To see how long it takes to bootup + +```bash +systemd-analyze +``` + +To see the length of time each service took to initialize + +```bash +systemd-analyze blame +``` + +Then you can `disable` any services that you don't need. + diff --git a/content/blog/systemdwithpythonenvs.md b/content/blog/systemdwithpythonenvs.md new file mode 100644 index 0000000..80e77ca --- /dev/null +++ b/content/blog/systemdwithpythonenvs.md @@ -0,0 +1,29 @@ +--- +title: "Systemd with Python environments" +date: 2019-08-25T20:04:20-04:00 +draft: false +--- + +It took me some time to realize why I couldn't start a project during startup. I then realized that it was because I was using a python virtual environment and didn't tell systemd about it. + +Here's how you can do so... + +```yaml +[Unit] +Description=Start Service +# After=network.target # If you want a python webserver... + +[Service] +Type=Simple +User=brandon +WorkingDirectory=/home/brandon/Development +ExecStart=/bin/sh -c ". /home/brandon/Development/pythonenv/bin/activate; /home/brandon/Development/start" + +[Install] +WantedBy=multi-user.target +``` + + + + + diff --git a/content/blog/tempresolve.md b/content/blog/tempresolve.md new file mode 100644 index 0000000..2fa1a7f --- /dev/null +++ b/content/blog/tempresolve.md @@ -0,0 +1,24 @@ +--- +title: "Temporarily Resolving Hostnames" +date: 2020-01-04T21:26:16-05:00 +draft: false +images: [] +--- + +Let's say that we're testing a webserver where the pages served depended on a domain that you don't own. The most common way I know to test this is to modify your `/etc/hosts` file to contain the hostname and ip address you want to map it to. + +``` +192.168.1.2 custom.domain +``` + +I've recently discovered that the command line utility `curl` has a quick and easy option to forge the hostname of a request. + +```bash +curl --resolve domain:port:ipaddr url +``` + +There are also browser extensions that you can use such as [LiveHosts](https://github.com/Aioros/livehosts) to get around this as well. This post isn't entirely useful when talking about permanent services. + +If this is going to be a publicly facing service, then you should just set the records of your domain name to point to the server. + +If it's a non-public routable service, then perhaps try looking into setting up your own private [dns server](https://brandonrozek.com/blog/coredns/). \ No newline at end of file diff --git a/content/blog/tensorboard.md b/content/blog/tensorboard.md new file mode 100644 index 0000000..749ae19 --- /dev/null +++ b/content/blog/tensorboard.md @@ -0,0 +1,6 @@ +--- +title: "Tensorboard" +date: 2019-05-26T19:04:47-04:00 +draft: true +--- + diff --git a/content/blog/togglingxinput.md b/content/blog/togglingxinput.md new file mode 100644 index 0000000..65c9439 --- /dev/null +++ b/content/blog/togglingxinput.md @@ -0,0 +1,30 @@ +--- +title: "Toggling X Input" +date: 2020-01-07T20:46:32-05:00 +draft: false +images: [] +--- + +On X, we can easily enable or disable input devices using the `xinput` command. This is a great use case when you're tired of accidentally hitting the red Thinkpad nub or having your palm be recognized when drawing with a pen. + +Running the `xinput` command performs the action temporarily. Your default settings will be restored upon a reboot. + +To list `xinput` devices run: + +```bash +xinput +``` + +To disable a device: + +```bash +xinput disable [id] +``` + +To enable a device: + +```bash +xinput enable [id] +``` + +The ids are listed when you list the devices. \ No newline at end of file diff --git a/content/blog/traefiknginx.md b/content/blog/traefiknginx.md new file mode 100644 index 0000000..4c51c73 --- /dev/null +++ b/content/blog/traefiknginx.md @@ -0,0 +1,70 @@ +--- +title: "Traefik & Nginx" +date: 2019-12-16T19:55:47-05:00 +draft: false +images: [] +--- + +I've been enjoying Traefik for its auto-discovery of containers. The only problem is that for a couple containers such as Plex and HomeAssistant I have host networking enabled. This usually results in Traefik failing to forward the traffic properly. + +Having more fine grained control is exactly what Nginx is for! I don't want to switch my whole setup to Nginx since that would be a lot of configuration files for every docker container. But I think having configuration files for containers that use host networking is manageable. + +In your docker-compose file first make sure that Traefik is disabled for containers that use host networking by adding the label `traefik.enable=false` + +```yaml + homeassistant: + image: homeassistant/home-assistant + container_name: homeassistant + hostname: homeassistant + network_mode: host + environment: + - PUID=1000 + - PGID=1000 + volumes: + - /Volumes/homeassistant/config:/config + restart: always + labels: + - traefik.enable=false +``` + +Then add a new section for `nginx` adding the domains that you wish it to manage in the labels + +```yaml +nginx: + image: linuxserver/nginx + container_name: nginx + environment: + - PUID=1000 + - PGID=1000 + volumes: + - /Volumes/nginx/config:/config + restart: always + labels: + - traefik.http.routers.my-container.rule=Host(`plex.example.com`,`homeassistant.example.com`) +``` + +Now on the host system add the configuration files for nginx to consume. Example: + +```nginx +server { + listen 80; + listen [::]:80; + + server_name plex.example.com; + + location / { + proxy_pass http://homelanip:32400; + proxy_http_version 1.1; + proxy_set_header Upgrade $http_upgrade; + proxy_set_header Connection 'upgrade'; + proxy_set_header Host $host; + proxy_cache_bypass $http_upgrade; + } +} +``` + +Similarly add a configuration file for `homeassistant` or any other service you have. + +Now for this example, the subdomains `plex.example.com` and `homeassistant.example.com` are managed by Nginx. + +To finish it off, `docker-compose start nginx`. diff --git a/content/blog/unattended-upgrades.md b/content/blog/unattended-upgrades.md new file mode 100644 index 0000000..01eeaaf --- /dev/null +++ b/content/blog/unattended-upgrades.md @@ -0,0 +1,11 @@ +--- +title: "Unattended Upgrades" +date: 2019-05-26T12:52:03-04:00 +draft: false +--- + +I'm a big believer of reducing maintenance. One of the things that I didn't bother setting up before but should've is *unattended upgrades*. The benefits of this is that you don't have to repeatedly log into your sever to upgrade your system. + +Why bother managing your own server in the first place? Well with a virtualized system you can set up any type of application that you like. You're not limited to only hosting static sites or whatever applications the C-Panel instance allows. + +Now there's no need for me to reiterate what's been done before, so here's a [useful post from libre-software](https://libre-software.net/ubuntu-automatic-updates/) describing how to set it up so that a Ubuntu server updates itself automatically. \ No newline at end of file diff --git a/content/blog/usbredirection.md b/content/blog/usbredirection.md new file mode 100644 index 0000000..de989b5 --- /dev/null +++ b/content/blog/usbredirection.md @@ -0,0 +1,9 @@ +--- +title: "Wacom and USB Redirection in Virtual Machines" +date: 2019-05-24T22:15:56-04:00 +draft: false +--- + +[Virt-Manager](https://virt-manager.org/) is a great tool for managing virtual machines under Linux. Today I learned of [Spice USB redirection](https://blog.wikichoon.com/2014/04/spice-usb-redirection-in-virt-manager.html). Essentially it allows you to switch USB devices from the host to the virtualized environment. This came in handy when I noticed that the graphics tablet device was not able to do pressure sensitivity on the Windows guest. + +To achieve this goal, I removed the graphics tablet hardware device and manually redirected that USB device to the guest. I then remembered to install the [Wacom drivers](https://www.wacom.com/en-us/support/product-support/drivers) for the Windows VM. \ No newline at end of file diff --git a/content/blog/videosandgifs.md b/content/blog/videosandgifs.md new file mode 100644 index 0000000..00a604e --- /dev/null +++ b/content/blog/videosandgifs.md @@ -0,0 +1,22 @@ +--- +title: "Videos and GIFs" +date: 2019-12-04T10:13:35-05:00 +draft: false +images: [] +--- + +I like using GIFs in Google Slides because it doesn't require any interaction to start playing right away. Therefore, I looked at a couple resources to add a GIF from a video into my presentation. Of course this is all using one of my favorite terminal tools `ffmpeg`. + +First of all, I wanted to include a video of a bot playing Pong. The video was a little long, so I decided speed it up for a more time-lapse type feel. + +[From the FFMPEG website](https://trac.ffmpeg.org/wiki/How%20to%20speed%20up%20/%20slow%20down%20a%20video): To 10x the speed `ffmpeg -i input.mkv -filter:v "setpts=0.1*PTS" output.mkv` + +You just need to replace the `0.1` with the appropriate decimal number to change the speed. + +Giphy has a great [writeup](https://engineering.giphy.com/how-to-make-gifs-with-ffmpeg/) describing the commands to use in order to make your GIF look nice. + +```bash +ffmpeg -i inputvideo.mp4 -filter_complex "[0:v] palettegen" palette.png +ffmpeg -i inputvideo.mp4 -i palette.png -filter_complex "[0:v][1:v] paletteuse" output.gif +``` + diff --git a/content/blog/virtualdisks.md b/content/blog/virtualdisks.md new file mode 100644 index 0000000..e200e75 --- /dev/null +++ b/content/blog/virtualdisks.md @@ -0,0 +1,84 @@ +--- +title: "Virtual Disks" +date: 2020-01-06T22:26:58-05:00 +draft: false +images: [] +--- + +Have you wanted to [play with ZFS](https://wiki.archlinux.org/index.php/ZFS/Virtual_disks) or any other filesystem without creating a dedicated partition or device? We can do this through virtual disks! + +First, we need to create a [sparse file](https://en.wikipedia.org/wiki/Sparse_file) called `scratch.img` with some max capacity. Let's say 2G. + +```bash +truncate -s 2G $HOME/scratch.img +``` + +Now the file is only sparse, if your filesystem supports it. To see, run `du -sh $HOME/scratch.img`. If it says that the size is `0` then your filesystem supports sparse files. Otherwise it does not. + +Then, we can format the file with any filesystem we will like. One popular tool is `mkfs` which depending on your operating system can support [`bfs`](https://en.wikipedia.org/wiki/Be_File_System), [`cramfs`](https://en.wikipedia.org/wiki/Cramfs), [`ext2`](https://en.wikipedia.org/wiki/Ext2), [`ext3`](https://en.wikipedia.org/wiki/Ext3), [`ext4`](https://en.wikipedia.org/wiki/Ext4), [`fat`](https://en.wikipedia.org/wiki/File_Allocation_Table), [`minix`](https://en.wikipedia.org/wiki/MINIX_file_system), `msdos`, [`ntfs`](https://en.wikipedia.org/wiki/NTFS), [`vfat`](https://en.wikipedia.org/wiki/File_Allocation_Table#VFAT), [`reiserfs`](https://en.wikipedia.org/wiki/ReiserFS), etc. + +To format with `ext4`, + +```bash +mkfs -t ext4 $HOME/scratch.img +``` + +Then we can create the mount-point `/mnt/scratch` and mount `scratch.img` to it. + +```bash +sudo mkdir /mnt/scratch +sudo mount -t auto -o loop $HOME/scratch.img /mnt/scratch +``` + +With this, we now have a mounted `ext4` filesystem on `/mnt/scratch`. `cd` into it and have a blast! + +## Resizing the Virtual Disk + +To resize the virtual disk, we will first need to unmount the virtual disk so we don't create inconsistencies. + +```bash +sudo umount /mnt/scratch +``` + +Now we can extend or shrink the drive with `truncate`. + +Extend by 1G: `truncate -s +1G $HOME/scratch.img` + +Shrink by 1G: `truncate -s -1G $HOME/scratch.img` + +Check the filesystem to make sure that no inconsistencies occured. With `ext(2/3/4)` we can do this with the `e2fsck` command. + +```bash +e2fsck $HOME/scratch.img +``` + +Then we need to tell the filesystem to resize itself. For `ext(2/3/4)` you can do this with the `resize2fs` command. + +```bash +resize2fs $HOME/scratch.img +``` + +Now the virtual disk is successfully resized! We can mount it back with the previous mount command. + +```bash +sudo mount -t auto -o loop $HOME/scratch.img /mnt/scratch +``` + +## Removing the Virtual Disk + +To remove the virtual disk, we first need to unmount the virtual drive + +```bash +sudo umount /mnt/scratch +``` + +Then we can remove the mount-point and file. + +```bash +sudo rm -r /mnt/scratch +rm $HOME/scratch.img +``` + +## Conclusion + +With virtual disks we can experiment with different types of filesystems and perhaps try out snapshotting in supported filesystems. If we create virtual disks on [`tmpfs` ](/blog/lxdtmpfs/), then we can have a super fast file system as well! \ No newline at end of file diff --git a/content/blog/virtualenv.md b/content/blog/virtualenv.md new file mode 100644 index 0000000..68b1453 --- /dev/null +++ b/content/blog/virtualenv.md @@ -0,0 +1,42 @@ +--- +title: "Python Virtual Environments" +date: 2019-05-21T23:04:54-04:00 +draft: false +--- + +Dependency management is hard. Luckily with Python there is a program called `virtualenv` that can help isolate different projects and manage dependencies. + +## Commands + +To create a new python 3.7 environment type in the following: + +```bash +virtualenv --python=python3.7 environment_name +``` + +Of course you can replace the python version with whichever version you like. Now to go into the environment do the following: + +```bash +source environment_name/bin/activate +``` + +This now sets up your python interpretor and other utilities to use the installation in the `environment_name` folder. You can now install python packages using `pip` and have it only reside in this environment. + +To save all currently installed packages into `requirements.txt`: + +```bash +pip freeze > requirements.txt +``` + +You can then install those packages in a different virtualenv session with: + +```bash +pip install -r requirements.txt +``` + +You can leave the virtualenv session with: + +```bash +deactivate +``` + diff --git a/content/blog/virtualizingwithclonezilla.md b/content/blog/virtualizingwithclonezilla.md new file mode 100644 index 0000000..f7b0ba3 --- /dev/null +++ b/content/blog/virtualizingwithclonezilla.md @@ -0,0 +1,11 @@ +--- +title: "Virtualizing Environments with Clonezilla" +date: 2019-08-25T20:09:28-04:00 +draft: false +--- + +[Clonezilla](https://clonezilla.org/) advertises itself as a disk cloning and backup utility. I've been starting to think of it as a little more than that. Let's say that you go to a client site and they have a machine in production. Instead of messing around with their machine, you make a Clonezilla copy of it. You can then take it back and place it on a computer you're not using to play around with it. + +Now even better, instead of using bare metal, what if you virtualize it? It's essentially the same process as putting it on baremetal, except now you have a virtual copy that you can make clones of, backup, etc. + +Now if the OS is looking for hardware that doesn't exist, that might make life a bit harder.... \ No newline at end of file diff --git a/content/blog/virtuallivecd.md b/content/blog/virtuallivecd.md new file mode 100644 index 0000000..1f684e1 --- /dev/null +++ b/content/blog/virtuallivecd.md @@ -0,0 +1,45 @@ +--- +title: "Playing with Live CDs" +date: 2020-01-12T22:45:06-05:00 +draft: false +images: [] +--- + +I was curious on how Lubuntu 19.10 looked but I didn't feel like rebooting my computer and loading into a new ISO. Luckily there is a nice easy way to play around with live CDs. + +Here's the command + +```bash +virt-install --name=Lubuntu \ + --nodisks --livecd \ + --graphics spice \ + --vcpu=4 \ + --ram=4096 \ + --os-type=linux \ + --sound \ + --accelerate \ + --cdrom=$HOME/Downloads/lubuntu-19.10-desktop-amd64.iso +``` + +The arguments mean the following + +| Argument | Meaning | +| ---------- | ------------------------------------------------------------ | +| nodisks | No storage disks are created | +| livecd | Set the boot to the cdrom after installation | +| graphics | Sets the graphics mode | +| vcpu | Number of virtual CPUs | +| RAM | Size of RAM | +| os-type | Linux/Windows/etc. | +| sound | Attach a virtual audio device | +| accelerate | Make use of the KVM or KQEMU kernel acceleration capabilities if available. | +| cdrom | Location of ISO | + +Once you run this command once, the image is "installed". This means that we can easily access it in the future with the following commands + +```bash +virsh start Lubuntu +virt-viewer Lubuntu +``` + +![1578887790276](/files/images/1578887790276.png) \ No newline at end of file diff --git a/content/blog/vncsetup.md b/content/blog/vncsetup.md new file mode 100644 index 0000000..d488d43 --- /dev/null +++ b/content/blog/vncsetup.md @@ -0,0 +1,23 @@ +--- +title: "VNC Setup" +date: 2019-05-24T23:21:43-04:00 +draft: false +--- + +I mostly following this [Digital Ocean Tutorial](https://www.digitalocean.com/community/tutorials/how-to-install-and-configure-vnc-on-ubuntu-18-04) on getting a working VNC setup on my desktop computer. There is one main difference on my end since I use KDE. I edited the `/home/$USER/.vnc/xstartup` file to appear as + +```bash +#!/bin/sh +unset SESSION_MANAGER +unset DBUS_SESSION_BUS_ADDRESS +dbus-launch --exit-with-session startkde +``` + +And I added the following script to make my life easier + +```bash +#!/bin/bash +ssh -L 5901:127.0.0.1:5901 -C -N -l rozek 192.168.0.104 & +krdc vnc://127.0.0.1:5901 +``` + diff --git a/content/blog/whyzeromq.md b/content/blog/whyzeromq.md new file mode 100644 index 0000000..2196f75 --- /dev/null +++ b/content/blog/whyzeromq.md @@ -0,0 +1,62 @@ +--- +title: "Why ZeroMQ" +date: 2019-06-16T19:26:50-04:00 +draft: false +--- + +I've been playing around with ZeroMQ recently and it's been really exciting. This blog post is going to outline why I think you should be using ZeroMQ today. + +First of all, before you compare this to other products like RabbitMQ, DDS, etc. Realize that this is a static library that you link to in your application as opposed to a broker you run. This means that you can get the benefits with this library for very little overhead. + +## Easier Sockets + +Instead of talking about how easy ZeroMQ is to use, I'm going to just show you the code to implement a server-client relationship in Python. + +**Server.py** + +```python +import zmq +import time + +port = "5556" +context = zmq.Context() +socket = context.socket(zmq.REP) +socket.bind("tcp://*:%s" % port) + +while True: + msg = socket.recv() + print(msg) + time.sleep(1) + socket.send_string("Server Message To Client") +``` + +**Client.py** + +```python +import zmq +import time + +port = "5556" +context = zmq.Context() +socket = context.socket(zmq.REQ) +socket.connect("tcp://localhost:%s" % port) + +while True: + socket.send_string("client message to server") + time.sleep(1) + msg = socket.recv() + print(msg) + +``` + +And just like that we have a way to transport messages back and forth. No need to make a special header before each message to know the appropriate size of the packets. ZeroMQ abstracts those details from you. + +## Different Transports Available + +You're not limited to only `TCP`. You can use `inproc` for thread-to-thread messaging, `ipc` for inter-process communication, and `epgm` or `pgm` for multicast messaging. Most of the time, just changing the connection string in `socket.connect` just works! + +## Common Networking Patterns Built In + +Sometimes we just want a dumb pipe between two ends (`pipe`) but most of the times we're writing applications that follow the `server-client` or `publisher-subscriber` architecture. That gets defined in `context.socket`. + +Ex: `context.socket(zmq.PAIR)` \ No newline at end of file diff --git a/content/blog/wireguardvpn.md b/content/blog/wireguardvpn.md new file mode 100644 index 0000000..af91c76 --- /dev/null +++ b/content/blog/wireguardvpn.md @@ -0,0 +1,103 @@ +--- +title: "Wireguard VPN" +date: 2019-11-20T20:09:59-05:00 +draft: false +--- + +Having some sort of VPN solution has always been a necessity for me. Whether it's back in the day where LAN games where the rage and I wanted to play it with my distant friends, or nowadays when I need to be able to access my Desktop running simulations behind my home LAN. + +This blog post is going to describe how I settled on Wireguard VPN as my preferred solution and how I use it to create a small secured network. + +Keep note that I am not talking about a VPN that masks your internet traffic. For that, look up a VPN provider such as Private Internet Access or ProtonVPN. + +## About Wireguard + +Wireguard is a point-to-point protocol. This means that you will be exchanging public and private keys between two clients and only those two clients will communicate with one another. + +In a way this makes it a lot simpler than other VPN solutions like OpenVPN where you have to set up a key server. That doesn't mean, however, that we cannot build upon this concept to create a secure network. + +Now in order to create this network, we'll need at least one publicly accessible through the Internet computer. I use a VPS instance on [DigitalOcean](https://www.digitalocean.com/) to act as my *server*. + +## Key Generation + +First you'll want to get [Wireguard installed](https://www.wireguard.com/install/), and then create public-private keys for both the *server* and the *client* computers. + +**On each machine:** + +```bash +cd /etc/wireguard +sudo umask 077 +sudo wg genkey | tee privatekey | wg pubkey > publickey +``` + +**On the server:** + +Edit `/etc/wireguard/wg0.conf` + +```yaml +[Interface] +Address = 10.10.100.1/24 +SaveConfig = false +ListenPort = 51826 +PrivateKey = + +[Peer] +PublicKey = +AllowedIPs = 10.10.100.2/32 + +[Peer] +PublicKey = +AllowedIPs = 10.10.100.3/32 +``` + +You might be wondering why we have `/24` in the Address field but `/32` in the AllowedIPs field. + +This is because we want our address to be in the `/24` subnet, but we only want that specific IP to be able to connect via that specific public key. + +Warning: Make sure you have 51826 open on your firewall. + +Now to have your server route traffic between the different clients connected to it, you need to enable IPv4 forwarding. + +*For current session:* + +```bash +sysctl -w net.ipv4.ip_forward=1 +``` + +*For persistence across reboots:* + +Edit `/etc/sysctl.d/99-sysctl.conf` to make sure `net.ipv4.ip_forward=1` + +**On the client machines:** + +Edit `/etc/wireguard/wg0.conf` + +```yaml +[Interface] +Address = 10.10.100.x/32 +PrivateKey = +PostUp = ping -c1 10.10.100.1 +DNS = 10.10.100.y # Include only if relevant + +[Peer] +PublicKey = +Endpoint = public_ip_or_domain:51826 +AllowedIPs = 10.10.100.0/24 +PersistentKeepalive = 21 +``` + +Replace `x` with a unique value per client. This configuration file has the client establish a connection to the server, send a packet via ping to initiate the connection and then try to persistently keep it alive. + +The DNS server is helpful if you have a DNS server running in that private network to access local resources. If you don't have an existing DNS server in the network, do not include that line. Also if you receive any errors in the future, you might need to make sure `resolvconf` is a command on your system. + +**On all machines:** + +Have the wireguard service start at boot + +```bash +sudo systemctl enable wg-quick@wg0 +sudo systemctl start wg-quick@wg0 +``` + +And enjoy a fully secure routable network! + diff --git a/content/blog/wormhole.md b/content/blog/wormhole.md new file mode 100644 index 0000000..bed32ca --- /dev/null +++ b/content/blog/wormhole.md @@ -0,0 +1,23 @@ +--- +title: "Wormhole" +date: 2019-11-20T21:21:23-05:00 +draft: false +--- + +A dead simple way to send files between two linux machines not on the same network is to use a utility called [Magic Wormhole](https://github.com/warner/magic-wormhole). It is typically included in the standard repositories and is so simple the this blog post is going to end soon. + +**Send a file:** + +```bash +wormhole send filename +``` + +This will generate a code for you to share like `6-speculate-allow` + +**Receive a file:** + +```bash +wormhole receive 6-speculate-allow +``` + +Done. diff --git a/content/blog/xephyr.md b/content/blog/xephyr.md new file mode 100644 index 0000000..f32fe08 --- /dev/null +++ b/content/blog/xephyr.md @@ -0,0 +1,55 @@ +--- +title: "Nested X Sessions with Xephyr" +date: 2019-12-25T00:52:02-05:00 +draft: false +images: [] +--- + +The X Window System was designed at a time when applications that ran on your computer were assumed to be trusted. Therefore there are minimal restrictions in place to prevent applications from grabbing images of whats on another applications screens. This feature as you might imagine is quite useful for screen clipper applications. + +Now I know that we're slowly moving towards Wayland on the Linux desktop, but X11 is still a reality even in my KDE Neon version that's based on Ubuntu 18.04. + +So in the meantime, we can put our untrusted applications into a nested X server using `Xephyr`. + +First, we need to find an empty display variable. Chances are this would be `:1` for you. Though if you have multiple of these nested X-sessions running, then this script will be handy. + +```bash +for ((DNum=1 ; DNum <= 100 ; DNum++)) ; do + [ -e /tmp/.X11-unix/X$DNum ] || break +done +``` + +At the end, `DNum` will be set to an empty display variable. + +Then to start your nested X session, + +```bash +Xephyr :$DNum \ + -extension MIT-SHM \ + -extension XTEST \ + -nolisten tcp \ + -screen 1920x1080 \ + -resizeable & +``` + +If we're going to be using this nested X server for one application, then I recommend using the `ratpoison` window manager as it will make the application full screen and supports the reizability of the Xephyr window. + +```bash +ratpoison -d :$DNum & +``` + +Finally, you should set your display variable so that any future GUI applications you execute from the terminal will show up in your new Xephyr window. + +```bash +DISPLAY=:$DNum +``` + +Now if you want to run multiple applications, you're likely better off using your native window manager. + +```bash +# Set the display before starting the window manager +DISPLAY=:$DNum +x-window-manager & +``` + +Of course you can replace ratpoison and your native x-window manager with any other window manager of your choice. It actually makes it a great way to test different environments. \ No newline at end of file diff --git a/content/blog/xpra.md b/content/blog/xpra.md new file mode 100644 index 0000000..829db2c --- /dev/null +++ b/content/blog/xpra.md @@ -0,0 +1,58 @@ +--- +title: "xpra" +date: 2020-01-15T18:29:57-05:00 +draft: false +images: [] +--- + +[`xpra`](http://xpra.org/) allows one to run persistent X applications on a remote host and display it on a local machine. It's a combination of [SSH X11 Forwarding](https://wiki.archlinux.org/index.php/OpenSSH#X11_forwarding) and [Screen](https://www.gnu.org/software/screen/). + +To get started you need to install the `xpra` package on both the server and client. On Ubuntu 18.04, this package isn't configured properly so one should use this PPA instead. + +```bash +sudo add-apt-repository ppa:mikhailnov/xpra +``` + +To install, + +```bash +sudo apt install xpra +``` + +Now you can from the client open up an application with one command + +```bash +xpra start ssh:user@host --exit-with-children --start-child="executable" +``` + +If you want it to behave more like screen. Then on the server. + +```bash +xpra start :100 +``` + +Where you can replace `:100` with another high display number. + +Then you can run the executable, + +```bash +DISPLAY=:100 executable +``` + +From the client, + +```bash +xpra attach ssh:user@host:100 +``` + +`xpra` has heuristics that determines the encoding of the images passed. You can however override it using the `--encoding`s flag to better tailor to your needs. + +- `rgb`: Raw pixel format that is lossless and uses compression. Best in high bandwidth environments. +- `png` compressed, lossless, but CPU intensive. May result in skipped frames +- `h264`, `vp8`, `vp9` are lossy formats that have tunable quality and speed parameters + + +More resources: +- [Arch Wiki](https://wiki.archlinux.org/index.php/Xpra) +- [Ubuntu Wiki](https://help.ubuntu.com/community/Xpra) + diff --git a/content/blog/yubikey.md b/content/blog/yubikey.md new file mode 100644 index 0000000..8cd53f1 --- /dev/null +++ b/content/blog/yubikey.md @@ -0,0 +1,14 @@ +--- +title: "YubiKey" +date: 2019-07-07T14:31:47-04:00 +draft: false +--- + +The YubiKey is a hardware authentication device manufactured by Yubico. It is a write only device that is meant to hold various authentication keys. The fact that it is write only means that people can't duplicate these keys. [Noah Chelliah](https://twitter.com/kernellinux) from Altispeed says that he uses YubiKeys at his company so that when employees moves on from his company he only needs to take their YubiKey. + +Now I don't manage any infrastructure larger than a couple computers, so why are these things interesting from a home use perspective? Well it allows you to have two-factor authentication separate from your smart phone. I was never a large fan of using my cell phone for two factor since you usually change cell phones every couple years. + +What I wanted to highlight is how easy it is to integrate it with Linux. The Pluggable Authentication Module (PAM) is responsible for authentication and other various utilities in Linux. By adding a couple of lines to a couple of text files, you can add two-factor authentication to your laptop! + +Instead of rewriting a bunch of instructions I got from somewhere else, I'll direct you to Yubico's own [documentation entry](https://developers.yubico.com/yubico-pam/Authentication_Using_Challenge-Response.html). Happy hacking! + diff --git a/content/community.md b/content/community.md new file mode 100644 index 0000000..c854e93 --- /dev/null +++ b/content/community.md @@ -0,0 +1,22 @@ +--- +title: Community +description: Various groups and activities that I participate in +--- + +## ./UMWLUG +I was the co-founder and vice president of UMW's Linux Users Group. I mainly brought interesting people to come and talk about Linux and open source. + +[Main Website](https://umwlug.github.io/) + +[My Records](umwlug) + +## Cybersecurity - Capture the Flag +Capture the Flag (CTF) is a competition in where teams try to find *flags* by doing different types of cybersecurity type problems. This can include using the wayback machine, breaking a simple cryptosystem, as well as finding exploits in a sandboxed system. + +I was part of a committee of four people making problems for UMW's first CTF competition. + +If you're interested in this sort of thing and just starting out, one website that I found which is really cool is called [OverTheWire](https://overthewire.org/wargames/bandit/). + +## Datakind + +In the summer of 2018, I attended the month Datakind events in DC. In it, I mostly performed data cleaning and verification for non-profit organizations in the area. diff --git a/content/community/_index.md b/content/community/_index.md new file mode 100644 index 0000000..e69de29 diff --git a/content/community/umwlug.md b/content/community/umwlug.md new file mode 100644 index 0000000..4ac7145 --- /dev/null +++ b/content/community/umwlug.md @@ -0,0 +1,32 @@ +--- +title: ./UMWLUG +description: My involvement in UMW's Linux Users Group +--- + +## Sweet Logo Designs + +I have a small amount of pride in the logos I made for this group. Check them out! + +[Light Theme Logo](/files/umwlug/logo.pdf) + +[Dark Theme Logo](/files/umwlug/darklogo.pdf) + +## Events Organized +I helped organize a variety of different events while I was part of the group, below are the link to the fliers I designed for them: + +[Cybersecurity: The Art of Analyzing, Protecting, and Defending your Network](/files/umwlug/tedtalk.pdf) + +[Fall 2019 Interest Meeting](/files/umwlug/interestfall2019.pdf) + +[How I Get Paid to Write Free Software](/files/umwlug/petertalk.pdf) + +[Spring 2019 Interest Meeting](/files/umwlug/interestspring2019.pdf) + +[Linux Audio Workshop](/files/umwlug/audio.pdf) + +[Fall 2018 Interest Meeting](/files/umwlug/interestfall2018.pdf) + +[Linux/Unix: Why are they related, but not the same](/files/umwlug/linuxvunix.pdf) + +[Spring 2018 Interest Meeting](/files/umwlug/interestspring2018.pdf) + diff --git a/content/notes.md b/content/notes.md new file mode 100644 index 0000000..281baaf --- /dev/null +++ b/content/notes.md @@ -0,0 +1,26 @@ +--- +title: Notes +description: Documents pertaining to courses I've taken +--- + +# Courses + +Below are the courses that I have documents up online for. + +[Probability and Statistical Inference I](stat381) + +[Real Analysis Quick Facts](realanalysis) + +[Some Abstract 2 Definitions](abstract2def) + +[Handy Facts about Quadratic Congruences](quadraticcongruences) + +## Coursera Courses +Occassionally during breaks, I like to take some coursera courses. I will post my notes from the lecture here as well. + +[Bayesian Statistics](bayesianstatistics) + +[Reproducible Research](reproducibleresearch) + +## Self/Small Group Study +Chris Richters, Ethan Martin, and I embarked on the book ["Algorithms" by Jeff Erickson](http://jeffe.cs.illinois.edu/teaching/algorithms/). I took some notes during our discussions but you should really just read the book instead. [Notes Page](algorithms) diff --git a/content/notes/.Stat381.md.swp b/content/notes/.Stat381.md.swp new file mode 100644 index 0000000..fb7c6e9 Binary files /dev/null and b/content/notes/.Stat381.md.swp differ diff --git a/content/notes/_index.md b/content/notes/_index.md new file mode 100644 index 0000000..e69de29 diff --git a/content/notes/abstract2def.md b/content/notes/abstract2def.md new file mode 100644 index 0000000..d3a8009 --- /dev/null +++ b/content/notes/abstract2def.md @@ -0,0 +1,73 @@ +# Abstract Algebra 2 Definitions + +## Chapter 17 + +By a **ring** we mean a set $A$ with operations called addition and multiplication which satisfy the following axioms: + +- $A$ with addition alone is an abelian group +- Multiplication is associative +- Multiplication is distributive over addition + +Since $\langle A, + \rangle$ is an abelian group, there is in $A$ a neutral element for addition. This is called the **zero** element. Also, every element has an additive inverse called its **negative**. + +If multiplication in a ring $A$ is commutative then we say that $A$ is a **commutative ring**. + +If a ring $A$ has a neutral element for multiplication then we say that the neutral element is the **unity** of $A$. + +If $A$ is a ring with unity, there may be elements in $A$ which have a multiplicative inverse. Such elements are said to be **invertible**. + +If $A$ is a commutative ring with unity in which every nonzero element is invertible, then $A$ is called a **field**. + +In any ring, a nonzero element $a$ is called a **divisor of zero** if there is a nonzero element $b$ in a ring such that the product $ab$ or $ba$ is equal to zero. + +An **integral domain** is defined to be a commutative ring with unity that has the cancellation property. Another way of saying this is that an integral domain is a commutative ring with unity and has no zero divisors. + +## Chapter 18 + +Let $A$ be a ring, and $B$ be a nonempty subset of $A$. $B$ is called a **subring** if it satisfies the following properties: + +- Closed with respect to addition +- Closed with respect to negatives +- Closed with respect to multiplication + +Let $B$ be a subring of $A$. We call $B$ an **ideal** of $A$ if $xb, bx \in B$ for all $b \in B$ and $x \in A$. + +The **principle ideal generated by $a$**, denoted $\langle a \rangle$ is the subring defined by fixing an element $a$ in a subring $B$ of $A$ and multiplying all elements of $A$ by $a$. +$$ +\langle a \rangle = \{ xa : x \in A \} +$$ +A **homomorphism** from a ring $A$ to a ring $B$ is a function $f : A \to B$ satisfying the identities: +$$ +f(x_1 + x_2 ) = f(x_1) + f(x_2) \\ +f(x_1x_2) = f(x_1)f(x_2) +$$ +If there is a homomorphism from $A$ onto $B$, we call $B$ a **homomorphic image** of $A$. + +If $f$ is a homomorphism from a ring $A$ to a ring $B$, the **kernel** of $f$ is the set of all the elements of $A$ which are carried by $f$ onto the zero element of $B$. In symbols, the kernel of $f$ is the set +$$ +K = \{x \in A: f(x) = 0\} +$$ +If $A$ and $b$ are rings, an **isomorphism** from $A$ to $B$ is a homomorphism which is a one-to-one correspondence from $A$ to $B$. In other words, it is injective and surjective homomorphism. + +If there is an isomorphism from $A$ to $B$ we say that $A$ is **isomorphic** to $B$, and this fact is expressed by writing $A \cong B$. + +## Chapter 19 + +Let $A$ be a ring, and $J$ an ideal of $A$. For any element $a \in A$, the symbol $J + a$ denotes the set of all sums $j + a$ as $a$ remains fixed and $j$ ranges over $J$. That is, +$$ +J + a = \{j + a : j \in J\} +$$ +$J + a$ is called a **coset** of $J$ in $A$. + +Now think of the set which contains all cosets of $J$ in $A$. This set is conventionally denoted by $A / J$ and reads $A$ mod $J$. Then, $A / J$ with coset addition and multiplication is a ring. + +An ideal $J$ of a commutative ring is said to be a **prime ideal** if for any two elements $a$ and $b$ in the ring, +$$ +ab \in J \implies a \in J \text{ or } b \in J +$$ +Theorem: If $J$ is a prime ideal of a community ring with unity $A$, then the quotient ring $A / J$ is an integral domain. + +An ideal $J$ of $A$ with $J \ne A$ is called a **maximal ideal** if there exists no proper ideal $K$ of $A$ such that $J \subseteq K$ with $J \ne K$. + +Theorem: If $A$ is a commutative ring with unity, then $J$ is a maximal ideal of $A$ iff $A/J$ is a field. + diff --git a/content/notes/algorithms.md b/content/notes/algorithms.md new file mode 100644 index 0000000..9178b7b --- /dev/null +++ b/content/notes/algorithms.md @@ -0,0 +1,17 @@ +--- +title: Algorithms Book Study +--- + +# Algorithms Book Study +A couple of my friends and I decided to start a book club following "Algorithms" by Jeff Erickson. One bonus is that he gives it away for free on [his website](http://jeffe.cs.illinois.edu/teaching/algorithms/)! + +Of course you should totally check his book out rather than reading my notes. There are tons of witty and fun things in his textbook, not a dry reading I promise. These notes are here mostly for archival purposes. + +## Notes +[Chapter 1](recursion) + +[Chapter 2](backtracking) + +[Chapter 3](dynamic) + +[Chapter 4](greedy) \ No newline at end of file diff --git a/content/notes/algorithms/backtracking.md b/content/notes/algorithms/backtracking.md new file mode 100644 index 0000000..5f9c7ae --- /dev/null +++ b/content/notes/algorithms/backtracking.md @@ -0,0 +1,62 @@ +# Backtracking +This algorithm tries to construct a solution to a problem one piece at a time. Whenever the algorithm needs to decide between multiple alternatives to the part of the solution it *recursively* evaluates every option and chooses the best one. + + +## How to Win +To beat any *non-random perfect information* game you can define a Backtracking algorithm that only needs to know the following. +- A game state is good if either the current player has already won or if the current player can move to a bad state for the opposing player. +- A game state is bad if either the current player has already lost or if every available move leads to a good state for the opposing player. + +``` +PlayAnyGame(X, player) + if player has already won in state X + return GOOD + if player has lost in state X + return BAD + for all legal moves X -> Y + if PlayAnyGame(y, other player) = Bad + return GOOD + return BAD +``` + +In practice, most problems have an enormous number of states not making it possible to traverse the entire game tree. + +## Subset Sum + +For a given set, can you find a subset that sums to a certain value? + +``` +SubsetSum(X, T): + if T = 0 + return True + else if T < 0 or X is empty + return False + else + x = any element of X + with = SubsetSum(X \ {x}, T - x) + without = SubsetSum(X \ {x}, T) + return (with or without) +``` + +X \ {x} denotes set subtraction. It means X without x. + +``` +ConstructSubset(X, i, T): + if T = 0 + return empty set + if T < 0 or n = 0 + return None + Y = ConstructSubset(X, i - 1, T) + if Y does not equal None + return Y + Y = ConstructSubset(X, i - 1, T - X[i]) + if Y does not equal None + return Y with X[i] + return None +``` + +## Big Idea + +Backtracking algorithms are used to make a *sequence of decisions*. + +When we design a new recursive backtracking algorithm, we must figure out in advance what information we will need about past decisions in the middle of the algorithm. \ No newline at end of file diff --git a/content/notes/algorithms/dynamic.md b/content/notes/algorithms/dynamic.md new file mode 100644 index 0000000..5d1b785 --- /dev/null +++ b/content/notes/algorithms/dynamic.md @@ -0,0 +1,82 @@ +# Dynamic Programming + +The book first goes into talking about the complexity of the Fibonacci algorithm + +``` +RecFibo(n): + if n = 0 + return 0 + else if n = 1 + return 1 + else + return RecFibo(n - 1) + RecFibo(n - 2) +``` + +It talks about how the complexity of this is exponential. + +"A single call to `RecFibo(n)` results in one recursive call to `RecFibo(n−1)`, two recursive calls to `RecFibo(n−2)`, three recursive calls to `RecFibo(n−3)`, five recursive calls to `RecFibo(n−4)`" + +Now consider the memoized version of this algorithm... + +``` +MemFibo(n): + if n = 0 + return 0 + else if n = 1 + return 1 + else + if F[n] is undefined: + F[n] <- MemFibo(n - 1) + MemFibo(n - 2) + return F[n] +``` + +This actually makes the algorithm run in linear time! + +![1564017052666](/home/rozek/Documents/StudyGroup/Algorithms/1564017052666.png) + +Dynamic programming makes use of this fact and just intentionally fills up an array with the values of $F$. + +``` +IterFibo(n): + F[0] <- 0 + F[1] <- 1 + for i <- 2 to n + F[i] <- F[i - 1] + F[i - 2] + return F[n] +``` + +Here the linear complexity becomes super apparent! + +Interesting snippet + +"We had a very interesting gentleman in Washington named Wilson. He was secretary of Defense, and he actually had a pathological fear and hatred of the word *research*. I’m not using the term lightly; I’m using it precisely. His face would suffuse, he would turn red, and he would get violent if people used the term *research* in his presence. You can imagine how he felt, then, about the term *mathematical*.... I felt I had to do something to shield Wilson and the Air Force from the fact that I was really doing mathematics inside the RAND Corporation. What title, what name, could I choose?" + + + +Dynamic programming is essentially smarter recursion. It's about not repeating the same work. + +These algorithms are best developed in two distinct stages. + +(1) Formulate the problem recursively. + +(a) Specification: What problem are you trying to solve? + +(b) Solution: Why is the whole problem in terms of answers t smaller instances exactly the same problem? + +(2) Find solutions to your recurrence from the bottom up + +(a) Identify the subproblems + +(b) Choose a memoization data structure + +(c) Identify dependencies + +(d) Find a good evaluation order + +(e) Analyze space and running time + +(f) Write down the algorithm + +## Greedy Algorithms + +If we're lucky we can just make decisions directly instead of solving any recursive subproblems. The problem is that greedly algorithms almost never work. \ No newline at end of file diff --git a/content/notes/algorithms/greedy.md b/content/notes/algorithms/greedy.md new file mode 100644 index 0000000..5477c9a --- /dev/null +++ b/content/notes/algorithms/greedy.md @@ -0,0 +1,36 @@ +# Greedy Algorithms + +Greedy Algorithms are about making the best local choice and then blindly plowing ahead. + +An example of this is documents on a tape. Let's say to read any given document on a tape, you first need to read all the documents that come before it. + +What is the best way to have the documents laid out in order to decrease the expected read time? + +Answer: Putting the smaller documents first. + +The book then generalizes it further by adding access frequencies. The answer to that is to sort by increasing length first and then decreasing access times. + +## Scheduling Classes +To maximize the number of classes one can take one greedy algorithm is to always select the class that ends first. + +That will produce one maximal conflict free schedule. + +## Structure of Correctness Proofs for Greedy Algorithms + +- Assume that there is an optimal solution that is different from the greedy solution. +- Find the first "difference" between the two solutions. +- Argue that we can exchange the optimal choice for the greedy choice without making the solution worse. + +## Hospital-Doctor Matching +Let's say you have a list of doctors that need internships and hospitals accepting interns. We need to make it so that every doctor has a job and every hospital has a doctor. + +Assuming we have the same number of doctors and hospitals and that each hospital offers only one internship, how do we make an algorithm to ensure that no unstable matchings exist? + +An unstable match is when +- a is matched with some other hospital A even though she prefers B +- B is matched with some doctor b even though they prefer a. + +The Gale-Shapley algorithm is a great greedy fit. It goes like this + +1. An arbitrary unmatched hospital A offers its position to the best doctor a who has not already rejected it. +2. If a is unmatched, she tentatively accepts A's offer. If a already had a match but prefers A, she rejects her current match and tentatively accepts the new offer from A. Otherwise a rejects the new offer. \ No newline at end of file diff --git a/content/notes/algorithms/recursion.md b/content/notes/algorithms/recursion.md new file mode 100644 index 0000000..96c2383 --- /dev/null +++ b/content/notes/algorithms/recursion.md @@ -0,0 +1,86 @@ +# Recursion + +## Reductions + +Quote: *Reduction* is the single most common technique used in designing algorithms. Reduce one problem $X$ to another problem $Y$. + +The running time of the algorithm can be affected by $Y$, but $Y$ does not affect the correctness of the algorithm. So it is often useful to not be concerned with the inner workings of $Y$. + +## Simplify and Delegate + +Quote: *Recursion* is a particularly powerful kind of reduction, which can be described loosely as follows: + +- If the given instance of the problem can be solved directly, then do so. +- Otherwise, reduce it to one or more **simpler instances of the same problem.** + +The book likes to call the delegation of simpler tasks "giving it to the recursion fairy." + +Your own task as an algorithm writer is to simplify the original problem and solve base cases. The recursion fairy will handle the rest. + +Tying this to mathematics, this is known as the **Induction Hypothesis**. + +The only caveat is that simplifying the tasks must eventually lead to the **base case** otherwise the algorithm might run infinitely! + +#### Example: Tower of Hanoi + +Assuming you know how the game works, we will describe how to solve it. + +Quote: We can't move it all at the beginning, because all the other disks are in the way. So first we have to move those $n - 1$ smaller disks to the spare peg. Once that's done we can move the largest disk directly to its destination. Finally to finish the puzzle, we have to move the $n -1$ disks from the spare peg to the destination. + +**That's it.** + +Since the problem was reduced to a base case and a $(n - 1)$ problem, we're good. The book has a funny quote "Our job is finished. If we didn't trust the junior monks, we wouldn't have hired them; let them do their job in peace." + + ``` +Hanoi(n, src, dst, tmp): + if n > 0 + Hanoi(n - 1, src, tmp, dst) + move disk n from src to dst + Hanoi(n - 1, tmp, dst, src) + ``` + +## Sorting Algorithms + +## Merge Sort + +``` +MergeSort(A[1..n]): + if n > 1 + m = floor(n / 2) + MergeSort(A[1..m]) + MergeSort(A[m + 1..n]) + Merge(A[1..n], m) +``` + +``` +Merge(A[1..n], m): + i = 1 + j = m + 1 + for k = 1 to n + if j > n + B[k] = A[i] + i++ + else if i > m + B[k] = A[j] + j++ + else if A[i] < A[j] + B[k] = A[i] + i++ + else + B[k] = A[j] + j++ + Copy B to A +``` + +I think an important part to recall here is that the algorithm will break it down to the lowest level. An array with one element and slowly work its way up. + +That means we can always assume that each subarray that we're merging is already sorted! Which is why the merge algorithm is written the way it is. + +## The Pattern + +This section is quoted verbatim. + +1. **Divide** the given instance of the problem into several *independent smaller* instances of *exactly* the same problem. +2. **Delegate** each smaller instance to the Recursion Fairy. +3. **Combine** the solutions for the smaller instances into the final solution for the given instance. + diff --git a/content/notes/bayesianstatistics.md b/content/notes/bayesianstatistics.md new file mode 100644 index 0000000..84a1897 --- /dev/null +++ b/content/notes/bayesianstatistics.md @@ -0,0 +1,20 @@ +--- +title: Bayesian Statistics +showthedate: false +--- + + + +# Bayesian Statistics: From Concept to Data Analysis + +In the Winter of 2017, I took a course on Bayesian Statistics on Coursera offered by Dr. Herbert Lee. + +Below are the notes for each of the four weeks. + +[Week 1](week1) + +[Week 2](week2) + +[Week 3](week3) + +[Week 4](week4) diff --git a/content/notes/bayesianstatistics/week1.md b/content/notes/bayesianstatistics/week1.md new file mode 100644 index 0000000..3480a84 --- /dev/null +++ b/content/notes/bayesianstatistics/week1.md @@ -0,0 +1,413 @@ +# Bayesian Statistics + +## Rules of Probability + +Probabilities must be between zero and one, i.e., $0≤P(A)≤1$ for any event A. + +Probabilities add to one, i.e., $\sum{P(X_i)} = 1$ + +The complement of an event, $A^c$, denotes that the event did not happen. Since probabilities must add to one, $P(A^c) = 1 - P(A)$ + +If A and B are two events, the probability that A or B happens (this is an inclusive or) is the probability of the union of the events: +$$ +P(A \cup B) = P(A) + P(B) - P(A\cap B) +$$ +where $\cup$ represents union ("or") and $\cap$ represents intersection ("and"). If a set of events $A_i$ are mutually exclusive (only one event may happen), then +$$ +P(\cup_{i=1}^n{A_i}) = \sum_{i=1}^n{P(A_i)} +$$ + +## Odds + +The odds for event A, denoted $\mathcal{O}(A)$ is defined as $\mathcal{O}(A) = P(A)/P(A^c)$ + +This is the probability for divided by probability against the event + +From odds, we can also compute back probabilities +$$ +\frac{P(A)}{P(A^c)} = \mathcal{O}(A) +$$ + +$$ +\frac{P(A)}{1-P(A)} = \mathcal{O}(A) +$$ + +$$ +\frac{1 -P(A)}{P(A)} = \frac{1}{\mathcal{O}(A)} +$$ + +$$ +\frac{1}{P(A)} - 1 = \frac{1}{\mathcal{O}(A)} +$$ + +$$ +\frac{1}{P(A)} = \frac{1}{\mathcal{O}(A)} + 1 +$$ + +$$ +\frac{1}{P(A)} = \frac{1 + \mathcal{O}(A)}{\mathcal{O}(A)} +$$ + +$$ +P(A) = \frac{\mathcal{O}(A)}{1 + \mathcal{O}(A)} +$$ + +## Expectation + +The expected value of a random variable X is a weighted average of values X can take, with weights given by the probabilities of those values. +$$ +E(X) = \sum_{i=1}^n{x_i * P(X=x_i)} +$$ + +## Frameworks of probability + +Classical -- Outcomes that are equally likely have equal probabilities + +Frequentist -- In an infinite sequence of events, what is the relative frequency + +Bayesian -- Personal perspective (your own measure of uncertainty) + +In betting, one must make sure that all the rules of probability are followed. That the events are "coherent", otherwise one might construct a series of bets where you're guaranteed to lose money. This is referred to as a Dutch book. + +## Conditional probability + +$$ +P(A|B) = \frac{P(A\cup B)}{P(B)} +$$ + +Where $A|B$ denotes "A given B" + +Example from lecture: + +Suppose there are 30 students, 9 of which are female. From the 30 students, 12 are computer science majors. 4 of those 12 computer science majors are female +$$ +P(Female) = \frac{9}{30} = \frac{3}{10} +$$ + +$$ +P(CS) = \frac{12}{30} = \frac{2}{5} +$$ + +$$ +P(F\cap CS) = \frac{4}{30} = \frac{2}{15} +$$ + +$$ +P(F|CS) = \frac{P(F \cap CS)}{P(CS)} = \frac{2/15}{2/5} = \frac{1}{3} +$$ + +An intuitive way to think about a conditional probability is that we're looking at a subsegment of the original population, and asking a probability question within that segment +$$ +P(F|CS^c) = \frac{P(F\cap CS^c)}{PS(CS^c)} = \frac{5/30}{18/30} = \frac{5}{18} +$$ +The concept of independence is when one event does not depend on another. +$$ +P(A|B) = P(A) +$$ +It doesn't matter that B occurred. + +If two events are independent then the following is true +$$ +P(A\cap B) = P(A)P(B) +$$ +This can be derived from the conditional probability equation. + +## Conditional Probabilities in terms of other conditional + +Suppose we don't know what $P(A|B)$ is but we do know what $P(B|A)$ is. We can then rewrite $P(A|B)$ in terms of $P(B|A)$ +$$ +P(A|B) = \frac{P(B|A)P(A)}{P(B|A)P(A) + P(B|A^c)P(A^c)} +$$ +Let's look at an example of an early test for HIV antibodies known as the ELISA test. +$$ +P(+ | HIV) = 0.977 +$$ + +$$ +P(- | NO\_HIV) = 0.926 +$$ + +As you can see over 90% of the time, this test was accurate. + +The probability of someone in North America having this disease was $P(HIV) = .0026$ + +Now let's consider the following problem: the probability of having the disease given that they tested positive $P(HIV | +)$ +$$ +P(HIV|+) = \frac{P(+|HIV)P(HIV)}{P(+|HIV)P(HIV) + P(+|NO\_HIV){P(NO\_HIV)}} +$$ + +$$ +P(HIV|+) = \frac{(.977)(.0026)}{(.977)(.0026) + (1-.977)(1-.0026)} +$$ + +$$ +P(HIV|+) = 0.033 +$$ + +This example looked at Bayes Theorem for the two event case. We can generalize it to n events through the following formula +$$ +P(A|B) = \frac{P(B|A_1){(A_1)}}{\sum_{i=1}^{n}{P(B|A_i)}P(A_i)} +$$ + + + +## Bernoulli Distribution + +~ means 'is distributed as' + +We'll be first studying the Bernoulli Distribution. This is when your event has two outcomes, which is commonly referred to as a success outcome and a failure outcome. The probability of success is $p$ which means the probability of failure is $(1-p)$ +$$ +X \sim B(p) +$$ + +$$ +P(X = 1) = p +$$ + +$$ +P(X = 0) = 1-p +$$ + +The probability of a random variable $X$ taking some value $x$ given $p$ is +$$ +f(X = x | p) = f(x|p) = p^x(1-p)^{1 - x}I +$$ +Where $I$ is the Heavenside function + +Recall the expected value +$$ +E(X) = \sum_{x_i}{x_iP(X=x_i)} = (1)p + (0)(1-p) = p +$$ +We can also define the variance of Bernoulli +$$ +Var(X) = p(1-p) +$$ + +## Binomial Distribution + +The binomial distribution is the sum of n *independent* Bernoulli trials +$$ +X \sim Bin(n, p) +$$ + +$$ +P(X=x|p) = f(x|p) = {n \choose x} p^x (1-p)^{n-x} +$$ + +$n\choose x$ is the combinatoric term which is defined as +$$ +{n \choose x} = \frac{n!}{x! (n - x)!} +$$ + +$$ +E(X) = np +$$ + +$$ +Var(X) = np(1-p) +$$ + +## Uniform distribution + +Let's say X is uniformally distributed +$$ +X \sim U[0,1] +$$ + +$$ +f(x) = \left\{ + \begin{array}{lr} + 1 & : x \in [0,1]\\ + 0 & : otherwise + \end{array} + \right. +$$ + +$$ +P(0 < x < \frac{1}{2}) = \int_0^\frac{1}{2}{f(x)dx} = \int_0^\frac{1}{2}{dx} = \frac{1}{2} +$$ + +$$ +P(0 \leq x \leq \frac{1}{2}) = \int_0^\frac{1}{2}{f(x)dx} = \int_0^\frac{1}{2}{dx} = \frac{1}{2} +$$ + +$$ +P(x = \frac{1}{2}) = 0 +$$ + +## Rules of probability density functions + +$$ +\int_{-\infty}^\infty{f(x)dx} = 1 +$$ + +$$ +f(x) \ge 0 +$$ + +$$ +E(X) = \int_{-\infty}^\infty{xf(x)dx} +$$ + +$$ +E(g(X)) = \int{g(x)f(x)dx} +$$ + +$$ +E(aX) = aE(X) +$$ + +$$ +E(X + Y) = E(X) + E(Y) +$$ + +If X & Y are independent +$$ +E(XY) = E(X)E(Y) +$$ + +## Exponential Distribution + +$$ +X \sim Exp(\lambda) +$$ + +Where $\lambda$ is the average unit between observations +$$ +f(x|\lambda) = \lambda e^{-\lambda x} +$$ + +$$ +E(X) = \frac{1}{\lambda} +$$ + +$$ +Var(X) = \frac{1}{\lambda^2} +$$ + +## Uniform (Continuous) Distribution + +$$ +X \sim [\theta_1, \theta_2] +$$ + +$$ +f(x|\theta_1,\theta_2) = \frac{1}{\theta_2 - \theta_1}I_{\theta_1 \le x \le \theta_2} +$$ + +## Normal Distribution + +$$ +X \sim N(\mu, \sigma^2) +$$ + +$$ +f(x|\mu,\sigma^2) = \frac{1}{\sqrt{2\pi \sigma^2}}e^{-\frac{1}{2\sigma^2}(x-\mu)^2} +$$ + +$$ +E(X) = \mu +$$ + +$$ +Var(X) = \sigma^2 +$$ + +## Variance + +Variance is the squared distance from the mean +$$ +Var(X) = \int_{-\infty}^\infty {(x - \mu)^2f(x)dx} +$$ + +## Geometric Distribution (Discrete) + +The geometric distribution is the number of trails needed to get the first success, i.e, the number of Bernoulli events until a success is observed. +$$ +X \sim Geo(p) +$$ + +$$ +P(X = x|p) = p(1-p)^{x-1} +$$ + +$$ +E(X) = \frac{1}{p} +$$ + +## Multinomial Distribution (Discrete) + +Multinomial is like a binomial when there are more than two possible outcomes. + + +$$ +f(x_1,...,x_k|p_1,...,p_k) = \frac{n!}{x_1! ... x_k!}p_1^{x_1}...p_k^{x_k} +$$ + +## Poisson Distribution (Discrete) + +The Poisson distribution is used for counts. The parameter $\lambda > 0$ is the rate at which we expect to observe the thing we are counting. +$$ +X \sim Pois(\lambda) +$$ + +$$ +P(X=x|\lambda) = \frac{\lambda^xe^{-\lambda}}{x!} +$$ + +$$ +E(X) = \lambda +$$ + +$$ +Var(X) = \lambda +$$ + +## Gamma Distribution (Continuous) + +If $X_1, X_2, ..., X_n$ are independent and identically distributed Exponentials,waiting time between success events, then the total waiting time for all $n$ events to occur will follow a gamma distribution with shape parameter $\alpha = n$ and rate parameter $\beta = \lambda$ +$$ +Y \sim Gamma(\alpha, \beta) +$$ + +$$ +f(y|\alpha,\beta) = \frac{\beta^n}{\Gamma(\alpha)}y^{n-1}e^{-\beta y}I_{y\ge0}(y) +$$ + +$$ +E(Y) = \frac{\alpha}{\beta} +$$ + +$$ +Var(Y) = \frac{\alpha}{\beta^2} +$$ + +Where $\Gamma(x)$ is the gamma function. The exponential distribution is a special case of the gamma distribution with $\alpha = 1$. As $\alpha$ increases, the gamma distribution more closely resembles the normal distribution. + +## Beta Distribution (Continuous) + +The beta distribution is used for random variables which take on values between 0 and 1. For this reason, the beta distribution is commonly used to model probabilities. +$$ +X \sim Beta(\alpha, \beta) +$$ + +$$ +f(x|\alpha,\beta) = \frac{\Gamma(\alpha + \beta)}{\Gamma(\alpha)\Gamma(\beta)}x^{n -1}(1 - x)^{\beta - 1}I_{\{0 < x < 1\}} +$$ + +$$ +E(X) = \frac{\alpha}{\alpha + \beta} +$$ + +$$ +Var(X) = \frac{\alpha\beta}{(\alpha + \beta)^2(\alpha+\beta+1)} +$$ + +The standard uniform distribution is a special case of the beta distribution with $\alpha = \beta = 1$ + +## Bayes Theorem for continuous distribution + +$$ +f(\theta|y) = \frac{f(y|\theta)f(\theta)}{\int{f(y|\theta)f(\theta)d\theta}} +$$ + diff --git a/content/notes/bayesianstatistics/week2.md b/content/notes/bayesianstatistics/week2.md new file mode 100644 index 0000000..54b2a6f --- /dev/null +++ b/content/notes/bayesianstatistics/week2.md @@ -0,0 +1,537 @@ +Under the frequentest paradigm, you view the data as a random sample from some larger, potentially hypothetical population. We can then make probability statements i.e, long-run frequency statements based on this larger population. + +## Coin Flip Example (Central Limit Theorem) + +Let's suppose we flip a coin 100 times and we get 44 heads and 56 tails. +$$ +n = 100 +$$ +We can view these 100 flips as a random sample from a much larger infinite hypothetical population of flips from this coin. + +Let's say that each flip follows a Bournelli distribution with some probability p. In this case $p$ is unknown, but we're assuming it's fixed because we have a particular physical coin. + +We can ask what's our best estimate of the probability of getting a head, or an estimate of $p$. We can also ask about how confident we are about that estimate. + +Let's start by applying the Central Limit Theorem. The Central Limit Theorem states that the sum of 100 flips will follow approximately a Normal distribution with mean 100p and variance 100p(1-p) +$$ +\sum^n_{i=1}{x_i} \sim N(np, np(1-p)) +$$ + +$$ +\sum_{i = 1}^{100}{x_i} \sim N(100p, 100p(1-p)) +$$ + +By the properties of a Normal distribution, 95% of the time we'll get a result within 1.96 standard deviations of the mean. Our estimate is $100\hat{p}$ and our error is 1.96 times the standard deviation. +$$ +n\hat{p} \pm 1.96\sqrt{n\hat{p}(1-\hat{p})} +$$ + +$$ +100\hat{p} \pm 1.96\sqrt{100\hat{p}(1-\hat{p})} +$$ + +This is referred to as a Confidence Interval. Confidence Intervals are commonly abbreviated as CI. In our example $\hat{p} = \frac{44}{n} = \frac{44}{100}$. Therefore, the 95% Confidence Interval in the true number of heads after flipping a coin 100 times is: +$$ +100(.44) \pm 1.96\sqrt{100(.44)(1-.44)} +$$ + +$$ +44 \pm 1.96\sqrt{44(.56)} +$$ + +$$ +44\pm 1.96\sqrt{24.64} +$$ + +$$ +(34.27, 53.73) +$$ + +We can divide this by 100 to get the 95% Confidence Interval for $p$ +$$ +(0.34, 0.53) +$$ +Let's step back and ask, what does it mean when I say we're 95% confident? + +Under the frequentest paradigm, what this means is we have to think back to our infinite hypothetical sequence of events. So if we were to repeat this trial an infinite number of times, or an arbitrary large number of times. Each time we create a confidence interval based on the data we observe, than on average 95% of the intervals we make will contain the true value of p. + +On the other hand, we might want to know something about this particular interval. Does this interval contain the true p? What's the probability that this interval contains a true p? Well, we don't know for this particular interval. But under the frequentest paradigm, we're assuming that there is a fixed answer for p. Either p is in that interval or it's not in that interval. The probability that p is in that interval is either 0 or 1. + +## Example: Heart Attack Patients (Maximum Likelihood) + +Consider a hospital where 400 patients are admitted over a month for heart attacks, and a month later 72 of them have died and 328 of them have survived. + +We can ask, what's our estimate of the mortality rate? + +Under the frequentest paradigm, we must first establish our reference population. What do we think our reference population is here? One possibility is we could think about heart attack patients in the region. + +Another reference population we can think about is heart attack patients that are admitted to this hospital, but over a longer period of time. + +Both of these might be reasonable attempts, but in this case our actual data are not random sample from either of those populations. We could sort of pretend they are and move on, or we could also try to think harder about what a random sample situation might be. We can think about all the people in the region who might possibly have a heart attack and might possibly get admitted to this hospital. + +It's a bit of an odd hypothetical situation, and so there are some philosophical issues with the setup of this whole problem with the frequentest paradigm, In any case, let's forge forward and think about how we might do some estimation. + +Moving on, we can say each patient comes from a Bernoulli distribution with an unknown parameter $\theta$. +$$ +Y_i \sim B(\theta) +$$ + +$$ +P(Y_i = 1) = \theta +$$ + +In this case, let's call the "success" a mortality. + +The probability density function for the entire set of data we can write in vector form. Probability of all the Y's take some value little y given a value of theta. +$$ +P(Y = y | \theta) = P(Y_1 = y_1, Y_2, = y_2,\dots, Y_n=y_n|\theta) +$$ +*Since we're viewing these as independent events*, then the probability of each of these individual ones we can write in product notation. +$$ +P(Y = y | \theta) = P(Y_1 = y_1|\theta)\dots P(Y_n = y_n | \theta) +$$ + +$$ +P(Y = y | \theta) = \prod_{i = 1}^n{P(Y_i =y_i | \theta)} = \prod_{i = 1}^n{(\theta^{y_i}(1-\theta)^{1-y_i})} +$$ + +This is the probability of observing the actual data that we collected, conditioned on a value of the parameter $\theta$. We can now think about this expression as a function of theta. This is a concept of a likelihood. +$$ +L(\theta|y) = \prod_{i = 1}^n{(\theta^{y_i}(1-\theta)^{1-y_i})} +$$ +It looks like the same function, but here it is a function of y given $\theta$. And now we're thinking of it as a function of $\theta$ given y. + +This is not a probability distribution anymore, but it is still a function for $\theta$. + +One we to estimate $\theta$ is that we choose the $\theta$ that gives us the largest value of the likelihood. It makes the data the most likely to occur for the particular data we observed. + +This is referred to as the maximum likelihood estimate (MLE), + +We're trying to find the $\theta$ that maximizes the likelihood. + +In practice, it's usually easier to maximize the natural logarithm of the likelihood, commonly referred to as the log likelihood. +$$ +\mathcal{L}(\theta) = \log{L(\theta|y)} +$$ +Since the logarithm is a monotonic function, if we maximize the logarithm of the function, we also maximize the original function. +$$ +\mathcal{L(\theta)} = \log{\prod_{i = 1}^n{(\theta^{y_i}(1-\theta)^{1-y_i})}} +$$ + +$$ +\mathcal{L}(\theta) = \sum_{i = 1}^n{\log{(\theta^{y_i}(1-\theta)^{1-y_i})}} +$$ + +$$ +\mathcal{L}(\theta) = \sum_{i = 1}^n{(\log{(\theta^{y_i}}) + \log{(1-\theta)^{1-y_i}})} +$$ + +$$ +\mathcal{L}(\theta) = \sum_{i = 1}^n{(y_i\log{\theta} + (1 - y_i)\log{(1-\theta)})} +$$ + +$$ +\mathcal{L}(\theta) = \log{\theta}\sum_{i = 1}^n{y_i} + \log{(1-\theta)}\sum_{i = 1}^n{(1-y_i)} +$$ + +How do we find the theta that maximizes this function? Recall from calculus that we can maximize a function by taking the derivative and setting it equal to 0. +$$ +\mathcal{L}^\prime(\theta) = \frac{1}{\theta}\sum{y_i} - \frac{1}{1-\theta}\sum{(1 - y_i)} +$$ +Now we need to set it equal to zero and solve for $\hat{\theta}$ +$$ +\frac{\sum{y_i}}{\hat{\theta}} = \frac{\sum{(1-y_i)}}{1-\hat{\theta}} +$$ + +$$ +\hat{\theta}\sum{(1-y_i)} = (1-\hat{\theta})\sum{y_i} +$$ + +$$ +\hat{\theta}\sum{(1-y_i)} + \hat{\theta}\sum{y_i} = \sum{y_i} +$$ + +$$ +\hat{\theta}(\sum^n{(1 - y_i + y_i)}) = \sum{y_i} +$$ + +$$ +\hat{\theta} = \frac{1}{n}\sum{y_i} = \hat{p} = \frac{72}{400} = 0.18 +$$ + +Maximum likelihood estimators have many desirable mathematical properties. They're unbiased, they're consistent, and they're invariant. + +In general, under certain regularity conditions, we can say that the MLE is approximately normally distributed with mean at the true value of $\theta$ and the variance $\frac{1}{I(\hat{\theta})}$ where $I(\hat{\theta})$ is the Fisher information at the value of $\hat{\theta}$. The Fisher information is a measure of how much information about $\theta$ is in each data point. +$$ +\hat{\theta} \sim N(\theta, \frac{1}{I(\hat{\theta})}) +$$ +For a Bernoulli random variable, the Fisher information turns out to be +$$ +I(\theta) = \frac{1}{\theta(1-\theta)} +$$ +So the information is larger, when theta is near zero or near one, and it's the smallest when theta is near one half. + +This makes sense, because if you're flipping a coin, and you're getting a mix of heads and tails, that tells you a little bit less than if you're getting nearly all heads or nearly all tails. + +## Exponential Likelihood Example + +Let's say $X_i$ are distributed so +$$ +X_i \sim Exp(\lambda) +$$ +Let's say the data is independent and identically distributed, therefore making the overall density function +$$ +f(x|\lambda) = \prod_{i = 1}^n{\lambda e^{-\lambda x_i}} +$$ + +$$ +f(x|\lambda) = \lambda^ne^{-\lambda \sum{x_i}} +$$ + +Now the likelihood function is +$$ +L(\lambda|x) = \lambda^n e^{-\lambda \sum{x_i}} +$$ + +$$ +\mathcal{L}(\lambda) = n\ln{\lambda} - \lambda\sum{x_i} +$$ + +Taking the derivative +$$ +\mathcal{L}^\prime(\lambda) = \frac{n}{\lambda} - \sum{x_i} +$$ +Setting this equal to zero +$$ +\frac{n}{\hat{\lambda}} =\sum{x_i} +$$ + +$$ +\hat{\lambda} = \frac{n}{\sum{x_i}} = \frac{1}{\bar{x}} +$$ + +## Uniform Distribution + +$$ +X_i \sim U[0, \theta] +$$ + +$$ +f(x|\theta) = \prod_{i = 1}^n{\frac{1}{\theta}I_{0 \le x_i \le \theta}} +$$ + +Combining all the indicator functions, for this to be a 1, each of these has to be true. These are going to be true if all the observations are bigger than 0, as in the minimum of the x is bigger than or equal to 0. The maximum of the x's is also less than or equal to $\theta$. +$$ +L(\theta|x) = \theta^{-1} I_{0\le min(x_i) \le max(x_i) \le \theta} +$$ + +$$ +L^\prime(\theta) = -n\theta^{-(n + 1)}I_{0 \le min(x_i) \le max(x_i)\le \theta} +$$ + +So now we can ask, can we set this equal to zero and solve for $\theta$? Well it turns out, this is not equal to zero for any $\theta$ positive value. We need $\theta$ to be strictly larger than zero. + +However, we can also note that for $\theta$ positive, this will always be negative. The derivative is negative, that says this is a decreasing function. So this funciton will be maximized when we pick $\theta$ as small as possible. What's the smallest possible value of $\theta$ we can pick? Well we need in particular for $\theta$ to be larger than all of the $X_i$ . And so, the maximum likelihood estimate is the maximum of $X_i$ +$$ +\hat{\theta} = max(x_i) +$$ + +## Products of Indicator Functions + +Because 0 * 1 = 0, the product of indicator functions can be combined into a single indicator function with a modified condition. + +**Example**: $I_{x < 5} * I_{x \ge 0} = I_{0 \le x < 5}$ + +**Example**: $\prod_{i = 1}^n{I_{x_i < 2}} = I_{x_i < 2 for all i} = I_{max(x_i) < 2}$ + +## Introduction to R + +R has some nice functions that one can use for analysis + +`mean(z)` gives the mean of some row vector $z$ + +`var(z)` reports the variance of some row vector + +`sqrt(var(z))` gives the standard deviation of some row vector + +`seq(from=0.1, to = 0.9, by = 0.1)` creates a vector that starts from $0.1$ and goes to $0.9$ incrementing by $0.1$ + +```R +seq(from=0.1, to = 0.9, by = 0.1) +[1] 0.1 0.2 0.3 0.4 0.5 0.6 0.7 0.8 0.9 +seq(1, 10) +[1] 1 2 3 4 5 6 7 8 9 10 +``` + +`names(x)` gives the names of all the columns in the dataset. + +```R +names(trees) +[1] "Girth" "Height" "Volume" +``` + +`hist(x)` provides a histogram based on a vector + +The more general `plot` function tries to guess at which type of plot to make. Feeding it two numerical vectors will make a scatter plot. + +The R function `pairs` takes in a data frame and tries to make all possible Pairwise scatterplots for the dataset. + +The `summary` command gives the five/six number summary (minimum, first quartile, median, mean, third quartile, maximum) + +## Plotting the likelihood function in R + +Going back to the hospital example + +```R +## Likelihood function +likelihood = function(n, y, theta) { + return(theta^y * (1 - theta)^(n - y)) +} +theta = seq(from = 0.01, to = 0.99, by = 0.01) +plot(theta, likelihood(400, 72, theta)) +``` + +You can also do this with log likelihoods. This is typically more numerically stable to compute + +```R +loglike = function(n, y, theta) { + return(y * log(theta) + (n - y) * log(1 - theta)) +} +plot(theta, loglike(400, 72, theta)) +``` + +Having these plotted as points makes it difficult to see, let's plot it as lines + +```R +plot(theta, loglike(400, 72, theta), type = "l") +``` + + + +## Cumulative Distribution Function + +The cumulative distribution function (CDF) exists for every distribution. We define it as $F(x) = P(X \le x)$ for random variable $X$. + +If $X$ is discrete-valued, then the CDF is computed with summation $F(x) = \sum_{t = -\infty}^x {f(t)}$. where $f(t) = P(X = t)$ is the probability mass function (PMF) which we've already seen. + +If $X$ is continuous, the CDF is computed with an integral $F(x) = \int_{-\infty}^x{f(t)dt}$ + +The CDF is convenient for calculating probabilities of intervals. Let $a$ and $b$ be any real numbers with $a < b$. Then the probability that $X$ falls between $a$ and $b$ is equal to $P(a < X < b) = P(X \le b) - P(X \le a) = F(b) - F(a)$ + + + +## Quantile Function + +The CDF takes a value for a random variable and returns a probability. Suppose instead we start with a number between $0$ and $1$, which we call $p$, and we wish to find a value $x$ so that $P(X \le x) = p$. The value $x$ which satisfies this equation is called the $p$ quantile. (or $100p$ percentile) of the distribution of $X$. + + + +## Probability Distributions in R + +Each of the distributions introduced in Lesson 3 have convenient functions in R which allow you to evaluate the PDF/PMF, CDF, and quantile functions, as well as generate random samples from the distribution. To illustrate, Table I list these functions for the normal distribution + +| Function | What it does | +| -------------------- | ---------------------------------------- | +| `dnorm(x, mean, sd)` | Evaluate the PDF at $x$ (mean = $\mu$ and sd = $\sqrt{\sigma^2}$) | +| `pnorm(q, mean, sd)` | Evaluate the CDF at $q$ | +| `qnorm(p, mean, sd)` | Evaluate the quantile function at $p$ | +| `rnorm(n, mean, sd)` | Generate $n$ pseudo-random samples from the normal distribution | + +These four functions exist for each distribution where `d...` function evaluates the density/mass, `p...` evaluates the CDF, `q...` evaluates the quantile, and `r...` generates a sample. Table 2 lists the `d...` functions for some of the most popular distributions. The `d` can be replaced with `p`, `q`, or `r` for any of the distributions, depending on what you want to calculate. + +For details enter `?dnorm` to view R's documentation page for the Normal distribution. As usual , replace the `norm` with any distribution to read the documentation for that distribution. + +| Distribution | Function | Parameters | +| ---------------------- | -------------------------- | ------------------------------------ | +| $Binomial(n,p)$ | `dbinom(x, size, prob)` | size = $n$, prob = $p$ | +| $Poisson(\lambda)$ | `dpois(x, lambda)` | lambda = $\lambda$ | +| $Exp(\lambda)$ | `dexp(x, rate)` | rate = $\lambda$ | +| $Gamma(\alpha, \beta)$ | `dgamma(x, shape, rate)` | shape = $\alpha$, rate = $\beta$ | +| $Uniform(a, b)$ | `dunif(x, min, max)` | min = $a$, max = $b$ | +| $Beta(\alpha, \beta)$ | `dbeta(x, shape1, shape2)` | shape1 = $\alpha$, shape2 = $\beta$ | +| $N(\mu, \sigma^2)$ | `dnorm(x, mean, sd)` | mean = $\mu$, sd = $\sqrt{\sigma^2}$ | +| $t_v$ | `dt(x, df)` | df = $v$ | + +## Two Coin Example + +Suppose your brother has a coin which you know to be loaded so that it comes up heads 70% of the time. He then comes to you with some coin, you're not sure which one and he wants to make a bet with you. Betting money that it's going to come up heads. + +You're not sure if it's the loaded coin or if it's just a fair one. So he gives you a chance to flip it 5 times to check it out. + +You flip it five times and get 2 heads and 3 tails. Which coin do you think it is and how sure are you about that? + +We'll start by defining the unknown parameter $\theta$, this is either that the coin is fair or it's a loaded coin. +$$ +\theta = \{fair ,loaded\} +$$ + +$$ +X \sim Bin(5, ?) +$$ + +$$ +f(x|\theta) = \begin{cases} + {5 \choose x}(\frac{1}{2})^5 & \theta = fair \\ + {5 \choose x} (.7)^x (.3)^{5 - x} & \theta = loaded\\ + \end{cases} +$$ + +We can also rewrite $f(x|\theta)$ with indicator functions +$$ +f(x|\theta) = {5\choose x}(.5)^5I_{\{\theta= fair\}} + {5 \choose x}(.7)^x(.3)^{5 - x}I_{\{\theta = loaded\}} +$$ +In this case, we observed that $x = 2$ +$$ +f(\theta | x = 2) = \begin{cases} + 0.3125 & \theta = fair \\ + 0.1323 & \theta = loaded +\end{cases} +$$ +MLE $\hat{\theta} = fair$ + +That's a good point estimate, but then how do we answer the question, how sure are you? + +This is not a question that's easily answered in the frequentest paradigm. Another question is that we might like to know what is the probability that theta equals fair, give, we observe two heads. +$$ +P(\theta = fair|x = 2) = ? +$$ +In the frequentest paradigm, the coin is a physical quantity. It's a fixed coin, and therefore it has a fixed probability of coining up heads. It is either the fair coin, or it's the loaded coin. +$$ +P(\theta = fair) = \{0,1\} +$$ + +### Bayesian Approach to the Problem + +An advantage of the Bayesian approach is that it allows you to easily incorporate prior information, when you know something in advance of the looking at the data. This is difficult to do under the Frequentest paradigm. + +In this case, we're talking about your brother. You probably know him pretty well. So suppose you think that before you've looked at the coin, there's a 60% probability that this is the loaded coin. + +This case, we put this into our prior. Our prior is that the probability the coin is loaded is 0.6. We can update our prior with the data to get our posterior beliefs, and we can do this using the bayes theorem. + +Prior: $P(loaded) = 0.6$ +$$ +f(\theta|x) = \frac{f(x|\theta)f(\theta)}{\sum_\theta{f(x|\theta)f(\theta)}} +$$ + +$$ +f(\theta|x) = \frac{{5\choose x} [(\frac{1}{2})^5(.4)I_{\{\theta = fair\}} + (.7)^x (.3)^{5-x}(.6)I_{\{\theta = loaded\}} ] } +{{5\choose x} [(\frac{1}{2})^5(.4) + (.7)^x (.3)^{5-x}(0.6) ] } +$$ + +$$ +f(\theta|x=2)= \frac{0.0125I_{\{\theta=fair\}} + 0.0079I_{\{\theta=loaded\}} }{0.0125+0.0079} +$$ + +$$ +f(\theta|x=2) = 0.612I_{\{\theta=fair\}} + 0.388I_{\{\theta = loaded\}} +$$ + +As you can see in the calculation here, we have the likelihood times the prior in the numerator, and in the denominator, we have a normalizing constant, so that when we divide by this, we'll get answer that add up to one. These numbers match exactly in this case, because it's a very simple problem. But this is a concept that goes on, what's in the denominator here is always a normalizing constant. +$$ +P(\theta = loaded | x = 2) = 0.388 +$$ +This here updates our beliefs after seeing some data about what the probability might be. + +We can also examine what would happen under different choices of prior. +$$ +P(\theta = loaded) = \frac{1}{2} \implies P(\theta = loaded | x = 2) = 0.297 +$$ + +$$ +P(\theta = loaded) = 0.9 \implies P(\theta = loaded | x = 2) = 0.792 +$$ + +In this case, the Bayesian approach is inherently subjective. It represents your own personal perspective, and this is an important part of the paradigm. If you have a different perspective, you will get different answers, and that's okay. It's all done in a mathematically vigorous framework, and it's all mathematically consistent and coherent. + +And in the end, we get results that are interpretable + +## Continuous Bayes + +$$ +f(\theta | y) = \frac{f(y | \theta)f(\theta)}{f(y)} = \frac{f(y|\theta)f(\theta)}{\int{f(y|\theta)f(\theta)d\theta}} = \frac{likelihood * prior}{normalization} \propto likelihood * prior +$$ + +In practice, sometimes this integral can be a pain to compute. And so, we may work with looking at saying this is proportional to the likelihood times the prior. And if we can figure out what this looks like and just put the appropriate normalizing constant on at the end, we don't necessarily have to compute this integral. + + + +So for example, suppose we're looking at a coin and it has unknown probability $\theta$ of coming up heads. Suppose we express ignorance about the value of $\theta$ by assigning it a uniform distribution. +$$ +\theta \sim U[0, 1] +$$ + +$$ +f(\theta) = I_{\{0 \le \theta\le 1\}} +$$ + +$$ +f(\theta | y = 1) = \frac{\theta^1(1-\theta)^0I_{\{0 \le \theta\le1\}}}{\int_{-\infty}^\infty{\theta^1(1-\theta)^0I_{\{0\le \theta \le 1\}}}} +$$ + +$$ +f(\theta | y = 1) = \frac{\theta I_{\{0\le\theta\le1\}}}{\int_0^1{\theta d\theta}} = 2\theta I_{\{0\le\theta\le1\}} +$$ + +Now if we didn't want to take the integral we could've done this approach +$$ +f(\theta | y) \propto f(y|\theta)f(\theta) \propto \theta I_{\{0\le\theta\le1\}} +$$ +Which then we need to find the constant such that it's a proper PMF. In this case, it's $2$. + +Since it's a proper PMF, we can perform interval probabilities as well. This is called Posterior interval estimates. +$$ +P(0.025 < \theta < 0.975) = \int_{0.025}^{0.975}{2\theta d \theta} = (0.975)^2 - (0.025)^2 = 0.95 +$$ + +$$ +P(\theta > 0.05) = 1 - (0.05)^2 = 0.9975 +$$ + +These are the sort of intervals we would get from the prior and asking about what their posterior probability is. + +In other cases, we may want to ask, what is the posterior interval of interest? What's an interval that contains 95% of posterior probability in some meaningful way? This would be equivalent then to a frequentest confidence interval. We can do this in several different ways, 2 main ways that we make Bayesian Posterior intervals or credible intervals are equal-tailed intervals and highest posterior density intervals. + +## Equal-tailed Interval + +In the case of an equal-tailed interval, we put the equal amount of probability in each tail. So to make a 95% interval we'll put 0.025 in each tail. + +To be able to do this, we're going to have to figure out what the quantiles are. So we're going to need some value, $q$, so that +$$ +P(\theta < q | Y = 1) = \int_0^9{2\theta d\theta} = q^2 +$$ + +$$ +P(\sqrt{0.025} < \theta < \sqrt{0.975}) = P(0.158 < \theta < 0.987) = 0.95 +$$ + +This is an equal tailed interval in that the probability that $\theta$ is less than 0.18 is the same as the probability that $\theta$ is greater than 0.987. We can say that under the posterior, there's a 95% probability that $\theta$ is in this interval. + +## Highest Posterior Density (HPD) + +Here we want to ask where in the density function is it highest? Theoretically this will be the shortest possible interval that contains the given probability, in this case a 95% probability. +$$ +P(\theta > \sqrt{0.05} | Y = 1) = P(\theta > 0.224 | Y = 1) = 0.95 +$$ +This is the shortest possible interval, that under the posterior has a probability 0.95. it's $\theta$ going from 0.224 up to 1. + + + +The posterior distribution describes our understanding of our uncertainty combinbing our prior beliefs and the data. It does this with a probability density function, so at the end of teh day, we can make intervals and talk about probabilities of data being in the interval. + +This is different from the frequentest approach, where we get confidence intervals. But we can't say a whole lot about the actual parameter relative to the confidence interval. We can only make long run frequency statements about hypothetical intervals. + +In this case, we can legitimately say that the posterior probability that $\theta$ is bigger than 0.05 is $0.9975$. We can also say that we believe there's a 95% probability that $\theta$ is in between 0.158 and 0.987. + + + +Bayesians represent uncertainty with probabilities, so that the coin itself is a physical quantity. It may have a particular value for $\theta$. + +It may be fixed, but because we don't know what that value is, we represent our uncertainty about that value with a distribution. And at the end of the day, we can represent our uncertainty, collect it with the data, and get a posterior distribution and make intuitive statements. + + + +#### + +Frequentest confidence intervals have the interpretation that "If you were to repeat many times the process of collecting data and computing a 95% confidence interval, then on average about 95% of those intervals would contain the true parameter value; however, once you observe data and compute an interval the true value is either in the interval or it is not, but you can't tell which." + +Bayesian credible intervals have the interpretation that "Your posterior probability that the parameter is in a 95% credible interval is 95%." \ No newline at end of file diff --git a/content/notes/bayesianstatistics/week3.md b/content/notes/bayesianstatistics/week3.md new file mode 100644 index 0000000..cb1c1fc --- /dev/null +++ b/content/notes/bayesianstatistics/week3.md @@ -0,0 +1,409 @@ +How do we choose a prior? + +Our prior needs to represent our personal perspective, beliefs, and our uncertainties. + +Theoretically, we're defining a cumulative distribution function for the parameter +$$ +\begin{cases} +P(\theta \le c) & c \in \mathbb{R} +\end{cases} +$$ +This is true for an infinite number of possible sets. This isn't practical to do, and it would be very difficult to do coherently so that all the probabilities were consistent. + +In practice, we work with a convenient family that's sufficiently flexible such that a member of a family represents our beliefs. + +Generally if one has enough data, the information in the data will overwhealm the information in the prior. And so, the prior is not particularly important in terms of what you get for the posterior. Any reasonable choice of prior will lead to approximately the same posterior. However, there are some things that can go wrong. + +## Example of Bad Prior + +Suppose we chose a prior that says the probability of $P(\theta = \frac{1}{2}) = 1$ + +And thus, the probability of $\theta$ equaling any other value is $0$. If we do this, our data won't make a difference since we only put a probability of $1$ at a single point. +$$ +f(\theta|y) \propto f(y|\theta)f(\theta) = f(\theta) = \delta(\theta) +$$ + +In the basic context, events with prior probability of zero have a posterior probability of zero. Events with a prior probability of one, have a posterior probability of one. + +Thus a good Bayesian will not assign probability of zero or one to any event that has already occurred or already known not to occur. + +## Calibration + +A useful concept in terms of choosing priors is that of the calibration of predictive intervals. + +If we make an interval where we're saying we predict 95% of new data points will occur in this interval. It would be good if in reality 95% of new data points actually did fall in that interval. + +How do we calibrate to reality? This is actually a frequentest concept but this is important for practical statistical purposes that our results reflect reality. + +We can compute a predictive interval, this is an interval such that 95% of new observations are expected to fall into it. It's an interval for the **data** rather than an interval for $\theta$ +$$ +f(y) = \int{f(y|\theta)f(\theta)d\theta} = \int{f(y, \theta)d\theta} +$$ +Where $f(y,\theta)$ is the joint density of Y and $\theta$. + +This is the prior predictive before any data is observed. + +**Side Note:** From this you can say that $f(y, \theta) = f(y|\theta)f(\theta)$ + +## Binomial Example + +Suppose we're going to flip a coin ten times and count the number of heads we see. We're thinking about this in advance of actually doing it, so we're interested in the predictive distribution. How many heads do we predict we're going to see? +$$ +X = \sum_{i = 1}^{10}{Y_i} +$$ +Where $Y_i$ is each individual coin flip. + +If we think that all possible coins or all possible probabilities are equally likely, then we can put a prior for $\theta$ that's flat over the interval from 0 to 1. +$$ +f(\theta) = I_{\{0 \le \theta \le 1\}} +$$ + +$$ +f(x) = \int{f(x|\theta)f(\theta)d\theta} = \int_0^1{\frac{10!}{x!(10-x)!}\theta^x(1-\theta)^{10 -x}(1)d\theta} +$$ + +Note that because we're interested in $X$ at the end, it's important that we distinguish between a binomial density and a Bernoulli density. Here we just care about the total count rather than the exact ordering which would be Bernoulli's + +For most of the analyses we're doing, where we're interested in $\theta$ rather than x, the binomial and the Bernoulli are interchangeable because the part in here that depends on $\theta$ is the same. + +To solve this integral let us recall some facts +$$ +n! = \Gamma(n + 1) +$$ + +$$ +Z \sim Beta(\alpha, \beta) +$$ + +$$ +f(z) = \frac{\Gamma(\alpha + \beta)}{\Gamma(\alpha) \Gamma(\beta)}z^{\alpha - 1}(1-z)^{\beta - 1} +$$ + +Let us rewrite $f(x)$ +$$ +f(x) = \int_0^1{\frac{\Gamma(11)}{\Gamma(x + 1)\Gamma(11 - x)}\theta^{(x + 1)-1}(1-\theta)^{(11-x)-1}d\theta} +$$ + +$$ +f(x) = \frac{\Gamma(11)}{\Gamma(12)}\int_0^1{\frac{\Gamma(12)}{\Gamma(x + 1)\Gamma(11 - x)}\theta^{(x + 1)-1}(1-\theta)^{(11-x)-1}d\theta} +$$ + +The integral above is a beta density, all integrals of valid beta densities equals to one. +$$ +f(x) = \frac{\Gamma(11)}{\Gamma(12)} = \frac{10!}{11!} = \frac{1}{11} +$$ +For $x \in {0, 1, 2, \dots, 10}$ + +Thus we see that if we start with a uniform prior, we then end up with a discrete uniform predictive density for $X$. If all possible probabilities are equally likely, then all possible $X$ outcomes are equally likely. + +## Posterior Predictive Distribution + +What about after we've observed data? What's our posterior predictive distribution? + +Going from the previous example, let us observe after one flip that we got a head. We want to ask, what's our predictive distribution for the second flip, given we saw a head on the first flip. +$$ +f(y_2|y_1) = \int{f(y_2|\theta,y_1)f(\theta|y_1)}d\theta +$$ +We're going to assume that $Y_2$ is independent of $Y_1$. Therefore, +$$ +f(y_2 |y_1) = \int{f(y_2|\theta)f(\theta|y_1)d\theta} +$$ +Suppose we're thinking of a uniform distribution for $\theta$ and we observe the first flip is a heads. What do we predict for the second flip? + +This is no longer going to be a uniform distribution like it was before, because we have some data. We're going to think it's more likely that we're going to get a second head. We think this because since we observed a head $\theta$ is now likely to be at least $\frac{1}{2}$ possibly larger. +$$ +f(y_2 | Y_1 = 1) = \int_0^1{\theta^{y_2}(1-\theta)^{1-y_2}2\theta d\theta} +$$ + +$$ +f(y_2|Y_1 = 1) = \int_0^1{2\theta^{y_2 + 1}(1-\theta)^{1-y_2}d\theta} +$$ + +We could work this out in a more general form, but in this case, $Y_2$ has to take the value $0$ or $1$. The next flip is either going to be heads or tails so it's easier to just plop in a particular example. +$$ +P(Y_2 = 1|Y_1 = 1) = \int_0^1{2\theta^2d\theta} = \frac{2}{3} +$$ + +$$ +P(Y_2 = 0 | Y_1 = 1) = 1 - P(Y_2 = 1 | Y_1 = 1) = 1 - \frac{2}{3} = \frac{1}{3} +$$ + +We can see here that the posterior is a combination of the information in the prior and the information in the data. In this case, our prior is like having two data points, one head and one tail. + +Saying we have a uniform prior for $\theta$ is equivalent in an information sense as saying we have observed one head and one tail. + +So then when we observe one head, it's like we now have seen two heads and one tail. So our predictive distribution for the second flip says if we have two heads and one tail, then we have a $\frac{2}{3}$ probability of getting another head and a $\frac{1}{3}$ probability of getting another tail. + +## Binomial Likelihood with Uniform Prior + +Likelihood of y given theta is +$$ +f(y|\theta) = \theta^{\sum{y_i}}(1-\theta)^{n - \sum{y_i}} +$$ + +Our prior for theta is just a uniform distribution +$$ +f(\theta) = I_{\{0 \le \theta \le 1\}} +$$ +Thus our posterior for $\theta$ is +$$ +f(\theta | y) = \frac{f(y|\theta)f(\theta)}{\int{f(y|\theta)f(\theta)d\theta}} = \frac{\theta^{\sum{y_i}}(1-\theta)^{n - \sum{y_i}} I_{\{0 \le \theta \le 1\}}}{\int_0^1{\theta^{\sum{y_i}}(1-\theta)^{n - \sum{y_i}} I_{\{0 \le \theta \le 1\}}d\theta}} +$$ +Recalling the form of the beta distribution we can rewrite our posterior as +$$ +f(\theta | y) = \frac{\theta^{\sum{y_i}}(1-\theta)^{n - \sum{y_i}} I_{\{0 \le \theta \le 1\}}}{\frac{\Gamma(\sum{y_i} + 1)\Gamma(n - \sum{y_i} + 1)}{\Gamma(n + 2)}\int_0^1{\frac{\Gamma(n + 2)}{\Gamma(\sum{y_i} + 1)\Gamma(n - \sum{y_i} + 1)}\theta^{\sum{y_i}}(1-\theta)^{n - \sum{y_i}}d\theta}} +$$ +Since the beta density integrates to $1$, we can simplify this as +$$ +f(\theta | y) = \frac{\Gamma(n + 2)}{\Gamma(\sum{y_i}+ 1)\Gamma(n - \sum{y_i}+ 1)}\theta^{\sum{y_i}}(1-\theta)^{n-\sum{y_i}}I_{\{0 \le \theta \le 1\}} +$$ +From here we can see that the posterior follows a beta distribution +$$ +\theta | y \sim Beta(\sum{y_i} + 1, n - \sum{y_i} + 1) +$$ + +## Conjugate Priors + +The uniform distribution is $Beta(1, 1)$ + +Any beta distribution is conjugate for the Bernoulli distribution. Any beta prior will give a beta posterior. +$$ +f(\theta) = \frac{\Gamma(\alpha + \beta)}{\Gamma(\alpha)\Gamma(\beta)}\theta^{\alpha - 1}(1-\theta)^{\beta -1}I_{\{0 \le \theta \le 1\}} +$$ + +$$ +f(\theta | y) \propto f(y|\theta)f(\theta) = \theta^{\sum{y_i}}(1-\theta)^{n - \sum{y_i}}\frac{\Gamma(\alpha + \beta)}{\Gamma(\alpha)\Gamma(\beta)}\theta^{\alpha - 1}(1 - \theta)^{\beta - 1}I_{\{0 \le \theta \le 1\}} +$$ + +$$ +f(y|\theta)f(\theta) \propto \theta^{\alpha + \sum{y_i}-1}(1-\theta)^{\beta + n - \sum{y_i} - 1} +$$ + +Thus we see that this is a beta distribution +$$ +\theta | y \sim Beta(\alpha + \sum{y_i}, \beta + n - \sum{y_i}) +$$ +When $\alpha$ and $\beta$ is one like in the uniform distribution, then we get the same result as earlier. + + + +This whole process where we choose a particular form of prior that works with a likelihood is called using a conjugate family. + +A family of distributions is referred to as conjugate if when you use a member of that family as a prior, you get another member of that family as your posterior. + +The beta distribution is conjugate for the Bernoulli distribution. It's also conjugate for the binomial distribution. The only difference in the binomial likelihood is that there is a combinatoric term. Since that does not depend on $\theta$, we get the same posterior. + +We often use conjugate priors because they make life much more simpler, sticking to conjugate families allows us to get closed form solutions easily. + +If the family is flexible enough, then you can find a member of that family that closely represents your beliefs. + +## Posterior Mean and Effect Size + +Returning to the beta posterior model it is clear how both the prior and the data contribute to the posterior. + +We can say that the effect size of the prior is $\alpha + \beta$ + +Recall that the expected value or mean of a beta distribution is $\frac{\alpha}{\alpha + \beta}$ + +Therefore we can derive the posterior mean as +$$ +posterior_{mean} = \frac{\alpha + \sum{y_i}}{\alpha + \sum{y_i}+\beta + n - \sum{y_i}}= \frac{\alpha+\sum{y_i}}{\alpha + \beta + n} +$$ +We can further decompose this as +$$ +posterior_{mean} = \frac{\alpha + \beta}{\alpha + \beta + n}\frac{\alpha}{\alpha + \beta} + \frac{n}{\alpha + \beta + n}\frac{\sum{y_i}}{n} +$$ +We can describe this as the (prior weight * prior mean) + (data weight * data mean) + +The posterior mean is a weighted average of the prior mean and the data mean. + +This effective sample size gives you an idea of how much data you would need to make sure that your prior doesn't have much influence on your posterior. + +If $\alpha + \beta$ is small compared to $n$ then the posterior will largely just be driven by the data. If $\alpha + \beta$ is large relative to $n$ then the posterior will be largely driven by the prior. + +We can make a 95% credible interval using our posterior distribution for $\theta$. We can find an interval that actually has 95% probability of containing $\theta$. + +Using Bayesian Statistics we can chain together dong a sequential update every time we get new data. We can get a new posterior, and we just use our previous posterior as a prior to do another update using Baye's theorem. + +## Data Analysis Example in R + +Suppose we're giving two students a multiple-choice exam with 40 questions, where each question has four choices. We don't know how much the students have studied for this exam, but we think that they'll do better than just guessing randomly + +1) What are the parameters of interest? + +The parameters of interests are $\theta_1 = true$ the probability that the first student will answer a question correctly, $\theta_2 = true$ the probability that the second student will answer a question correctly. + +2) What is our likelihood? + +The likelihood is $Binomial(40, \theta)$, if we assume that each question is independent and that the probability a student gets each question right is the same for all questions for that student. + +3) What prior should we use? + +The conjugate prior is a beta prior. We can plot the density with `dbeta` + +```R +theta = seq(from = 0, to = 1, by = 0.1) +# Uniform +plot(theta, dbeta(theta, 1, 1), type = 'l') +# Prior mean 2/3 +plot(theta, dbeta(theta, 4, 2), type = 'l') +# Prior mean 2/3 but higher effect size (more concentrated at mean) +plot(theta, dbeta(theta, 8, 4), type = 'l') +``` + +4 ) What are the prior probabilities $P(\theta > 0.25)$? $P(\theta > 0.5)$? $P(\theta > 0.8)$? + +```R +1 - pbeta(0.25, 8, 4) +#[1] 0.998117 +1 - pbeta(0.5, 8, 4) +#[1] 0.8867188 +1 - pbeta(0.8, 8, 4) +#[1] 0.16113392 +``` + + + +5) Suppose the first student gets 33 questions right. What is the posterior distribution for $\theta_1$? $P(\theta > 0.25)$? $P(\theta > 0.5)$? $P(\theta > 0.8)$? What is the 95% posterior credible interval for $\theta_1$? +$$ +Posterior \sim Beta(8 + 33, 4 + 40 - 33) = Beta(41, 11) +$$ +With a posterior mean of $\frac{41}{41+11} = \frac{41}{52}$ + +We can plot the posterior distribution with the prior + +```R +plot(theta, dbeta(theta, 41, 11), type = 'l') +lines(theta, dbeta(theta, 8 ,4), lty = 2) #Dashed line for prior +``` + +Posterior probabilities + +```R +1 - pbeta(0.25, 41, 11) +#[1] 1 +1 - pbeta(0.5, 41, 11) +#[1] 0.9999926 +1 - pbeta(0.8, 41, 11) +#[1] 0.4444044 +``` + +Equal tailed 95% credible interval + +```R +qbeta(0.025, 41, 11) +#[1] 0.6688426 +qbeta(0.975, 41, 11) +#[1] 0.8871094 +``` + +95% confidence that $\theta_1$ is between 0.67 and 0.89 + + + +6) Suppose the second student gets 24 questions right. What is the posterior distribution for $\theta_2$? $P(\theta > 0.25)$? $P(\theta > 0.5)$? $P(\theta > 0.8)$? What is the 95% posterior credible interval for $\theta_2$ +$$ +Posterior \sim Beta(8 + 24, 4 + 40 - 24) = Beta(32, 20) +$$ +With a posterior mean of $\frac{32}{32+20} = \frac{32}{52}$ + +We can plot the posterior distribution with the prior + +```R +plot(theta, dbeta(theta, 32, 20), type = 'l') +lines(theta, dbeta(theta, 8 ,4), lty = 2) #Dashed line for prior +``` + +Posterior probabilities + +```R +1 - pbeta(0.25, 32, 20) +#[1] 1 +1 - pbeta(0.5, 32, 20) +#[1] 0.9540427 +1 - pbeta(0.8, 32, 20) +#[1] 0.00124819 +``` + +Equal tailed 95% credible interval + +```R +qbeta(0.025, 32, 20) +#[1] 0.4808022 +qbeta(0.975, 32, 20) +#[1] 0.7415564 +``` + +95% confidence that $\theta_1$ is between 0.48 and 0.74 + + + +7) What is the posterior probability that $\theta_1 > \theta_2$? i.e., that the first student has a better chance of getting a question right than the second student? + +Estimate by simulation: draw 1,000 samples from each and see how often we observe $\theta_1 > \theta_2$ + +```R +theta1 = rbeta(100000, 41, 11) +theta2 = rbeta(100000, 32, 20) +mean(theta1 > theta2) +#[1] 0.975 +``` + +## Poisson Data (Chocolate Chip Cookie Example) + +In mass produced chocolate chip cookies, they make a large amount of dough. They mix in a large number of chips, mix it up really well and then chunk out individual cookies. In this process, the number of chips per cookie approximately follow a Poisson distribution. + +If we were to assume that chips have no volume, then this would be exactly a Poisson process and follow exactly a Poisson distribution. In practice, however, chips aren't that big so they follow approximately a Poisson distribution for the number of chips per cookie. +$$ +Y_i \sim Poisson(\lambda) +$$ + +$$ +f(y|\lambda) = \frac{\lambda^{\sum{y_i}}e^{-n\lambda}}{\prod_{i = 1}^n{y_i!}} +$$ + +This is for $\lambda > 0$ + +What type of prior should we put on $\lambda$? It would be convenient if we could put a conjugate prior. What distribution looks like lambda raised to a power and e raised to a negative power? + +For this, we're going to use a Gamma prior. +$$ +\lambda \sim \Gamma(\alpha, \beta) +$$ + +$$ +f(\lambda) = \frac{\beta^\alpha}{\Gamma(\alpha)}\lambda^{\alpha - 1}e^{-\beta\lambda} +$$ + +$$ +f(\lambda | y) \propto f(y|\lambda)f(\lambda) \propto \lambda^{\sum{y_i}}e^{-n\lambda}\lambda^{\alpha - 1}e^{-\beta \lambda} +$$ + +$$ +f(\lambda | y) \propto \lambda^{\alpha + \sum{y_i} - 1}e^{-(\beta + n)\lambda} +$$ + +Thus we can see that the posterior is a Gamma Distribution +$$ +\lambda|y \sim \Gamma(\alpha + \sum{y_i}, \beta + n) +$$ +The mean of Gamma under this parameterization is $\frac{\alpha}{\beta}$ + +The posterior mean is going to be +$$ +posterior_{mean} = \frac{\alpha + \sum{y_i}}{\beta + n} = \frac{\beta}{\beta + n}\frac{\alpha}{\beta} + \frac{n}{\beta + n}\frac{\sum{y_i}}{n} +$$ +As you can see here the posterior mean of the Gamma distribution is also the weighted average of the prior mean and the data mean. + +Let us present two strategies on how to choose our hyper parameters $\alpha$ and $\beta$ + +1. Think about the prior mean. For example, what do you think the number of chips per cookie on average is? + +After this, we need some other piece of knowledge to pin point both parameters. Here are some options. + +- What is your error on the number of chips per cookie? In other words, what do you think the standard deviation. Under the Gamma prior the standard deviation is $\frac{\sqrt{\alpha}}{\beta}$ +- What is the effective sample size $\beta$? How many units of information do you think we have in our prior versus our data points. + +2. In Bayesian Statistics, a vague prior refers to one that's relatively flat across much of the space. For a Gamma prior we can choose $\Gamma(\epsilon, \epsilon)$ where $\epsilon$ is small and strictly positive. + +This would create a distribution with a mean of 1 and a huge standard deviation across the whole space. Hence the posterior will be largely driven by the data and very little by the prior. \ No newline at end of file diff --git a/content/notes/bayesianstatistics/week4.md b/content/notes/bayesianstatistics/week4.md new file mode 100644 index 0000000..d2d4038 --- /dev/null +++ b/content/notes/bayesianstatistics/week4.md @@ -0,0 +1,617 @@ +## Exponential Data + +Suppose you're waiting for a bus that you think comes on average once every 10 minutes, but you're not sure exactly how often it comes. +$$ +Y \sim Exp(\lambda) +$$ +Your waiting time has a prior expectation of $\frac{1}{\lambda}$ + + + +It turns out the gamma distribution is conjugate for an exponential likelihood. We need to specify a prior, or a particular gamma in this case. If we think that the buses come on average every ten minutes, that's a rate of one over ten. +$$ +prior_{mean} = \frac{1}{10} +$$ +Thus, we'll want to specify a gamma distribution so that the first parameter divded by the second parameter is $\frac{1}{10}$ + +We can now think about our variability. Perhaps you specify +$$ +\Gamma(100, 1000) +$$ +This will indeed have a prior mean of $\frac{1}{10}$ and it'll have a standard deviation of $\frac{1}{100}$. If you want to have a rough estimate of our mean plus or minus two standard deviations then we have the following +$$ +0.1 \pm 0.02 +$$ +Suppose that we wait for 12 minutes and a bus arrives. Now you want to update your posterior for $\lambda$ about how often this bus will arrive. +$$ +f(\lambda | y) \propto f(y|\lambda)f(\lambda) +$$ + +$$ +f(\lambda | y) \propto \lambda e^{-\lambda y}\lambda^{\alpha - 1}e^{-\beta \lambda} +$$ + +$$ +f(\lambda | y) \propto \lambda^{(\alpha + 1) - 1}e^{-(\beta + y)\lambda} +$$ + +$$ +\lambda | y \sim \Gamma(\alpha + 1, \beta + y) +$$ + +Plugging in our particular prior gives us a posterior for $\lambda$ which is +$$ +\lambda | y \sim \Gamma(101, 1012) +$$ +Thus our posterior mean is going to be $\frac{101}{1012} Which is equal to 0.0998. + + + +This one observation doesn't contain a lot of data under this likelihood. When the bus comes and it takes 12 minutes instead of 10, it barely shifts our posterior mean up. One data point doesn't have a big impact here. + + + +## Normal/Gaussian Data + +Let's suppose the standard deviation or variance is known and we're only interested in learning about the mean. This is the situation that often arises in monitoring industrial production processes. +$$ +X_i \sim N(\mu, \sigma^2) +$$ +It turns out that the Normal distribution is conjugate for itself when looking for the mean parameter + +Prior +$$ +\mu \sim N(m_0,S_0^2) +$$ + +$$ +f(\mu |x ) \propto f(x|\mu)f(\mu) +$$ + +$$ +\mu | x \sim N(\frac{n\bar{x}/\sigma_0^2 + m_0/s_0^2}{n/\sigma_0^2 + 1/s_0^2}, \frac{1}{n/\sigma_0^2 + 1/s_0^2}) +$$ + +Let's look at the posterior mean +$$ +posterior_{mean} = \frac{n/\sigma_0^2}{n/\sigma_0^2 + 1/s_0^2}\bar{x} + \frac{1/s_0^2}{n/\sigma_0^2 + 1/s_0^2} +$$ + +$$ +posterior_{mean} = \frac{n}{n + \sigma_0^2/s_0^2}\bar{x} + \frac{\sigma_0^2/s_0^2}{n + \sigma_0^2/s_0^2} +$$ + +Thus we see, that the posterior mean is a weighted average of the prior mean and the data mean. And indeed that the effective sample size for this prior is the ratio of the variance for the data to the variance in the prior. + +This makes sense, because the larger the variance of the prior, the less information that's in it. + +The marginal distribution for Y is +$$ +N(m_0, s_0^2 + \sigma^2) +$$ + +### When $\mu$ and $\sigma^2$ is unknown + +$$ +X_i | \mu, \sigma^2 \sim N(\mu, \sigma^2) +$$ + +A prior from $\mu$ conditional on the value for $\sigma^2$ +$$ +\mu | \sigma^2 \sim N(m, \frac{\sigma^2}{w}) +$$ +$w$ is going to be the ratio of $\sigma^2$ and some variance for the Normal distribution. This is the effective sample size of the prior. + +Finally, the last step is to specify a prior for $\sigma^2$. The conjugate prior here is an inverse gamma distribution with parameters $\alpha$ and $\beta$. +$$ +\sigma^2 \sim \Gamma^{-1}(\alpha, \beta) +$$ +After many calculations... we get the posterior distribution +$$ +\sigma^2 | x \sim \Gamma^{-1}(\alpha + \frac{n}{2}, \beta + \frac{1}{2}\sum_{i = 1}^n{(x-\bar{x}^2 + \frac{nw}{2(n+2)}(\bar{x} - m)^2)}) +$$ + +$$ +\mu | \sigma^2,x \sim N(\frac{n\bar{x}+wm}{n+w}, \frac{\sigma^2}{n + w}) +$$ + +Where the posterior mean can be written as the weighted average of the prior mean and the data mean. +$$ +\frac{n\bar{x}+wm}{n+w} = \frac{w}{n + w}m + \frac{n}{n + w}\bar{x} +$$ +In some cases, we really only care about $\mu$. We want some inference on $\mu$ and we may want it such that it doesn't depend on $\sigma^2$. We can marginalize that $\sigma^2$ integrating it out. The posterior for $\mu$ marginally follows a $t$ distribution. +$$ +\mu | x \sim t +$$ +Similarly the posterior predictive distribution also is a $t$ distribution. + +Finally, note that we can extend this in various directions, this can be extended to the multivariate normal case that requires matrix vector notations and can be extended in a hierarchial fashion if we want to specify priors for $m$, $w$ and $\beta$ + +## Non Informative Priors + +We've seen examples of choosing priors that contain a significant amount of information. We've also seen some examples of choosing priors where we're attempting to not put too much information in to keep them vague. + +Another approach is referred to as objective Bayesian statistics or inference where we explicitly try to minimize the amount of information that goes into the prior. + +This is an attempt to have the data have maximum influence on the posterior + +Let's go back to coin flipping +$$ +Y_i \sim B(\theta) +$$ +How do we minimize our prior information in $\theta$? One obvious intuitive approach is to say that all values of $\theta$ are equally likely. So we could have a piror for $\theta$ which follows a uniform distribution on the interval $[0, 1]$ + +Saying all values of $\theta$ are equally likely **seems** like it would have no information in it. + +Recall however, that a $Uniform(0, 1)$ is the same as $Beta(1, 1)$ + +The effective sample size of a beta prior is the sum of its two parameters. So in this case, it has an effective sample size of 2. This is equivalent to data, with one head and one tail already in it. + +So this is not a completely non informative prior. + +We could think about a prior that has less information. For example $Beta(\frac{1}{2}, \frac{1}{2})$, this would have half as much information with an effective sample size of one. + +We can take this even further. Think about something like $Beta(0.001, 0.001)$ This would have much less information, with the effective sample size fairly close to zero. In this case, the data would determine the posterior and there would be very little influence from the prior. + +###Improper priors + +Can we go even further? We can think of the limiting case. Let's think of $Beta(0,0)$, what would that look like? +$$ +f(\theta) \propto \theta^{-1}(1-\theta)^{-1} +$$ +This is not a proper density. If you integrate this over $(0,1)$, you'll get an infinite integral, so it's not a true density in the sense of it not integrating to 1. + +There's no way to normalize it, since it has an infinite integral. This is what we refer to as an improper prior. + +It's improper in the sense that it doesn't have a proper density. But it's not necessarily imporper in the sense that we can't use it. If we collect data, we use this prior and as long as we observe one head and one tail, or **at least one success and one failure**. Then we can get a posterior +$$ +f(\theta|y) \propto \theta^{y-1}(1-\theta)^{n-y-1} \sim Beta(y, n-y) +$$ +With a posterior mean of $\frac{y}{n} =\hat{\theta}$, which you should recognize as the maximum likelihood estimate. So by using this improper prior, we get a posterior which gives us point estimates exactly the same as the frequentest approach. + +But in this case, we can also think of having a full posterior. From this, we can make interval statements, probability statements, and we can actually find an interval and say that there's 95% probability that $\theta$ is in this interval. Which is not something you can do under the frequentest approach even though we may get the same exact interval. + +### Statements about improper priors + +Improper priors are okay as long as the posterior itself is proper. There may be some mathematical things that need to be checked and you may need to have certain restrictions on the data. In this case, we needed to make sure that we observed at least one head and one tail to get a proper posterior. + +But as long as the posterior is proper, we can go forwards and do Bayesian inference even with an improper prior. + +The second point is that for many problems there does exist a prior, typically an improper prior that will lead to the same point estimates as you would get under the frequentest paradigm. So we can get very similar results, results that are fully dependent on the data, under the Bayesian approach. + +But in this case, we can also have continue to have a posterior and make posterior interval estimates and talk about posterior probabilities of the parameter. + +### Normal Case + +Another example is thinking about the normal case. +$$ +Y_i \stackrel{iid}\sim N(\mu, \sigma^2) +$$ +Let's start off by assuming that $\sigma^2$ is known and we'll just focus on the mean $\mu$. + +We can think about a vague prior like before and say that +$$ +\mu \sim N(0, 1000000^2) +$$ +This would just spread things out across the real line. That would be a fairly non informative prior covering a lot of possibilities. We can then think about taking the limit, what happens if we let the variance go to $\infty$. In that case, we're basically spreading out this distribution across the entire real number line. We can say that the density is just a constant across the whole real line. +$$ +f(\mu) \propto 1 +$$ +This is an improper prior because if you integrate the real line you get an infinite answer. However, if we go ahead and find the posterior +$$ +f(\mu|y) \propto f(y|\mu)f(\mu) \propto exp(-\frac{1}{2\sigma^2}\sum{(y_i - \mu)^2})(1) +$$ + +$$ +f(\mu | y) \propto exp(-\frac{1}{2\sigma^2/n}(\mu - \bar{y})^2) +$$ + +$$ +\mu | y \sim N(\bar{y}, \frac{\sigma^2}{n}) +$$ + +This should look just like the maximum likelihood estimate. + +### Unknown Variance + +In the case that $\sigma^2$ is unknown, the standard non informative prior is +$$ +f(\sigma^2) \propto \frac{1}{\sigma^2} +$$ + +$$ +\sigma^2 \sim \Gamma^{-1}(0,0) +$$ + +This is an improper prior and it's uniform on the log scale of $\sigma^2$. + +In this case, we'll end up with a posterior for $\sigma^2$ +$$ +\sigma^2|y \sim \Gamma^{-1}(\frac{n-1}{2}, \frac{1}{2}\sum{(y_i - \bar{y})^2}) +$$ +This should also look reminiscent of quantities we get as a frequentest. For example, the samples standard deviation + +## Jeffreys Prior + +Choosing a uniform prior depends upon the particular parameterization. + +Suppose I used a prior which is uniform on the log scale for $\sigma^2$ +$$ +f(\sigma^2) \propto \frac{1}{\sigma^2} +$$ +Suppose somebody else decides, that they just want to put a uniform prior on $\sigma^2$ itself. +$$ +f(\sigma^2) \propto 1 +$$ +These are both uniform on certain scales or certain parameterizations, but they are different priors. So when we compute the posteriors, they will be different as well. + + The key thing is that uniform priors are not invariant with respect to transformation. Depending on how you parameterize the problem, you can get different answers by using a uniform prior + +One attempt to round this out is to use Jeffrey's Prior + +Jeffrey's Prior is defined as the following +$$ +f(\theta) \propto \sqrt{\mathcal{I(\theta)}} +$$ +Where $\mathcal{I}(\theta)$ is the fisher information of $\theta$. In most cases, this will be an improper prior. + +### Normal Data + +For the example of Normal Data +$$ +Y_i \sim N(\mu, \sigma^2) +$$ + +$$ +f(\mu) \propto 1 +$$ + +$$ +f(\sigma^2) \propto \frac{1}{\sigma^2} +$$ + +Where $\mu$ is uniform and $\sigma^2$ is uniform on the log scale. + +This prior will then be transformation invariant. We will end up putting the same information into the prior even if we use a different parameterization for the Normal. + +### Binomial + +$$ +Y_i \sim B(\theta) +$$ + +$$ +f(\theta) \propto \theta^{-\frac{1}{2}}(1-\theta)^{-\frac{1}{2}} \sim Beta(\frac{1}{2},\frac{1}{2}) +$$ + +This is a rare example of where the Jeffreys prior turns out to be a proper prior. + +You'll note that this prior actually does have some information in it. It's equivalent to an effective sample size of one data point. However, this information will be the same, not depending on the parameterization we use. + +In this case, we have $\theta$ as a probability, but another alternative which is sometimes used is when we model things on a logistics scale. + +By using the Jeffreys prior, we'll maintain the exact same information. + +### Closing information about priors + +Other possible approaches to objective Bayesian inference includes priors such as reference priors and maximum entropy priors. + +A related concept to this is called empirical Bayesian analysis. The idea in empirical Baye's is that you use the data to help inform your prior; such as by using the mean of the data to set the mean of the prior distribution. This approach often leads to reasonable point estimates in your posterior. However, it's sort of cheating since you're using your data twice and as a result may lead to improper uncertainty estimates. + +## Fisher Information + +The Fisher information (for one parameter) is defined as +$$ +\mathcal{I}(\theta) = E[(\frac{d}{d\theta}log{(f(X|\theta))})^2] +$$ +Where the expectation is taken with respect to $X$ which has PDF $f(x|\theta)$. This quantity is useful in obtaining estimators for $\theta$ with good properties, such as low variance. It is also the basis for Jeffreys prior. + +**Example:** Let $X | \theta \sim N(\theta, 1)$. Then we have +$$ +f(x|\theta) = \frac{1}{\sqrt{2\pi}}exp[-\frac{1}{2}(x-\theta)^2] +$$ + +$$ +\log{(f(x|\theta))} = -\frac{1}{2}\log{(2\pi)}-\frac{1}{2}(x-\theta)^2 +$$ + +$$ +(\frac{d}{d\theta}log{(f(x|\theta))})^2 = (x-\theta)^2 +$$ + +and so $\mathcal{I}(\theta) = E[(X - \theta)^2] = Var(X) = 1$ + +## Linear Regression + +###Brief Review of Regression + +Recall that linear regression is a model for predicting a response or dependent variable ($Y$, also called an output) from one or more covariates or independent variables ($X$, also called explanatory variables, inputs, or features). For a given value of a single $x$, the expected value of $y$ is +$$ +E[y] = \beta_0 + \beta_1x +$$ +or we could say that $Y \sim N(\beta_0 + \beta_1x, \sigma^2)$. For data $(x_1, y_1), \dots , (x_n, y_n)$, the fitted values for the coefficients, $\hat{\beta_0}$ and $\hat{\beta_1}$ are those that minimize the sum of squared errors $\sum_{i = 1}^n{(y_i - \hat{y_i})^2}$, where the predicted values for the response are $\hat{y} = \hat{\beta_0} + \hat{\beta_1}x$. We can get these values from R. These fitted coefficients give the least-squares line for the data. + +This model extends to multiple covariates, with one $\beta_j$ for each $k$ covariates +$$ +E[y_i] = \beta_0 + \beta_1x_{i1} + \dots + \beta_kx_{ik} +$$ +Optionally, we can represent the multivariate case using vector-matrix notation. + +### Conjugate Modeling + +In the Bayesian framework, we treat the $\beta$ parameters as unknown, put a prior on them, and then find the posterior. We might treat $\sigma^2$ as fixed and known, or we might treat it as an unknown and also put a prior on it. Because the underlying assumption of a regression model is that the errors are independent and identically normally distributed with mean $0$ and variance $\sigma^2$, this defines a normal likelihood. + +#### $\sigma^2$ known + +Sometimes we may know the value of the error variance $\sigma^2$. This simplifies calculations. The conjugate prior for the $\beta$'s is a normal prior. In practice, people typically use a non-informative prior, i.e., the limit as the variance of the normal prior goes to infinity, which has the same mean as the standard least-squares estimates. If we are only estimating $\beta$ and treating $\sigma^2$ as known, then the posterior for $\beta$ is a (multivariate) normal distribution. If we just have a single covariate, then the posterior for the slope is +$$ +\beta_1 | y \sim N(\frac{\sum_{i = 1}^n{(x_i-\bar{x})(y_i - \bar{y})}}{\sum_{i=1}^n{(x_i-\bar{x})^2}}, \frac{\sigma^2}{\sum_{i=1}^n{(x_i - \bar{x})^2}}) +$$ +If we have multiple covariates, then using a matrix-vector notation, the posterior for the vector of coefficients is +$$ +\beta | y \sim N((X^tX)^{-1}X^ty, (X^tX)^{-1}\sigma^2) +$$ +where $X$ denotes the design matrix and $X^t$ is the transpose of $X$. The intercept is typically included in $X$ as a column of $1$'s. Using an improper prior requires us to have at least as many data points as we have parameters to ensure that the posterior is proper. + +#### $\sigma^2$ Unknown + +If we treat both $\beta$ and $\sigma^2$ as unknown, the standard prior is the non-informative Jeffreys prior, $f(\beta, \sigma^2) \propto \frac{1}{\sigma^2}$. Again, the posterior mean for $\beta$ will be the same as the standard least-squares estimates. The posterior for $\beta$ conditional on $\sigma^2$ is the same normal distributions as when $\sigma^2$ is known, but the marginal posterior distribution for $\beta$, with $\sigma^2$ integrated out is a $t$ distribution, analogous to the $t$ tests for significance in standard linear regression. The posterior $t$ distribution has mean $(X^tX)^{-1}X^ty$ and scale matrix (related to the variance matrix) $s^2(X^tX)^{-1}$, where $s^2 = \sum_{i = 1}^n{(y_i - \hat{y_i})^2/(n - k - 1)}$. The posterior distribution for $\sigma^2$ is an inverse gamma distribution +$$ +\sigma^2 | y \sim \Gamma^{-1}(\frac{n - k - 1}{2}, \frac{n - k - 1}{2}s^2) +$$ +In the simple linear regression case (single variable), the marginal posterior for $\beta$ is a $t$ distribution with mean $\frac{\sum_{i = 1}^n{(x_i-\bar{x})(y_i - \bar{y})}}{\sum_{i=1}^n{(x_i-\bar{x})^2}}$ and scale $ \frac{s^2}{\sum_{i=1}^n{(x_i - \bar{x})^2}}$. If we are trying to predict a new observation at a specified input $x^*$, that predicted value has a marginal posterior predictive distribution that is a $t$ distribution, with mean $\hat{y} = \hat{\beta_0} + \hat{\beta_1}x^*$ and scale $se_r\sqrt{1 + \frac{1}{n} + \frac{(x^* - \bar{x})^2}{(n - 1)s_x^2}}$. $se_r$ is the residual standard error of the regression, which can be found easily in R. $s_x^2$ is the sample variance of $x$. Recall that the predictive distribution for a new observation has more variability than the posterior distribution for $\hat{y}$ , because individual observations are more variable than the mean. + +## Linear Regression + +### Single Variable Regression + +We'll be looking at the Challenger dataset. It contains 23 past launches where it has the temperature at the day of launch and the O-ring damage index + +http://www.randomservices.org/random/data/Challenger2.txt +Read in the data + +```R +oring=read.table("http://www.randomservices.org/random/data/Challenger2.txt", + header=T) +# Note that attaching this masks T which is originally TRUE +attach(oring) +``` + +Now we'll see the plot + +```R +plot(T, I) +``` + +![Challenger](files/courses/BayesianStatistics/Challenger.png) + +Fit a linear model + +```R +oring.lm=lm(I~T) +summary(oring.lm) +``` + +Output of the summary + +``` +Call: +lm(formula = I ~ T) + +Residuals: + Min 1Q Median 3Q Max +-2.3025 -1.4507 -0.4928 0.7397 5.5337 + +Coefficients: + Estimate Std. Error t value Pr(>|t|) +(Intercept) 18.36508 4.43859 4.138 0.000468 +T -0.24337 0.06349 -3.833 0.000968 + +(Intercept) *** +T *** +--- +Signif. codes: +0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1 + +Residual standard error: 2.102 on 21 degrees of freedom +Multiple R-squared: 0.4116, Adjusted R-squared: 0.3836 +F-statistic: 14.69 on 1 and 21 DF, p-value: 0.0009677 +``` + +Add the fitted line into the scatterplot + +```R +lines(T,fitted(oring.lm)) +``` + +![challengerfitted](files/courses/BayesianStatistics/challengerfitted.png) + +Create a 95% posterior interval for the slope + +```R +-0.24337 - 0.06349*qt(.975,21) +# [1] -0.3754047 +-0.24337 + 0.06349*qt(.975,21) +# [1] -0.1113353 +``` + +**Note:** These are the same as the frequentest confidence intervals + +If the challenger launch was at 31 degrees Fahrenheit, how much O-Ring damage would we predict? + +```R +coef(oring.lm)[1] + coef(oring.lm)[2]*31 +# [1] 10.82052 +``` + +Let's make our posterior prediction interval + +```R +predict(oring.lm,data.frame(T=31),interval="predict") +``` + +Output of `predict` + +``` + fit lwr upr +1 10.82052 4.048269 17.59276 +``` + +We can calculate the lower bound through the following formula + +```R +10.82052-2.102*qt(.975,21)*sqrt(1+1/23+((31-mean(T))^2/22/var(T))) +``` + +What's the posterior probability that the damage index is greater than zero? + +```R +1-pt((0-10.82052)/(2.102*sqrt(1+1/23+((31-mean(T))^2/22/var(T)))),21) +``` + +### Multivariate Regression + +We're looking at Galton's seminal data predicting the height of children from the height of the parents + +http://www.randomservices.org/random/data/Galton.txt +Read in the data + +```R +heights=read.table("http://www.randomservices.org/random/data/Galton.txt", + header=T) +attach(heights) +``` + +What are the columns in the dataset? + +```R +names(heights) +# [1] "Family" "Father" "Mother" "Gender" "Height" "Kids" +``` + +Let's look at the relationship between the different variables + +```R +pairs(heights) +``` + +![heightpairs](files/courses/BayesianStatistics/heightpairs.png) + +First let's start by creating a linear model taking all of the columns into account + +```R +summary(lm(Height~Father+Mother+Gender+Kids)) +``` + +Output of `summary` + +``` +Call: +lm(formula = Height ~ Father + Mother + Gender + Kids) + +Residuals: + Min 1Q Median 3Q Max +-9.4748 -1.4500 0.0889 1.4716 9.1656 + +Coefficients: + Estimate Std. Error t value Pr(>|t|) +(Intercept) 16.18771 2.79387 5.794 9.52e-09 +Father 0.39831 0.02957 13.472 < 2e-16 +Mother 0.32096 0.03126 10.269 < 2e-16 +GenderM 5.20995 0.14422 36.125 < 2e-16 +Kids -0.04382 0.02718 -1.612 0.107 + +(Intercept) *** +Father *** +Mother *** +GenderM *** +Kids +--- +Signif. codes: +0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1 + +Residual standard error: 2.152 on 893 degrees of freedom +Multiple R-squared: 0.6407, Adjusted R-squared: 0.6391 +F-statistic: 398.1 on 4 and 893 DF, p-value: < 2.2e-16 +``` + +As you can see here, the `Kids` column is not significant. Let's look at a model with it removed. + +```R +summary(lm(Height~Father+Mother+Gender)) +``` + +Output of `summary` + +``` +Call: +lm(formula = Height ~ Father + Mother + Gender) + +Residuals: + Min 1Q Median 3Q Max +-9.523 -1.440 0.117 1.473 9.114 + +Coefficients: + Estimate Std. Error t value Pr(>|t|) +(Intercept) 15.34476 2.74696 5.586 3.08e-08 +Father 0.40598 0.02921 13.900 < 2e-16 +Mother 0.32150 0.03128 10.277 < 2e-16 +GenderM 5.22595 0.14401 36.289 < 2e-16 + +(Intercept) *** +Father *** +Mother *** +GenderM *** +--- +Signif. codes: +0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1 + +Residual standard error: 2.154 on 894 degrees of freedom +Multiple R-squared: 0.6397, Adjusted R-squared: 0.6385 +F-statistic: 529 on 3 and 894 DF, p-value: < 2.2e-16 +``` + +This model looks good, let's go ahead and save it to a variable + +```R +heights.lm=lm(Height~Father+Mother+Gender) +``` + +From this we can tell that for each extra inch of height in a father is correlated with an extra 0.4 inches extra to the height of a child. + +We can also tell that each extra inch of height in a mother is correlated with an extra 0.3 inches extra to the height of the child. + +A male child is on average 5.2 inches taller than a female child. + +Let's create a 95% posterior interval for the difference in height by gender + +```R +5.226 - 0.144*qt(.975,894) +# [1] 4.943383 +5.226 + 0.144*qt(.975,894) +# [1] 5.508617 +``` + +Let's make a posterior prediction interval for a male and female with a father whose 68 inches and a mother whose 64 inches. + +```R +predict(heights.lm,data.frame(Father=68,Mother=64,Gender="M"), + interval="predict") + +# fit lwr upr +# 1 68.75291 64.51971 72.9861 +``` + +```R +predict(heights.lm,data.frame(Father=68,Mother=64,Gender="F"), + interval="predict") + +# fit lwr upr +# 1 63.52695 59.29329 67.76062 +``` + + + +## What's next? + +This concludes this course, if you want to go further with Bayesian statistics, the next topics to explore would be hierarchal modeling and fitting of non conjugate models with Markov Chain Monte Carlo or MCMC. diff --git a/content/notes/quadraticcongruences.md b/content/notes/quadraticcongruences.md new file mode 100644 index 0000000..594faea --- /dev/null +++ b/content/notes/quadraticcongruences.md @@ -0,0 +1,82 @@ +# Handy Quadratic Congruences Facts + +## Number of Solutions + +For congruences mod 2 + +**Proposition 16.1**. Let $f(x) = ax^2 + bx + c$ with $a$ odd, and let $\Delta = b^2 - 4ac$ be the discriminant of $f(x)$. Then, + +1. If $\Delta \equiv 1$ (mod $8$), so that $b$ is odd and $c$ is even, then $f(x) \equiv 0$ (mod $2$) has **two** solutions +2. If $\Delta \equiv 5$ (mod $8$), so that $b$ and $c$ are odd, then $f(x) \equiv 0$ (mod $2$) has **no** solutions +3. If $4 | \Delta$ , so that $b$ is even, then $f(x) \equiv 0$ (mod $2$) has exactly **one** solution. + +**Proposition 16.2.** Let $p$ be an odd prime and let $a$ be an integer. Then, + +1. If $p$ does not divide $a$, then the congruence $x^2 \equiv a$ (mod $p$) has either two solutions or no solutions. +2. If $p$ divides $a$, then $x^2 \equiv a$ (mod $p$) has exactly one solution, namely $x = 0$. + +**Legendre symbol definition**. Let $p$ be an odd prime and $a$ any integer. Then the *Legendre symbol*, written as $(\frac{a}{p})$ is defined as +$$ +(\frac{a}{p}) = \begin{cases} +1, & \text{if $x^2 \equiv a$ (mod $p$) has exactly two solutions,} \\ +0, & \text{if $x^2 \equiv a$ (mod $p$) has exactly one solution,} \\ +-1, & \text{if $x^2 \equiv a$ (mod $p$) has no soultions.} +\end{cases} +$$ +**Properties of Legendre symbol**. + +- $(\frac{a}{p}) = 0 \iff p$ divides $a$ + +- $(\frac{1}{p}) = 1$ for every odd prime $p$ + +- $a \equiv b$ (mod $p$) $\implies$ $(\frac{a}{p}) = (\frac{b}{p})$ + +- $(\frac{ab}{p}) = (\frac{a}{p})(\frac{b}{p})$ + +- If $p$ is an odd prime then, + + - $$ + (\frac{-1}{p}) = + \begin{cases} + 1, & \text{if $p \equiv 1$ (mod $4$)} \\ + -1, & \text{ if $p \equiv 3$ (mod $4$)} + \end{cases} + $$ + +- If $p$ is an odd prime then, + + - $$ + (\frac{2}{p}) = + \begin{cases} + 1, & \text{if $p \equiv 1$ (mod $8$) or $p \equiv 7$ (mod $8$)} \\ + -1, & \text{ if $p \equiv 3$ (mod $8$) or $p \equiv 5$ (mod $8$)} + \end{cases} + $$ + +- **Quadratic Reciprocity Theorem**. Let $p$ and $q$ be distinct odd primes. Then, + + - $$ + (\frac{q}{p}) = + \begin{cases} + (\frac{p}{q}), & \text{if $p \equiv 1$ (mod $4$) or $q \equiv 1$ (mod $4$)} \\ + -(\frac{p}{q}), & \text{ if $p \equiv 3$ (mod $4$) and $q \equiv 3$ (mod $4$)} + \end{cases} + $$ + +## Procedure + +When $p$ is an odd prime, a quadratic congruence $ax^2 + bx + c \equiv 0$ (mod $p$) can be transformed into a specialized form by completing the square. +\begin{align*} +ax^2 + bx + c \equiv 0 \text{ (mod $p$)} &\iff 4a(ax^2 + bx + c) \equiv 0 \text{ (mod $p$)} \\\\ +&\iff 4a^2x^2 + 4abx + 4ac \equiv 0 \text{ (mod $p$)} \\\\ +&\iff 4a^2x^2 + 4abx + 4ac + (b^2 - 4ac) \equiv b^2 - 4ac \text{ (mod $p$)} \\\\ +&\iff 4a^2x^2 + 4abx + b^2 \equiv b^2 - 4ac \text{ (mod $p$)} \\\\ +&\iff (2ax+b)^2 \equiv b^2 - 4ac \text{ (mod $p$)} +\end{align*} + +## Quadratic Congruences Modulo a prime power + +Let $a$ be the solution to $f(x) \equiv 0$ (mod $p$) where $p$ is an odd prime. Consider $b = pt + a$. Then, $f(b) \equiv 0$ (mod $p^2$) if $f^\prime(a)t \equiv -\frac{f(a)}{p}$ (mod $p$). + +In general, let $a$ be the solution to $f(x) \equiv 0$ (mod $p^n$) where $p$ is an odd prime. Consider $b = pt + a$. Then, $f(b) \equiv 0$ (mod $p^{n + 1}$) if $f^\prime(a)t \equiv -\frac{f(a)}{p^n}$ (mod $p$) + diff --git a/content/notes/realanalysis.md b/content/notes/realanalysis.md new file mode 100644 index 0000000..af1c1f5 --- /dev/null +++ b/content/notes/realanalysis.md @@ -0,0 +1,93 @@ +# Real Analysis Sheet + +**Fact:** $\forall a,b, \in \mathbb{R}$, $\sqrt{ab} \le \frac{1}{2}(a + b)$. + +**Bernoulli's Inequality:** If $x > -1$, then $(1 + x)^n \ge 1 + nx$, $\forall n \in \mathbb{N}$. + +**Triangle Inequality:** If $a,b \in \mathbb{R}$, then $|a + b| \le |a| + |b|$. + +**Epsilon Neighborhood Definition:** + +Let $a \in \mathbb{R}$ and $\epsilon > 0$. The $\epsilon$-neighborhood of $a$ is the set $V_\epsilon(a) = \{ x \in \mathbb{R}, |x - a| < \epsilon\}$. + +**Archimedean Property:** If $x \in \mathbb{R}$, then $\exists n_x \in \mathbb{N}$ such that $x \le n_x$. + +**Convergence Definition:** + +$X = (x_n)$ converges to $x \in \mathbb{R}$ if $\forall \epsilon > 0, \exists k \in \mathbb{N}$ such that $\forall n \ge k, |x_n - x| < \epsilon$. + +**Fact:** A sequence in $\mathbb{R}$ can have at most one limit. + +**Theorem 3.1.9:** + +If $(a_n)$ is a sequence in $\mathbb{R}$ such that $a_n \rightarrow 0$, and for some constant $c > 0, m \in \mathbb{N}$, + +$|x_n - x| \le ca_n, \forall n \ge m$, then $x_n \rightarrow x$. + +**Theorem 3.2.7:** + +(a) If $x_n \rightarrow x$, then $|x_n| \rightarrow |x|$. + +(b) If $x_n \rightarrow x$ and $x_n \ge 0$, then $\sqrt{x_n} \rightarrow \sqrt{x}$. + +**Ratio Test:** + +Let $\{x_n\} \subseteq \mathbb{R}^+$ such that $L = \lim{(\frac{x_{n + 1}}{x_n})}$. If $L < 1$, then $x_n \rightarrow 0$. + +**Theorem 3.2.2:** Every convergent sequence is bounded. (The converse is not necessarily true) + +**Squeeze Theorem:** + +If $x_n \rightarrow x, y_n \rightarrow y,$ and $z_n \rightarrow x$ such that $x_n \le y_n \le z_n, \forall n \in \mathbb{N}$ then $y = x$. + +**Monotone Convergence Theorem** + +Let $X = (x_n)$ be a subsequence in $\mathbb{R}$. + +(a) If $X$ is monotonically increasing and bounded above then $\lim{x_n} = sup\{x_n : n \in \mathbb{N}\}$ + +(b) If $X$ is monotonically decreasing and bounded below then $\lim{x_n} = inf\{x_n : n \in \mathbb{N}\}$ + +**Useful Fact:** If $\lim{x_n} = a \in \mathbb{R}$, then $\lim{x_{n + 1}} = a$. + +**Interesting Application of MCT:** + +Let $s_1 > 0$ be arbitrary, and define $s_{n + 1} = \frac{1}{2}(s_n + \frac{a}{s_n})$. We know $s_n \rightarrow \sqrt{a}$. + +**Euler's Number:** Consider the sequence $e_n = (1 + \frac{1}{n})^n$. We know $e_n \rightarrow e$. + +**Theorem 3.4.2:** If $X = (x_n) \subseteq \mathbb{R}$ converges to $x$, then every subsequence converges to $x$. + +**Corollary:** If $X = (x_n) \subseteq \mathbb{R}$ has a subsequence that diverges then $X$ diverges. + +**Monotone Sequence Theorem**: If $X = (x_n) \subseteq \mathbb{R}$, then it contains a monotone subsequence. + +**Bolzano-Weierstrass Theorem:** Every bounded sequence in $\mathbb{R}$ has a convergent subsequence. + +**Theorem 3.4.12:** A bounded $(x_n) \in \mathbb{R}$ is convergent iff $liminf(x_n) = limsup(x_n)$. + +**Cauchy Criteria for Convergence:** Let $X = (x_n) \subseteq \mathbb{R}$. We say that $X$ is cauchy if $\forall \epsilon > 0, \exists N \in \mathbb{N}$ such that $\forall n,m \ge N, |x_n - x_m| < \epsilon$. We know that a sequence converges iff it is cauchy. + +**P-Series:** Series of the form $s_n = \sum_{i = 0}^n{\frac{1}{n^p}}$ is convergent for $p > 1$. + +**Geometric Series:** + +Series of the form $s_n = \sum_{i = 0}^n{ar^i}$ has the following partial sum $a\frac{1 - r^n}{1 - r}$ and converges to $\frac{a}{1 - r}$ if $|r| < 1$. + +**Comparison Test:** + +Let $(x_n), (y_n) \subseteq \mathbb{R}$. Suppose that for some $k \in \mathbb{N}, 0 \le x_n \le y_n,$ for $n \ge k$. + +(a) If $\sum{y_n} < \infty$, then $\sum{x_n} < \infty$. + +(b) If $\sum{x_n} = \infty$, then $\sum{y_n} = \infty$. + +**Limit Comparison Test:** + +Let $(x_n), (y_n)$ be strictly positive sequence of real numbers. Suppose $r = \lim{\frac{x_n}{y_n}}$. + +(a) If $r \ne 0$, then $\sum{x_n} < \infty \iff \sum{y_n} < \infty$. + +(b) If ($r = 0$ and $\sum{y_n} < \infty$), then $\sum{x_n} < \infty$. + + \ No newline at end of file diff --git a/content/notes/reproducibleresearch.md b/content/notes/reproducibleresearch.md new file mode 100644 index 0000000..77e1ea2 --- /dev/null +++ b/content/notes/reproducibleresearch.md @@ -0,0 +1,20 @@ +--- +title: Reproducible Research +showthedate: false +--- + + + +# Reproducible Research + +In the Winter of 2017, I took a coursera course on Reproducible Research taught by Dr. Peng from John Hopkins University + +Below are my notes for each of the four weeks. + +[Week 1](week1) + +[Week 2](week2) + +[Week 3](week3) + +[Week 4](week4) diff --git a/content/notes/reproducibleresearch/week1.md b/content/notes/reproducibleresearch/week1.md new file mode 100644 index 0000000..4db0cc4 --- /dev/null +++ b/content/notes/reproducibleresearch/week1.md @@ -0,0 +1,397 @@ +# Reproducible Research Week 1 + +## Replication + +The ultimate standard for strengthening scientific evidence is replication of finding and conducting studies with independent + +- Investigators +- Data +- Analytical Methods +- Laboratories +- Instruments + +Replication is particularly important in studies that can impact broad policy or regulatory decisions + + + +### What's wrong with replication? + +Some studies cannot be replicated + +- No time, opportunistic +- No money +- Unique + +*Reproducible Research:* Make analytic data and code available so that others may reproduce findings + + + +Reproducibility bridges the gap between replication which is awesome and doing nothing. + + + +## Why do we need reproducible research? + +New technologies increasing data collection throughput; data are more complex and extremely high dimensional + +Existing databases can be merged into new "megadatabases" + +Computing power is greatly increased, allowing more sophisticated analyses + +For every field "X" there is a field "Computational X" + + + +## Research Pipeline + +Measured Data -> Analytic Data -> Computational Results -> Figures/Tables/Numeric Summaries -> Articles -> Text + +Data/Metadata used to develop test should be made publically available + +The computer code and fully specified computational procedures used for development of the candidate omics-based test should be made sustainably available + +"Ideally, the computer code that is released will encompass all of the steps of computational analysis, including all data preprocessing steps. All aspects of the analysis needs to be transparently reported" -- IOM Report + + + +### What do we need for reproducible research? + +- Analytic data are available +- Analytic code are available +- Documentation of code and data +- Standard means of distribution + + + +### Who is the audience for reproducible research? + +Authors: + +- Want to make their research reproducible +- Want tools for reproducible research to make their lives easier (or at least not much harder) + +Readers: + +- Want to reproduce (and perhaps expand upon) interesting findings +- Want tools for reproducible research to make their lives easier. + +### Challenges for reproducible research + +- Authors must undertake considerable effort to put data/results on the web (may not have resources like a web server) +- Readers must download data/results individually and piece together which data go with which code sections, etc. +- Readers may not have the same resources as authors +- Few tools to help authors/readers + +### What happens in reality + +Authors: + +- Just put stuff on the web +- (Infamous for disorganization) Journal supplementary materials +- There are some central databases for various fields (e.g biology, ICPSR) + +Readers: + +- Just download the data and (try to) figure it out +- Piece together the software and run it + +## Literate (Statistical) Programming + +An article is a stream of text and code + +Analysis code is divided into text and code "chunks" + +Each code chunk loads data and computes results + +Presentation code formats results (tables, figures, etc.) + +Article text explains what is going on + +Literate programs can be weaved to produce human-readable documents and tagled to produce machine-readable documents + +Literate programming is a general concept that requires + +1. A documentation language (human readable) +2. A programming language (machine readable) + +Knitr is an R package that brings a variety of documentation languages such as Latex, Markdown, and HTML + +### Quick summary so far + +Reproducible research is important as a minimum standard, particularly for studies that are difficult to replicate + +Infrastructure is needed for creating and distributing reproducible document, beyond what is currently available + +There is a growing number of tools for creating reproducible documents + + + +**Golden Rule of Reproducibility: Script Everything** + +## Steps in a Data Analysis + +1. Define the question +2. Define the ideal data set +3. Determine what data you can access +4. Obtain the data +5. Clean the data +6. Exploratory data analysis +7. Statistical prediction/modeling +8. Interpret results +9. Challenge results +10. Synthesize/write up results +11. Create reproducible code + +"Ask yourselves, what problem have you solved, ever, that was worth solving, where you knew all of the given information in advance? Where you didn't have a surplus of information and have to filter it out, or you had insufficient information and have to go find some?" -- Dan Myer + +Defining a question is the kind of most powerful dimension reduction tool you can ever employ. + +### An Example for #1 + +**Start with a general question** + +Can I automatically detect emails that are SPAM or not? + +**Make it concrete** + +Can I use quantitative characteristics of emails to classify them as SPAM? + +### Define the ideal data set + +The data set may depend on your goal + +- Descriptive goal -- a whole population +- Exploratory goal -- a random sample with many variables measured +- Inferential goal -- The right population, randomly sampled +- Predictive goal -- a training and test data set from the same population +- Causal goal -- data from a randomized study +- Mechanistic goal -- data about all components of the system + +### Determine what data you can access + +Sometimes you can find data free on the web + +Other times you may need to buy the data + +Be sure to respect the terms of use + +If the data don't exist, you may need to generate it yourself. + +### Obtain the data + +Try to obtain the raw data + +Be sure to reference the source + +Polite emails go a long way + +If you load the data from an Internet source, record the URL and time accessed + +### Clean the data + +Raw data often needs to be processed + +If it is pre-processed, make sure you understand how + +Understand the source of the data (census, sample, convenience sample, etc) + +May need reformatting, subsampling -- record these steps + +**Determine if the data are good enough** -- If not, quit or change data + +### Exploratory Data Analysis + +Look at summaries of the data + +Check for missing data + +-> Why is there missing data? + +Look for outliers + +Create exploratory plots + +Perform exploratory analyses such as clustering + +If it's hard to see your plots since it's all bunched up, consider taking the log base 10 of an axis + +`plot(log10(trainSpan$capitalAve + 1) ~ trainSpam$type)` + +### Statistical prediction/modeling + +Should be informed by the results of your exploratory analysis + +Exact methods depend on the question of interest + +Transformations/processing should be accounted for when necessary + +Measures of uncertainty should be reported. + +### Interpret Results + +Use the appropriate language + +- Describes +- Correlates with/associated with +- Leads to/Causes +- Predicts + +Gives an explanation + +Interpret Coefficients + +Interpret measures of uncertainty + +### Challenge Results + +Challenge all steps: + +- Question +- Data Source +- Processing +- Analysis +- Conclusions + +Challenge measures of uncertainty + +Challenge choices of terms to include in models + +Think of potential alternative analyses + +### Synthesize/Write-up Results + +Lead with the question + +Summarize the analyses into the story + +Don't include every analysis, include it + +- If it is needed for the story +- If it is needed to address a challenge +- Order analyses according to the story, rather than chronologically +- Include "pretty" figures that contribute to the story + +### In the lecture example... + +Lead with the question + +​ Can I use quantitative characteristics of the emails to classify them as SPAM? + +Describe the approach + +​ Collected data from UCI -> created training/test sets + +​ Explored Relationships + +​ Choose logistic model on training set by cross validation + +​ Applied to test, 78% test set accuracy + +Interpret results + +​ Number of dollar signs seem reasonable, e.g. "Make more money with Viagra $ $ $ $" + +Challenge Results + +​ 78% isn't that great + +​ Could use more variables + +​ Why use logistic regression? + + + +## Data Analysis Files + +Data + +- Raw Data +- Processed Data + +Figures + +- Exploratory Figures +- Final Figures + +R Code + +- Raw/Unused Scripts +- Final Scripts +- R Markdown Files + +Text + +- README files +- Text of Analysis/Report + +### Raw Data + +Should be stored in the analysis folder + +If accessed from the web, include URL, description, and date accessed in README + +### Processed Data + +Processed data should be named so it is easy to see which script generated the data + +The processing script -- processed data mapping should occur in the README + +Processed data should be tidy + +### Exploratory Figures + +Figures made during the course of your analysis, not necessarily part of your final report + +They do not need to be "pretty" + +### Final Figures + +Usually a small subset of the original figures + +Axes/Colors set to make the figure clear + +Possibly multiple panels + +### Raw Scripts + +May be less commented (but comments help you!) + +May be multiple versions + +May include analyses that are later discarded + +### Final Scripts + +Clearly commented + +- Small comments liberally - what, when, why, how + +- Bigger commented blocks for whole sections + +Include processing details + +Only analyses that appear in the final write-up + +### R Markdown Files + +R Markdown files can be used to generate reproducible reports + +Text and R code are integrated + +Very easy to create in RStudio + +### Readme Files + +Not necessary if you use R Markdown + +Should contain step-by-step instructions for analysis + +### Text of the document + +It should contain a title, introduction (motivation), methods (statistics you used), results (including measures of uncertainty), and conclusions (including potential problems) + +It should tell a story + +It should not include every analysis you performed + +References should be included for statistical methods \ No newline at end of file diff --git a/content/notes/reproducibleresearch/week2.md b/content/notes/reproducibleresearch/week2.md new file mode 100644 index 0000000..49779f6 --- /dev/null +++ b/content/notes/reproducibleresearch/week2.md @@ -0,0 +1,227 @@ +## Coding Standards for R + +1. Always use text files/text editor +2. Indent your code +3. Limit the width of your code (80 columns?) +4. Author suggests indentation of 4 spaces at minimum +5. Limit the length of individual functions + +## What is Markdown? + +Markdown is a text-to-HTML conversion tool for web writers. Markdown allows you to write using an easy-to-read, easy-to-write plain text format, then convert it structurally to valid XHTML/HTML + +## Markdown Syntax + +`*This text will appear italicized!*` + +*This text will appear italicized!* + +`**This text will appear bold!**` + +**This text will appear bold** + +`## This is a secondary heading` + +`###This is a tertiary heading ` + +## This is a secondary heading + +### This is a tertiary heading + +Unordered Lists + +`- first item in list` + +`- second item in list` + +- first item in list +- second item in list + +Ordered lists + +`1. first item in list` + +`2. second item in list` + +`3. third item in list` + +1. first item in list +2. second item in list +3. third item in list + +Create links + +`[Download R](http://www.r-project.org/)` + +[Download R](http://www.r-project.org/) + +Advanced linking + +`I spent so much time reading [R bloggers][1] and [Simply Statistics][2]!` + +`[1]: http://www.r-bloggers.com/ "R bloggers"` + +`[2]: http://simplystatistics.org/ "Simply Statistics"` + +I spent so much time reading [R bloggers][1] and [Simply Statistics][2]! + +[1]: http://www.r-bloggers.com/ "R bloggers" + +[2]: http://simplystatistics.org/ "Simply Statistics" + +Newlines require a double space after the end of a line + +## What is Markdown? + +Created by John Gruber and Aaron Swartz. It is a simplified version of "markup" languages. It allows one to focus on writing as opposed to formatting. Markdown provides a simple, minimal, and intuitive way of formatting elements. + +You can easily convert Markdown to valid HTML (and other formats) using existing tools. + +## What is R Markdown? + +R Markdown is the integration of R code with markdown. It allows one to create documents containing "live" R code. R code is evaluated as part of the processing of the markdown and its results are inserted into the Markdown document. R Markdown is a core tool in **literate statistical programming** + +R Markdown can be converted to standard markdown using `knitr` package in R. Markdown can then be converted to HTML using the `markdown` package in R. This workflow can be easily managed using R Studio. One can create powerpoint like slides using the `slidify` package. + +## Problems, Problems + +- Authors must undertake considerable effort to put data/results on the web +- Readers must download data/results individually and piece together which data go with which code sections, etc. +- Authors/readers must manually interact with websites +- There is no single documents to integrate data analysis with textual representations; i.e data, code, and text are not linked + +One of the ways to resolve this is to simply put the data and code together in the same document so that people can execute the code in the right order, and the data are read at the right times. You can have a single document that integrates the data analysis with all the textual representations. + +## Literate Statistical Programming + +- Original idea comes from Don Knuth +- An article is a stream of **text** and **code** +- Analysis code is divded into text and code "chunks" +- Presentation code formats results (tables, figures, etc.) +- Article text explains what is going on +- Literate programs are weaved to produce human-readable documents and tangled to produce machine-readable documents. + +## Literate Statistical Programming + +- Literate programming is a general concept. We need + - A documentation language + - A programming language +- `knitr` supports a variety of documentation languages + +## How Do I Make My Work Reproducible? + +- Decide to do it (ideally from the start) +- Keep track of everything, hopefully through a version control system +- Use software in which operations can be coded +- Don't save output +- Save data in non-proprietary formats + +## Literate Programming: Pros + +- Text and code all in one place, logical order +- Data, results automatically updated to reflect external changes +- Code is live -- automatic "regression test" when building a document + +## Literate Programming: Cons + +- Text and code are all in one place; can make documents difficult to read, especially if there is a lot of code +- Can substantially slow down processing of documents (although there are tools to help) + +## What is Knitr Good For? + +- Manuals +- Short/Medium-Length technical documents +- Tutorials +- Reports (Especially if generated periodically) +- Data Preprocessing documents/summaries + +## What is knitr NOT good for? + +- Very long research articles +- Complex time-consuming computations +- Documents that require precise formatting + +## Non-GUI Way of Creating R Markdown documents + +```R +library(knitr) +setwd() +knit2html('document.Rmd') +browseURL('document.html') +``` + +## A few notes about knitr + +- knitr will fill a new document with filler text; delete it + +- Code chunks begin with ` ```{r}` and ends with ` ``` ` + +- All R code goes in between these markers + +- Code chunks can have names, which is useful when we start making graphics + + ` ```{r firstchunk}` + + `## R code goes here` + + ` ``` ` + +- By default, code in a code chunk is echoed, as will the results of the computation (if there are results to print) + +## Processing of knitr documents + +- You write RMarkdown document (.Rmd) +- knitr produces a Markdown document (.md) +- knitr converts the Markdown document into HTML (by default) +- .Rmd -> .md -> .html +- You should NOT edit (or save) the .md or .html documents until you are finished + +## Inline Text Computations + +You can reference variable in RMarkdown through the following + +``` +`The current time is `r time`. My favorite random number is `r rand` +``` + +## Setting Global Options + +- Sometimes we want to set options for every code chunk that are different from the defaults +- For example, we may want to suppress all code echoing and results output +- We have to write some code to set these global options + +Example for suppressing all code chunks + +```R +​```{r setoptions, echo=FALSE} +opts_chunk$set(echo=False, results = "hide") +​``` +``` + +## Some Common Options + +- Output + - Results: "axis", "hide" + - echo: TRUE, FALSE +- Figures + - fig.height: numeric + - fig.width: numeric + +## Caching Computations + +- What if one chunk takes a long time to run? +- All chunks have to be re-computed every time you re-knit the file +- The `cache=TRUE` option can be set on a chunk-by-chunk basis to store results of computation +- After the first run, results are loaded from cache + +## Caching Caveats + +- If the data or code (or anything external) changes, you need to re-run the cache code chunks +- Dependencies are not checked explicitly!!!! +- Chunks with significant *side effects* may not be cacheable + +## Summary of knitr + +- Literate statistical programming can be a useful way to put text, code, data, output all in one document +- knitr is a powerful tool for iterating code and text in a simple document format + diff --git a/content/notes/reproducibleresearch/week3.md b/content/notes/reproducibleresearch/week3.md new file mode 100644 index 0000000..1a92f30 --- /dev/null +++ b/content/notes/reproducibleresearch/week3.md @@ -0,0 +1,308 @@ +## tl;dr + +People are busy, especially managers and leaders. Results of data analyses are sometimes presented in oral form, but often the first cut is presented via email. + +It is often useful therefore, to breakdown the results of an analysis into different levels of granularity/detail + +## Hierarchy of Information: Research Paper + +- Title / Author List + - Speaks about what the paper is about + - Hopefully interesting + - No detail +- Abstract + - Motivation of the problem + - Bottom Line Results +- Body / Results + - Methods + - More detailed results + - Sensitivity Analysis + - Implication of Results +- Supplementary Materials / Gory Details + - Details on what was done +- Code / Data / Really Gory Details + - For reproducibility + + + +## Hierarchy of Information: Email Presentation + +- Subject Line / Subject Info + - At a minimum: include one + - Can you summarize findings in one sentence? +- Email Body + - A brief description of the problem / context: recall what was proposed and executed; summarize findings / results. (Total of 1-2 paragraphs) + - If action is needed to be taken as a result of this presentation, suggest some options and make them as concrete as possible + - If questions need to be addressed, try to make them yes / no +- Attachment(s) + - R Markdown file + - knitr report + - Stay Concise: Don't spit out pages of code +- Links to Supplementary Materials + - Code / Software / Data + - Github Repository / Project Website + + + +## DO: Start with Good Science + +- Remember: Garbage, in, garbage out +- Find a coherent focused question. This helps solve many problems +- Working with good collaborators reinforces good practices +- Something that's interesting to you will hopefully motivate good habits + +## DON'T: Do Things By Hand + +- Editing spreadsheets of data to "clean it up" + - Removing outliers + - QA / QC + - Validating +- Editing tables or figures (e.g rounding, formatting) +- Downloading data from a website +- Moving data around your computer, splitting, or reformatting files. + +Things done by hand need to precisely documented (this is harder than it sounds!) + +## DON'T: Point and Click + +- Many data processing / statistical analysis packages have graphical user interfaces (GUIs) +- GUIs are convenient / intuitive but the actions you take with a GUI can be difficult for others to reproduce +- Some GUIs produce a log file or script which includes equivalent commands; these can be saved for later examination +- In general, be careful with data analysis software that is highly interactive; ease of use can sometimes lead to non-reproducible analyses. +- Other interactive software, such as text editors, are usually fine. + + +## DO: Teach a Computer + +If something needs to be done as part of your analysis / investigation, try to teach your computer to do it (even if you only need to do it once) + +In order to give your computer instructions, you need to write down exactly what you mean to do and how it should be done. Teaching a computer almost guarantees reproducibility + +For example, by, hand you can + + 1. Go to the UCI Machine Learning Repository at http://archive.ics.uci.edu/mil/ + 2. Download the Bike Sharing Dataset + +Or you can teach your computer to do it using R + +```R +download.file("http://archive.ics.uci.edu/ml/machine-learning-databases/00275/Bike-Sharing-Dataset.zip", "ProjectData/Bike-Sharing-Dataset.zip") +``` + +Notice here that: + +- The full URL to the dataset file is specified +- The name of the file saved to your local computer is specified +- The directory to which the filed was saved is specified ("ProjectData") +- Code can always be executed in R (as long as link is available) + +## DO: Use Some Version Control + +It helps you slow things down by adding changes into small chunks. (Don't just do one massive commit). It allows one to track / tag snapshots so that one can revert back to older versions of the project. Software like Github / Bitbucket / SourceForge make it easy to publish results. + + + +## DO: Keep Track of Your Software Environment + +If you work on a complex project involving many tools / datasets, the software and computing environment can be critical for reproducing your analysis. + +**Computer Architecture**: CPU (Intel, AMD, ARM), CPU Architecture, GPUs + +**Operating System**: Windows, Mac OS, Linux / Unix + +**Software Toolchain**: Compilers, interpreters, command shell, programming language (C, Perl, Python, etc.), database backends, data analysis software + +**Supporting software / infrastructure**: Libraries, R packages, dependencies + +**External dependencies**: Websites, data repositories, remote databases, software repositories + +**Version Numbers:** Ideally, for everything (if available) + +This function in R helps report a bunch of information relating to the software environment + +```R +sessionInfo() +``` + +## DON'T: Save Output + +Avoid saving data analysis output (tables, figures, summaries, processed data, etc.), except perhaps temporarily for efficiency purposes. + +If a stray output file cannot be easily connected with the means by which it was created, then it is not reproducible + +Save the data + code that generated the output, rather than the output itself. + +Intermediate files are okay as long as there is clear documentation of how they were created. + +## DO: Set Your Seed + +Random number generators generate pseudo-random numbers based on an initial seed (usually a number or set of numbers) + +​ In R, you can use the `set.seed()` function to set the seed and to specify the random number generator to use + +Setting the seed allows for the stream of random numbers to be exactly reproducible + +Whenever you generate random numbers for a non-trivial purpose, **always set the seed**. + +## DO: Think About the Entire Pipeline + +- Data analysis is a lengthy process; it is not just tables / figures/ reports +- Raw data -> processed data -> analysis -> report +- How you got the end is just as important as the end itself +- The more of the data analysis pipeline you can make reproducible, the better for everyone + +## Summary: Checklist + +- Are we doing good science? + - Is this interesting or worth doing? +- Was any part of this analysis done by hand? + - If so, are those parts precisely documented? + - Does the documentation match reality? +- Have we taught a computer to do as much as possible (i.e. coded)? +- Are we using a version control system? +- Have we documented our software environment? +- Have we saved any output that we cannot reconstruct from original data + code? +- How far back in the analysis pipeline can we go before our results are no longer (automatically reproducible) + + +## Replication and Reproducibility + +Replication + +- Focuses on the validity of the scientific claim +- Is this claim true? +- The ultimate standard for strengtening scientiffic evidence +- New investigators, data, analytical methods, laboratories, instruments, etc. +- Particularly important in studies that can impact broad policy or regulatory decisions. + +Reproducibility + +- Focuses on the validity of the data analysis +- Can we trust this analysis? +- Arguably a minimum standard for any scientific study +- New investigators, same data, same methods +- Important when replication is impossible + +## Background and Underlying Trends + +- Some studies cannot be replicated: No time, no money, or just plain unique / opportunistic +- Technology is increasing data collection throughput; data are more complex and high-dimensional +- Existing databases can be merged to become bigger databases (but data are used off-label) +- Computing power allows more sophisticated analyses, even on "small" data +- For every field "X", there is a "Computational X" + +## The Result? + +- Even basic analyses are difficult to describe +- Heavy computational requirements are thrust upon people without adequate training in statistics and computing +- Errors are more easily introduced into long analysis pipelines +- Knowledge transfer is inhibited +- Results are difficult to replicate or reproduce +- Complicated analyses cannot be trusted + +## What Problem Does Reproducibility Solve? + +What we get: + +- Transparency +- Data Availability +- Software / Methods of Availability +- Improved Transfer of Knowledge + +What we do NOT get + +- Validity / Correctness of the analysis + +An analysis can be reproducible and still be wrong + +We want to know 'can we trust this analysis + +Does requiring reproducibility deter bad analysis? + +## Problems with Reproducibility + +The premise of reproducible research is that with data/code available, people can check each other and the whole system is self-correcting + +- Addresses the most "downstream" aspect of the research process -- Post-publication +- Assumes everyone plays by the same rules and wants to achieve the same goals (i.e. scientific discovery) + +## Who Reproduces Research? + +- For reproducibility to be effective as a means to check validity, someone needs to do something + - Re-run the analysis; check results match + - Check the code for bugs/errors + - Try alternate approaches; check sensitivity +- The need for someone to do something is inherited from traditional notion of replication +- Who is "someone" and what are their goals? + +## The Story So Far + +- Reproducibility brings transparency (wrt code+data) and increased transfer of knowledge +- A lot of discussion about how to get people to share data +- Key question of "can we trust this analysis"? is not addressed by reproducibility +- Reproducibility addresses potential problems long after they've occurred ("downstream") +- Secondary analyses are inevitably colored by the interests/motivations of others. + +## Evidence-based Data Analysis + +- Most data analyses involve stringing together many different tools and methods +- Some methods may be standard for a given field, but others are often applied ad hoc +- We should apply throughly studied (via statistical research), mutually agreed upon methods to analyze data whenever possible +- There should be evidence to justify the application of a given method + +## Evidence-based Data Analysis + +- Create analytic pipelines from evidence-based components - standardize it +- A deterministic statistical machine +- Once an evidence-based analytic pipeline is established, we shouldn't mess with it +- Analysis with a "transparent box" +- Reduce the "research degrees of freedom" +- Analogous to a pre-specified clinical trial protocol + +## Case Study: Estimating Acute Effects of Ambient Air Pollution Exposure + +- Acute / Short-term effects typically estimated via panel studies or time series studies +- Work originated in late 1970s early 1980s +- Key question "Are short-term changes in pollution associated with short-term changes in a population health outcome?" +- Studies are usually conducted at a community level +- Long history of statistical research investigating proper methods of analysis + +## Case Study: Estimating Acute Effects of Ambient Air Pollution Exposure + +- Can we encode everything that we have found in statistical / epidemiological research into a single package? +- Time series studies do not have a huge range of variation; typically involves similar types of data and similar questions +- We can create a deterministic statistical machine for this area? + +## DSM Modules for Time Series Studies of Air Pollution and Health + +1. Check for outliers, high leverage, overdispersion +2. Fill in missing data? No! +3. Model selection: Estimate degrees of freedom to adjust for unmeasured confounders + - Other aspects of model not as critical +4. Multiple lag analysis +5. Sensitivity analysis wrt + - Unmeasured confounder adjustment + - Influential points + +## Where to Go From Here? + +- One DSM is not enough, we need many! +- Different problems warrant different approaches and expertise +- A curated library of machines providing state-of-the-art analysis pipelines +- A CRAN/CPAN/CTAN/... for data analysis +- Or a "Cochrane Collaboration" for data analysis + +## A Curated Library of Data Analysis + +- Provide packages that encode data analysis pipelines for given problems, technologies, questions +- Curated by experts knowledgeable in the field +- Documentation / References given supporting module in the pipeline +- Changes introduced after passing relevant benchmarks/unit tests + +## Summary + +- Reproducible research is important, but does not necessarily solve the critical question of whether a data analysis is trustworthy +- Reproducible research focuses on the most "downstream" aspect of research documentation +- Evidence-based data analysis would provide standardized best practices for given scientific areas and questions +- Gives reviewers an important tool without dramatically increases the burden on them +- More effort should be put into improving the quality of "upstream" aspects of scientific research \ No newline at end of file diff --git a/content/notes/reproducibleresearch/week4.md b/content/notes/reproducibleresearch/week4.md new file mode 100644 index 0000000..1ce5fad --- /dev/null +++ b/content/notes/reproducibleresearch/week4.md @@ -0,0 +1,158 @@ +## The `cacher` Package for R + +- Add-on package for R +- Evaluates code written in files and stores immediate results in a key-value database +- R expressions are given SHA-1 hash values so that changes can be tracked and code reevaluated if necessary +- "Chacher packages" can be built for distribution +- Others can "clone" an analysis and evaluate subsets of code or inspect data objects + +The value of this is so other people can get the analysis or clone the analysis and look at subsets of the code. Or maybe more specifically data objects. People who want to run your code may not necessarily have the resources that you have. Because of that, they may not want to run the entire Markov chain Monte Carlo simulation that you did to get the posterior distribution or the histogram that you got at the end. + +But the idea is that you peel the onion a little bit rather than just go straight to the core. + +## Using `cacher` as an Author + +1. Parse the R source file; Create the necessary cache directiories and subdirectories +2. Cycle through each expression in the source file + - If an expression has never been evaluated, evaluate it and store any resulting R objects in the cache database + - If any cached results exists, lazy-load the results from the cache database and move to the next expression + - If an expression does not create any R objects (i.e, there is nothing to cache), add the expression to the list of expressions where evaluation needs to be forced + - Write out metadata for this expression to the metadata file + +- The `cachepackage` function creates a `cacher` package storing + - Source File + - Cached data objects + - Metadata +- Package file is zipped and can be distributed +- Readers can unzip the file and immediately investigate its contents via `cacher` package + +## Using `cacher` as a Reader + +A journal article says + +​ "... the code and data for this analysis can be found in the cacher package 092dcc7dda4b93e42f23e038a60e1d44dbec7b3f" + +```R +library(cacher) +clonecache(id = "092dcc7dda4b93e42f23e038a60e1d44dbec7b3f") +clonecache(id = "092d") ## Same as above +# Created cache directory `.cache` +showfiles() +# [1] "top20.R" +sourcefile("top20.R") +``` + +## Cloning an Analysis + +- Local directories are created +- Source code files and metadata are downloaded +- Data objects are *not* downloaded by default (may be really large) +- References to data objects are loaded and corresponding data can be lazy-loaded on demand + +`graphcode()` gives a node graph representing the code + +## Running Code + +- The `runcode` function executes code in the source file +- By default, expressions that results in an object being created are not run and the resulting objects is lazy-loaded into the workspace +- Expressions not resulting in objects are evaluated + +## Checking Code and Objects + +- The `checkcode` function evaluates all expressions from scratch (no lazy-loading) +- Results of evaluation are checked against stored results to see if the results are the same as what the author calculated + - Setting RNG seeds is critical for this to work +- The integrity of data objects can be verified with the `checkobjects` function to check for possible corruption of data perhaps during transit. + +You can inspect data objects with `loadcache`. This loads in pointers to each of the data objects into the workspace. Once you access the object, it will transfer it from the cache. + +## `cacher` Summary + +- The `cacher` package can be used by authors to create cache packages from data analyses for distribution +- Readers can use the `cacher` package to inspect others' data analyses by examing cached computations +- `cacher` is mindful of readers' resources and efficiently loads only those data objects that are needed. + +# Case Study: Air Pollution + +Particulate Matter -- PM + +When doing air pollution studies you're looking at particulate matter pollution. The dust is not just one monolithic piece of dirt or soot but it's actually composed of many different chemical constituents. + +Metals inert things like salts and other kinds of components so there's a possibility that a subset of those constituents are really harmful elements. + +PM is composed of many different chemical constituents and it's important to understand that the Environmental Protection Agency (EPA) monitors the chemical constituents of particulate matter and has been doing so since 1999 or 2000 on a national basis. + +## What causes PM to be Toxic? + +- PM is composed of many different chemical elements +- Some components of PM may be more harmful than others +- Some sources of PM may be more dangerous than others +- Identifying harmful chemical constituents may lead us to strategies for controlling sources of PM + +## NMMAPS + +- The National Morbidity, Mortality, and Air Pollution Study (NMMAPS) was a national study of the short-term health effects of ambient air pollution + +- Focused primarily on particulate matter ($PM_{10}$) and Ozone ($O_3$) + +- Health outcomes include mortality from all causes and hospitalizations for cardiovascular and respiratory diseases + +- Key publications + + - http://www.ncbi.nlm.nih.gov/pubmed/11098531 + - http://www.ncbi.nlm.nih.gov/pubmed/11354823 + +- Funded by the Heath Effects Institute + + - Roger Peng currently serves on the Health Effects Institute Health Review Committee + + ​ + +## NMMAPS and Reproducibility + +- Data made available at the Internet-based Health and Air Pollution Surveillance System (http://www.ihapss.jhsph.edu) +- Research and software also available at iHAPSS +- Many studies (over 67 published) have been conducted based on the public data http://www.ncbi.nlm.nih.gov/pubmed/22475833 +- Has served as an important test bed for methodological development + +## What Causes Particulate Matter to be Toxic? + +http://www.ncbi.nlm.nih.gov/pmc/articles/PMC1665439 + +- Lippmann et al. found strong evidence that NI modified the short-term effect of $PM_{10}$ across 60 US communities +- No other PM chemical constituent seemed to have the same modifying effect +- To simple to be true? + +## A Reanalysis of the Lippmann et al. Study + +http://www.ncbi.nlm.nih.gov/pmc/articles/PMC2137127 + +- Rexamine the data from NMMAPS and link with PM chemical constituent data +- Are the findings sensitive for levels of Nickel in New York City? + +## Does Nickel Make PM Toxic? + +- Long-term average nickel concentrations appear correlated with PM risk +- There appear to be some outliers on the right-hand side (New York City) + +## Does Nickel Make PM Toxic? + +One of the most important things about those three points to the right is those are called high leverage points. So the regression line can be very senstive to high leverage points. Removing those three points from the dataset brings the regression line's slope down a little bit. Which then produces a line that is no longer statistical significant (p-value about 0.31) + +## What Have We Learned? + +- New York does have very high levels of nickel and vanadium, much higher than any other US community +- There is evidence of a positive relationship between NI concentrations and $PM_{10}$ risk +- The strength of this relationship is highly sensitive to the observations from New York City +- Most of the information in the data is derived from just 3 observations + +## Lessons Learned + +- Reproducibility of NMMAPS allowed for a secondary analysis (and linking with PM chemical constituent data) investigating a novel hypothesis (Lippmann et al.) +- Reproducibility also allowed for a critique of that new analysis and some additional new analysis (Dominici et al.) +- Original hypothesis not necessarily invalidated, but evidence not as strong as originally suggested (more work should be done) +- Reproducibility allows for the scientific discussion to occur in a timely and informed manner +- This is how science works. + + + diff --git a/content/notes/stat381.md b/content/notes/stat381.md new file mode 100644 index 0000000..146b80f --- /dev/null +++ b/content/notes/stat381.md @@ -0,0 +1,20 @@ +--- +title: Probability and Statistical Inference +showthedate: false +--- + + + +# Probability and Statistical Inference + +In the Fall of 2017, I took the course STAT 381 with Dr. Debra Hydorn. Below I included the interesting labs we worked on in the class. + +*Please note that these reports were not formatted for this site. So equations and images may not show up.* + +[Random Walk](randomwalk) + +[Random Number Generation](randomnumber) + +[Central Limit Theorum](centrallimit) + +[Confidence Interval](confint) diff --git a/content/notes/stat381/centrallimit.md b/content/notes/stat381/centrallimit.md new file mode 100644 index 0000000..440b2c8 --- /dev/null +++ b/content/notes/stat381/centrallimit.md @@ -0,0 +1,407 @@ +# Central Limit Theorem Lab + +**Brandon Rozek** + +## Introduction + +The Central Limit Theorem tells us that if the sample size is large, then the distribution of sample means approach the Normal Distribution. For distributions that are more skewed, a larger sample size is needed, since that lowers the impact of extreme values on the sample mean. + +### Skewness + +Skewness can be determined by the following formula +$$ +Sk = E((\frac{X - \mu}{\sigma})^3) = \frac{E((X - \mu)^3)}{\sigma^3} +$$ +Uniform distributions have a skewness of zero. Poisson distributions however have a skewness of $\lambda^{-\frac{1}{2}}$. + +In this lab, we are interested in the sample size needed to obtain a distribution of sample means that is approximately normal. + +### Shapiro-Wilk Test + +In this lab, we will test for normality using the Shapiro-Wilk test. The null hypothesis of this test is that the data is normally distributed. The alternative hypothesis is that the data is not normally distributed. This test is known to favor the alternative hypothesis for a large number of sample means. To circumvent this, we will test normality starting with a small sample size $n$ and steadily increase it until we obtain a distribution of sample means that has a p-value greater than 0.05 in the Shapiro-Wilk test. + +This tells us that with a false positive rate of 5%, there is no evidence to suggest that the distribution of sample means don't follow the normal distribution. + +We will use this test to look at the distribution of sample means of both the Uniform and Poisson distribution in this lab. + +### Properties of the distribution of sample means + +The Uniform distribution has a mean of $0.5$ and a standard deviation of $\frac{1}{\sqrt{12n}}$ and the Poisson distribution has a mean of $\lambda$ and a standard deviation of $\sqrt{\frac{\lambda}{n}}$. + +## Methods + +For the first part of the lab, we will sample means from a Uniform distribution and a Poisson distribution of $\lambda = 1$ both with a sample size $n = 5$. + +Doing so shows us how the Uniform distribution is roughly symmetric while the Poisson distribution is highly skewed. This begs the question: what sample size $(n)$ do I need for the Poisson distribution to be approximately normal? + +### Sampling the means + +The maximum number of mean observations that the Shapiro-Wilk test allows is 5000 observations. Therefore, we will obtain `n` observations separately from both the Uniform or Poisson distribution and calculate the mean from it. Repeating that process 5000 times. + +The mean can be calculated from the following way +$$ +Mean = \frac{\sum x_i}{n} +$$ +Where $x_i$ is the observation obtained from the Uniform or Poisson distribution + +### Iterating with the Shapiro-Wilk Test + +Having a sample size of a certain amount doesn't always guarantee that it will fail to reject the Shapiro-Wilk test. Therefore, it is useful to run the test multiple times so that we can create a 95th percentile of sample sizes that fails to reject the Shapiro-Wilk test. + +The issue with this is that lower lambda values result in higher skewness's. Which is described by the skewness formula. If a distribution has a high degree of skewness, then it will take a larger sample size n to make the sample mean distribution approximately normal. + +Finding large values of n result in longer computational time. Therefore, the code takes this into account by starting at a larger value of n and/or incrementing by a larger value of n each iteration. Incrementing by a larger value of n decreases the precision, though that is the compromise I'm willing to take in order to achieve faster results. + +Finding just the first value of $n$ that generates the sample means that fails to reject the Shapiro-Wilk test doesn't tell us much in terms of the sample size needed for the distribution of sample means to be approximately normal. Instead, it is better to run this process many times, finding the values of n that satisfy this condition multiple times. That way we can look at the distribution of sample sizes required and return back the 95th percentile. + +Returning the 95th percentile tells us that 95% of the time, it was the sample size returned or lower that first failed to reject the Shapiro-Wilk test. One must be careful, because it can be wrongly interpreted as the sample size needed to fail to reject the Shapiro-Wilk test 95% of the time. Using that logic requires additional mathematics outside the scope of this paper. Returning the 95th percentile of the first sample size that failed to reject the Shapiro-Wilk test, however, will give us a good enough estimate for a sample size needed. + +### Plots + +Once a value for `n ` is determined, we sample the means of the particular distribution (Uniform/Poisson) and create histograms and Q-Q plots for each of the parameters we're interested in. We're looking to verify that the histogram looks symmetric and that the points on the Q-Q Plot fit closely to the Q-Q Line with one end of the scattering of points on the opposite side of the line as the other. + + + +## Results + +### Part I + +Sampling the mean of the uniform distribution with $n = 5$ results in a mean of $\bar{x} = 0.498$ and standard deviation of $sd = 0.1288$. The histogram and Q-Q Plot can be seen in Figure I and Figure II respectively. + +$\bar{x}$ isn't far from the theoretical 0.5 and the standard deviation is also close to +$$ +\frac{1}{\sqrt{12(5)}} \approx 0.129 +$$ +Looking at the histogram and Q-Q plot, it suggests that data is approximately normal. Therefore we can conclude that a sample size of 5 is sufficient for the sample mean distribution coming from the normal distribution to be approximately normal. + +Sampling the mean of the Poisson distribution with $n = 5$ and $\lambda = 1$ results in a mean of $\bar{x} = 0.9918$ and a standard deviation of $sd = 0.443$. The histogram and Q-Q Plot can be seen in Figures III and IV respectively. + +$\bar{x}$ is not too far from the theoretical $\lambda = 1$, the standard deviation is a bit farther from the theoretical +$$ +\sqrt{\frac{\lambda}{n}} = \sqrt{\frac{1}{5}} = 0.447 +$$ +Looking at the Figures, however, shows us that the data does not appear normal. Therefore, we cannot conclude that 5 is a big enough sample size for the Poisson Distribution of $\lambda = 1$ to be approximately normal. + +### Part II + +Running the algorithm I described, I produced the following table + +| $\lambda$ | Skewness | Sample Size Needed | Shapiro-Wilk P-Value | Average of Sample Means | Standard Deviation of Sample Means | Theoretical Standard Deviation of Sample Means | +| --------- | -------- | ------------------ | -------------------- | ----------------------- | ---------------------------------- | ---------------------------------------- | +| 0.1 | 3.16228 | 2710 | 0.05778 | 0.099 | 0.0060 | 0.0061 | +| 0.5 | 1.41421 | 802 | 0.16840 | 0.499 | 0.0250 | 0.0249 | +| 1 | 1.00000 | 215 | 0.06479 | 1.000 | 0.0675 | 0.0682 | +| 5 | 0.44721 | 53 | 0.12550 | 4.997 | 0.3060 | 0.3071 | +| 10 | 0.31622 | 31 | 0.14120 | 9.999 | 0.5617 | 0.5679 | +| 50 | 0.14142 | 10 | 0.48440 | 50.03 | 2.2461 | 2.2361 | +| 100 | 0.10000 | 6 | 0.47230 | 100.0027 | 4.1245 | 4.0824 | + +The skewness was derived from the formula in the first section while the sample size was obtained by looking at the .95 blue quantile line in Figures XVIII-XIV. The rest of the columns are obtained from the output of the R Code function `show_results`. + +Looking at the histograms and Q-Q Plots produced by the algorithm, the distribution of sample means distributions are all roughly symmetric. The sample means are also tightly clustered around the Q-Q line, showing that the normal distribution is a good fit. This allows us to be confident that using these values of `n` as the sample size would result in the distribution of sample means of Uniform or Poisson (with a given lambda) to be approximately normal. + +All the values of the average sampling means are within 0.001 of the theoretical average of sample means. The standard deviation of sample means slightly increase as the value of $\lambda$ increases, but it still is quite low. + +## Conclusion + +The table in the results section clearly show that as the skewness increases, so does the sample size needed to make the distribution of sample means approximately normal. This shows the central limit theorem in action in that no matter the skewness, if you obtain a large enough sample, the distribution of sample means will be approximately normal. + +These conclusions pave the way for more interesting applications such as hypothesis testing and confidence intervals. + +## Appendix + +### Figures + +#### Figure I, Histogram of Sample Means coming from a Uniform Distribution with sample size of 5 + +![part1histunif](/home/rozek/Pictures/stat381lab3/part1histunif.png) + +#### Figure II, Q-Q Plot of Sample Means coming from a Uniform Distribution with sample size of 5 + +![part1qunif](/home/rozek/Pictures/stat381lab3/part1qunif.png) + +#### Figure III, Histogram of Sample Means coming from a Poisson Distribution with $\lambda = 1$ and sample size of 5 + +![part1histpoisson](/home/rozek/Pictures/stat381lab3/part1histpoisson.png) + +#### Figure IV, Q-Q Plot of Sample Means coming from Poisson Distribution with $\lambda = 1$ and sample size of 5 + +![part1qpoisson](/home/rozek/Pictures/stat381lab3/part1qpoisson.png) + +#### Figure V, Histogram of Sample Means coming from Poisson Distribution with $\lambda = 0.1$ and sample size of 2710 + +![histpoisson01](/home/rozek/Pictures/stat381lab3/histpoisson01.png) + +#### Figure VI, Q-Q Plot of Sample Means coming from Poisson Distribution with $\lambda = 0.1$ and sample size of 2710 + +![qpoisson01](/home/rozek/Pictures/stat381lab3/qpoisson01.png) + +#### Figure VII, Histogram of Sample Means coming from Poisson Distribution with $\lambda = 0.5$ and sample size of 516 + +![histpoisson05](/home/rozek/Pictures/stat381lab3/histpoisson05.png) + +#### Figure VII, Q-Q Plot of Sample Means coming from Poisson Distribution with $\lambda = 0.5$ and sample size of 516 + +![qpoisson05](/home/rozek/Pictures/stat381lab3/qpoisson05.png) + +#### Figure VIII, Histogram of Sample Means coming from Poisson Distribution with $\lambda = 1$ and sample size of 215 + +![histpoisson1](/home/rozek/Pictures/stat381lab3/histpoisson1.png) + +#### Figure IX, Q-Q Plot of Sample Means coming from Poisson Distribution with $\lambda = 1$ and sample size of 215 + +![qpoisson1](/home/rozek/Pictures/stat381lab3/qpoisson1.png) + +#### Figure X, Histogram of Sample Means coming from Poisson Distribution of $\lambda = 5$ and sample size of 53 + +![histpoisson5](/home/rozek/Pictures/stat381lab3/histpoisson5.png) + +#### Figure XI, Q-Q Plot of Sample Means coming from Poisson Distribution of $\lambda = 5$ and sample size of 53 + +![qpoisson5](/home/rozek/Pictures/stat381lab3/qpoisson5.png) + +#### Figure XII, Histogram of Sample Means coming from Poisson Distribution of $\lambda = 10$ and sample size of 31 + +![histpoisson10](/home/rozek/Pictures/stat381lab3/histpoisson10.png) + +#### Figure XIII, Q-Q Plot of Sample Means coming from Poisson Distribution of $\lambda = 10$ and sample size of 31 + +![qpoisson10](/home/rozek/Pictures/stat381lab3/qpoisson10.png) + +#### Figure XIV, Histogram of Sample Means coming from Poisson Distribution of $\lambda = 50$ and sample size of 10 + +![histpoisson50](/home/rozek/Pictures/stat381lab3/histpoisson50.png) + +#### Figure XV, Q-Q Plot of Sample Means coming from Poisson Distribution of $\lambda = 50$ and sample size of 10 + +![qpoisson50](/home/rozek/Pictures/stat381lab3/qpoisson50.png) + +#### Figure XVI, Histogram of Sample Means coming from Poisson Distribution of $\lambda = 100$ and sample size of 6 + +![histpoisson100](/home/rozek/Pictures/stat381lab3/histpoisson100.png) + +#### Figure XVII, Q-Q Plot of Sample Means coming from Poisson Distribution of $\lambda = 100$ and sample size of 6 + +![qpoisson100](/home/rozek/Pictures/stat381lab3/qpoisson100.png) + +#### Figure XVIII, Histogram of sample size needed to fail to reject the normality test for Poisson Distribution of $\lambda = 0.1$ + +![histl01](/home/rozek/Pictures/stat381lab3/histl01.png) + +#### Figure XIX, Histogram of sample size needed to fail to reject the normality test for Poisson Distribution of $\lambda = 0.5$ + +![histl05](/home/rozek/Pictures/stat381lab3/histl05.png) + +#### Figure XX, Histogram of sample size needed to fail to reject the normality test for Poisson Distribution of $\lambda = 1$ + +![histl1.0](/home/rozek/Pictures/stat381lab3/histl1.0.png) + +#### Figure XXI, Histogram of sample size needed to fail to reject the normality test for Poisson Distribution of $\lambda = 5$ + +![histl5](/home/rozek/Pictures/stat381lab3/histl5.png) + +####Figure XXII, Histogram of sample size needed to fail to reject the normality test for Poisson Distribution of $\lambda = 10$ + +![histl10](/home/rozek/Pictures/stat381lab3/histl10.png) + +####Figure XXIII, Histogram of sample size needed to fail to reject the normality test for Poisson Distribution of $\lambda = 50$ + +![histl50](/home/rozek/Pictures/stat381lab3/histl50.png) + +#### Figure XXIV, Histogram of sample size needed to fail to reject the normality test for Poisson Distribution of $\lambda = 100$ + +![histl100](/home/rozek/Pictures/stat381lab3/histl100.png) + +### R Code + +```R +rm(list=ls()) +library(ggplot2) + +sample_mean_uniform = function(n) { + xbarsunif = numeric(5000) + for (i in 1:5000) { + sumunif = 0 + for (j in 1:n) { + sumunif = sumunif + runif(1, 0, 1) + } + xbarsunif[i] = sumunif / n + } + xbarsunif +} + +sample_mean_poisson = function(n, lambda) { + xbarspois = numeric(5000) + for (i in 1:5000) { + sumpois = 0 + for (j in 1:n) { + sumpois = sumpois + rpois(1, lambda) + } + xbarspois[i] = sumpois / n + } + xbarspois +} + + +poisson_n_to_approx_normal = function(lambda) { + print(paste("Looking at Lambda =", lambda)) + ns = c() + + # Speed up computation of lower lambda values by starting at a different sample size + # and/or lowering the precision by increasing the delta sample size + # and/or lowering the number of sample sizes we obtain from the shapiro loop + increaseBy = 1; + iter = 3; + startingValue = 2 + if (lambda == 0.1) { + startingValue = 2000; + iter = 3; + increaseBy = 50; + } else if (lambda == 0.5) { + startingValue = 200; + iter = 5; + increaseBy = 10; + } else if (lambda == 1) { + startingValue = 150; + iter = 25; + } else if (lambda == 5) { + startingValue = 20; + iter = 50; + startingValue = 10; + } else if (lambda == 10) { + iter = 100; + } else { + iter = 500; + } + + progressIter = 1 + for (i in 1:iter) { + + # Include a progress indicator for personal sanity + if (i / iter > .1 * progressIter) { + print(paste("Progress", i / iter * 100, "% complete")) + progressIter = progressIter + 1 + } + + n = startingValue + + dist = sample_mean_poisson(n, lambda) + p.value = shapiro.test(dist)$p.value + while (p.value < 0.05) { + n = n + increaseBy + dist = sample_mean_poisson(n, lambda) + p.value = shapiro.test(dist)$p.value + + # More sanity checks + if (n %% 10 == 0) { + print(paste("N =", n, " p.value =", p.value)) + } + } + ns = c(ns, n) + } + + print(ggplot(data.frame(ns), aes(x = ns)) + + geom_histogram(fill = 'white', color = 'black', bins = 10) + + geom_vline(xintercept = ceiling(quantile(ns, .95)), col = '#0000AA') + + ggtitle(paste("Histogram of N needed for Poisson distribution of lambda =", lambda)) + + xlab("N") + + ylab("Count") + + theme_bw()) + + + ceiling(quantile(ns, .95)) #95% of the time, this value of n will give you a sampling distribution that is approximately normal +} + +uniform_n_to_approx_normal = function() { + ns = c() + progressIter = 1 + + for (i in 1:500) { + + # Include a progress indicator for personal sanity + if (i / 500 > .1 * progressIter) { + print(paste("Progress", i / 5, "% complete")) + progressIter = progressIter + 1 + } + + n = 2 + dist = sample_mean_uniform(n) + p.value = shapiro.test(dist)$p.value + while (p.value < 0.05) { + n = n + 1 + dist = sample_mean_uniform(n) + p.value = shapiro.test(dist)$p.value + + if (n %% 10 == 0) { + print(paste("N =", n, " p.value =", p.value)) + } + + } + + ns = c(ns, n) + } + + print(ggplot(data.frame(ns), aes(x = ns)) + + geom_histogram(fill = 'white', color = 'black', bins = 10) + + geom_vline(xintercept = ceiling(quantile(ns, .95)), col = '#0000AA') + + ggtitle("Histogram of N needed for Uniform Distribution") + + xlab("N") + + ylab("Count") + + theme_bw()) + + ceiling(quantile(ns, .95)) #95% of the time, this value of n will give you a sampling distribution that is approximately normal +} + + + +show_results = function(dist) { + print(paste("The mean of the sample mean distribution is:", mean(dist))) + print(paste("The standard deviation of the sample mean distribution is:", sd(dist))) + print(shapiro.test(dist)) + print(ggplot(data.frame(dist), aes(x = dist)) + + geom_histogram(fill = 'white', color = 'black', bins = 20) + + ggtitle("Histogram of Sample Means") + + xlab("Mean") + + ylab("Count") + + theme_bw()) + qqnorm(dist, pch = 1, col = '#001155', main = "QQ Plot", xlab = "Sample Data", ylab = "Theoretical Data") + qqline(dist, col="#AA0000", lty=2) +} + + +## PART I +uniform_mean_dist = sample_mean_uniform(n = 5) +poisson_mean_dist = sample_mean_poisson(n = 5, lambda = 1) + +show_results(uniform_mean_dist) +show_results(poisson_mean_dist) + +## PART II + +print("Starting Algorithm to Find Sample Size Needed for the Poisson Distribution of Lambda = 0.1"); +n.01 = poisson_n_to_approx_normal(0.1) +show_results(sample_mean_poisson(n.01, 0.1)) +print("Starting Algorithm to Find Sample Size Needed for the Poisson Distribution of Lambda = 0.5"); +n.05 = poisson_n_to_approx_normal(0.5) +show_results(sample_mean_poisson(n.05, 0.5)) +print("Starting Algorithm to Find Sample Size Needed for the Poisson Distribution of Lambda = 1"); +n.1 = poisson_n_to_approx_normal(1) +show_results(sample_mean_poisson(n.1, 1)) +print("Starting Algorithm to Find Sample Size Needed for the Poisson Distribution of Lambda = 5"); +n.5 = poisson_n_to_approx_normal(5) +show_results(sample_mean_poisson(n.5, 5)) +print("Starting Algorithm to Find Sample Size Needed for the Poisson Distribution of Lambda = 10"); +n.10 = poisson_n_to_approx_normal(10) +show_results(sample_mean_poisson(n.10, 10)) +print("Starting Algorithm to Find Sample Size Needed for the Poisson Distribution of Lambda = 50"); +n.50 = poisson_n_to_approx_normal(50) +show_results(sample_mean_poisson(n.50, 50)) +print("Starting Algorithm to Find Sample Size Needed for the Poisson Distribution of Lambda = 100"); +n.100 = poisson_n_to_approx_normal(100) +show_results(sample_mean_poisson(n.100, 100)) + +print("Starting Algorithm to Find Sample Size Needed for the Uniform Distribution") +n.uniform = uniform_n_to_approx_normal() +show_results(sample_mean_uniform(n.uniform)) +``` + diff --git a/content/notes/stat381/confint.md b/content/notes/stat381/confint.md new file mode 100644 index 0000000..9ed0f73 --- /dev/null +++ b/content/notes/stat381/confint.md @@ -0,0 +1,287 @@ +# Confidence Interval Lab + +**Written by Brandon Rozek** + +## Introduction + +Confidence intervals expands the concept of a point estimation by giving a margin of error such that one can be confident that a certain percentage of the time the true parameter falls within that interval. + +In this lab, we will look at confidence intervals for a mean. This lab focuses on a certain method of confidence intervals that depends on the distribution of sample means being Normal. We will show how the violation of this assumption impacts the probability that the true parameter falls within the interval. + +## Methods + +The observed level of confidence tells us the proportion of times the true mean falls within a confidence interval. To show how the violation of the Normality assumption affects this, we will sample from both a Normal distribution, T distribution, and exponential distribution with different sample sizes. + +The normal and T distributions are sampled with a mean of 5 and a standard deviation of 2. The exponential deviation is sampled with a lambda of 2 or mean of 0.5. + +From the samples, we obtain the mean and the upper/lower bounds of the confidence interval. This is performed 100,000 times. That way we obtain a distribution of these statistics. + +We know that a confidence interval is valid, if the lower bound is no more than the true mean and the upper bound is no less than the true mean. From this definition, we can compute a proportion of observed confidence from the simulations + +### Visualizations + +From the distributions of statistics, we can create visualizations to support the understanding of confidence intervals. + +The first one is a scatterplot of lower bounds vs upper bounds. This plot demonstrates the valid confidence intervals in blue and the invalid ones in red. It demonstrates how confidence intervals that are invalid are not located inside the box. + +The second visualization is a histogram of all the sample means collected. The sample means that didn't belong to a valid confidence interval are shaded in red. This graphic helps demonstrate the type I errors on both sides of the distribution. + +In this lab, we're interested in seeing how our observed level of confidence differs from our theoretical level of confidence (95%) when different sample sizes and distributions are applied. + +## Results + +We can see from the table section in the Appendix that sampling from a Normal or t distribution does not adversely affect our observed level of confidence. The observed level of confidence varies slightly from the theoretical level of confidence of 0.95. + +When sampling from the exponential distribution, however, the observed level of confidence highly depends upon the sample size. + +Looking at Table III, we can see that for a sample size of 10, the observed level of confidence is at a meager 90%. This is 5% off from our theoretical level of confidence. This shows how the normality assumption is vital to the precision of our estimate. + +This comes from the fact that using this type of confidence interval on a mean from a non-normal distribution requires a large sample size for the central limit theorem to take affect. + +The central limit theorem states that if the sample size is "large", the distribution of sample means approach the normal distribution. You can see how in Figure XVIII, the distribution of sample means is skewed, though as the sample size increases, the distribution of sample means become more symmetric (Figure XIX). + +## Conclusion + +From this, we can conclude that violating the underlying assumption of normality decreases the observed level of confidence. We can mitigate the decrease of the observed level of confidence when sampling means from a non-normal distribution by having a larger sample size. This is due to the central limit theorem. + +## Appendix + +### Tables + +#### Table I. Sampling from Normal + +| Sample Size | Proportion of Means Within CI | +| ----------- | ----------------------------- | +| 10 | 0.94849 | +| 20 | 0.94913 | +| 50 | 0.95045 | +| 100 | 0.94955 | + + + +#### Table II. Sampling from T Distribution + +| Sample Size | Proportion of Means Within CI | +| ----------- | ----------------------------- | +| 10 | 0.94966 | +| 20 | 0.94983 | +| 50 | 0.94932 | +| 100 | 0.94999 | + + + +#### Table III. Sampling from Exponential Distribution + +| Sample Size | Proportion of Means Within CI | +| ----------- | ----------------------------- | +| 10 | 0.89934 | +| 20 | 0.91829 | +| 50 | 0.93505 | +| 100 | 0.94172 | + + + + + +### Figures + +#### Normal Distribution + +##### Figure I. Scatterplot of Bounds for Normal Distribution of Sample Size 10 + +![normal10scatter](/home/rozek/Pictures/statlab4/normal10scatter.png) + +##### Figure II. Histogram of Sample Means for Normal Distribution of Sample Size 10 + +![normal10hist](/home/rozek/Pictures/statlab4/normal10hist.png) + +##### Figure III. Scatterplot of Bounds for Normal Distribution of Sample Size 20 + +![normal20scatterplot](/home/rozek/Pictures/statlab4/normal20scatterplot.png) + +##### Figure IV. Histogram of Sample Means for Normal Distribution of Sample Size 20 + +![normal20hist](/home/rozek/Pictures/statlab4/normal20hist.png) + +##### Figure VScatterplot of Bounds for Normal Distribution of Sample Size 50 + +![normal50scatterplot](/home/rozek/Pictures/statlab4/normal50scatterplot.png) + +##### Figure VI. Histogram of Sample Means for Normal Distribution of Sample Size 50 + +![normal50hist](/home/rozek/Pictures/statlab4/normal50hist.png) + +##### Figure VII. Scatterplot of Bounds for Normal Distribution of Sample Size 100 + +![normal100scatterplot](/home/rozek/Pictures/statlab4/normal100scatterplot.png) + +##### Figure VIII. Histogram of Sample Means for Normal Distribution of Sample Size 100 + +![normal100hist](/home/rozek/Pictures/statlab4/normal100hist.png) + +#### T Distribution + +##### Figure IX. Scatterplot of Bounds for T Distribution of Sample Size 10 + +![t10scatterplot](/home/rozek/Pictures/statlab4/t10scatterplot.png) + +##### Figure X. Histogram of Sample Means for T Distribution of Sample Size 10 + +![t10hist](/home/rozek/Pictures/statlab4/t10hist.png) + +##### Figure XI. Scatterplot of Bounds for T Distribution of Sample Size 20 + +![t20scatterplot](/home/rozek/Pictures/statlab4/t20scatterplot.png) + +##### Figure XII. Histogram of Sample Means for T Distribution of Sample Size 20 + +![t20hist](/home/rozek/Pictures/statlab4/t20hist.png) + +##### Figure XIII. Scatterplot of Bounds for T Distribution of Sample Size 50 + +![t50scatter](/home/rozek/Pictures/statlab4/t50scatter.png) + +##### Figure XIV. Histogram of Sample Means for T Distribution of Sample Size 50 + +![t50hist](/home/rozek/Pictures/statlab4/t50hist.png) + +##### Figure XV. Scatterplot of Bounds for T Distribution of Sample Size 100 + +![t100scatter](/home/rozek/Pictures/statlab4/t100scatter.png) + +##### Figure XVI. Histogram of Sample Means for T Distribution of Sample Size 100 + +![t100hist](/home/rozek/Pictures/statlab4/t100hist.png) + +#### Exponential Distribution + +##### Figure XVII. Scatterplot of Bounds for Exponential Distribution of Sample Size 10 + +![exp10scatter](/home/rozek/Pictures/statlab4/exp10scatter.png) + +##### Figure XVIII. Histogram of Sample Means for Exponential Distribution of Sample Size 10 + +![exp10hist](/home/rozek/Pictures/statlab4/exp10hist.png) + +##### Figure XIX. Scatterplot of Bounds for Exponential Distribution of Sample Size 20 + +![exp20scatter](/home/rozek/Pictures/statlab4/exp20scatter.png) + +##### Figure XX. Histogram of Sample Means for Exponential Distribution of Sample Size 20 + +![exp20hist](/home/rozek/Pictures/statlab4/exp20hist.png) + +##### Figure XXI. Scatterplot of Bounds for Exponential Distribution of Sample Size 50 + +![exp50scatter](/home/rozek/Pictures/statlab4/exp50scatter.png) + +##### Figure XXII. Histogram of Sample Means for Exponential Distribution of Sample Size 50 + +![exp50hist](/home/rozek/Pictures/statlab4/exp50hist.png) + +##### Figure XXIII. Scatterplot of Bounds for Exponential Distribution of Sample Size 100 + +![exp100scatter](/home/rozek/Pictures/statlab4/exp100scatter.png) + +##### Figure XXIV. Histogram of Sample Means for Exponential Distribution of Sample Size 100 + +![exp100hist](/home/rozek/Pictures/statlab4/exp100hist.png) + + + +### R Code + +```R +rm(list=ls()) +library(ggplot2) +library(functional) # For function currying + +proportion_in_CI = function(n, mu, dist) { + + # Preallocate vectors + lower_bound = numeric(100000) + upper_bound = numeric(100000) + means = numeric(100000) + + number_within_CI = 0 + + ME = 1.96 * 2 / sqrt(n) ## Normal Margin of Error + + for (i in 1:100000) { + x = numeric(n) + + # Sample from distribution + if (dist == "Normal" | dist == "t") { + x = rnorm(n,mu,2) + } else if (dist == "Exponential") { + x = rexp(n, 1 / mu) + } + + ## Correct ME if non-normal + if (dist != "Normal") { + ME = qt(0.975,n-1)*sd(x)/sqrt(n) + } + + ## Store statistics + means[i] = mean(x) + lower_bound[i] = mean(x) - ME + upper_bound[i] = mean(x) + ME + + # Is Confidence Interval Valid? + if (lower_bound[i] < mu & upper_bound[i] > mu) { + number_within_CI = number_within_CI + 1 + } + } + + # Prepare for plotting + lbub = data.frame(lower_bound, upper_bound, means) + lbub$col = ifelse(lbub$lower_bound < mu & lbub$upper_bound > mu, 'Within CI', 'Outside CI') + print(ggplot(lbub, aes(x = lower_bound, y = upper_bound, col = col)) + + geom_point(pch = 1) + + geom_hline(yintercept = mu, col = '#000055') + + geom_vline(xintercept = mu, col = '#000055') + + ggtitle(paste("Plot of Lower Bounds vs Upper Bounds with Sample Size of ", n)) + + xlab("Lower Bound") + + ylab("Upper Bounds") + + theme_bw() + ) + print(ggplot(lbub, aes(x = means, fill = col)) + + geom_histogram(color = 'black') + + ggtitle(paste("Histogram of Sample Means with Sample Size of ", n)) + + xlab("Sample Mean") + + ylab("Count") + + theme_bw() + ) + + # Return proportion within CI + number_within_CI / 100000 +} + +sample_sizes = c(10, 20, 50, 100) + +### PART I +proportion_in_CI_Normal = Curry(proportion_in_CI, dist = "Normal", mu = 5) +p_norm = sapply(sample_sizes, proportion_in_CI_Normal) +sapply(p_norm, function(x) { + cat("The observed proportion of intervals containing mu is", x, "\n") + invisible(x) +}) + + +### PART II +proportion_in_CI_T = Curry(proportion_in_CI, dist = "t", mu = 5) +p_t = sapply(sample_sizes, proportion_in_CI_T) +sapply(p_t, function(x) { + cat("The observed proportion of intervals containing mu is", x, "\n") + invisible(x) +}) + +### PART III +proportion_in_CI_Exp = Curry(proportion_in_CI, dist = "Exponential", mu = 0.5) +p_exp = sapply(sample_sizes, proportion_in_CI_Exp) +sapply(p_exp, function(x) { + cat("The observed proportion of intervals containing mu is", x, "\n") + invisible(x) +}) +``` + diff --git a/content/notes/stat381/randomnumber.md b/content/notes/stat381/randomnumber.md new file mode 100644 index 0000000..dcdb5d4 --- /dev/null +++ b/content/notes/stat381/randomnumber.md @@ -0,0 +1,441 @@ +# Random Number Generation + +## Introduction + +The generation of random numbers have a variety of applications including but not limited to the modeling of stochastic processes. It is important, therefore, to be able to generate any random number following a given distribution. One of the many ways to achieve this is to transform numbers sampled from a random uniform distribution. + +In this lab, we will compare the effectiveness between the linear congruence method (LCM), `runif`, and `rexp` to generate random numbers. The programming language R will be used and different plots and summary statistics are drawn upon to analyze the effectiveness of the methods. + +## Methods + +### The Linear Congruential Method + +The linear congruential method (LCM) is an algorithm that produces a sequence of pseudo-random numbers using the following recursive function +$$ +X_{n + 1} = (aX_n + c) \mod m +$$ +The R code we use has a `c` value of 0 which is a special case known as the multiplicative congruential generator (MCG). + +There are several conditions for using a MCG. First, the seed value must be co-prime to `m`. In other words, the greatest common denominator between the two must be 1. A function was written in R to check this. Secondly, `m` must be a prime number or a power of a prime number. + +#### Periodicity + +An element of periodicity comes into play when dealing with pseudo-random number generators. Once the generator has produced a certain number of terms, it is shown to loop back to the first term of the sequence. It is advantageous, therefore, to keep the period high. + +The period in a MCG is at most `m - 1`. In this lab, `m` has a value of $2^{31}$ and only 100 numbers were sampled from the LCM. This allows us to avoid the issue of periodicity entirely in our analysis. + +### Mersenne-Twister Method + +The default pseudo-random number generator (pseudo RNG) in R is the Mersenne-Twister with the default seed value of the current time and the process id of the current R instance. Mersenne-Twister is part of a class of pseudo RNG called the generalized feedback register. This class of pseudo RNGs provide a very long period (VLP) or in other words, a long cycle before the values start repeating. VLPs are often useful when executing large simulations in R. + +Since this method is already coded in the `base` R-package, we will leave the implementation for the curious to research. + +### The Uniform Distribution + +#### Probability Mass Function + +The uniform distribution function $Unif(\theta_1, \theta_2)$ has a probability mass function (PMF) of the following. +$$ +f(x) = \frac{1}{\theta_2 - \theta_1} +$$ +Where x is valid between [$\theta_1$, $\theta_2$]. + +In our case, we are producing numbers from [0,1]. We can therefore reduce the probability mass function to the following +$$ +f(x) = 1 +$$ +#### Expected Value + +The expected value can be defined as +$$ +E(X) = \int_a^b xf(x)dx +$$ +For the uniform distribution we're using that becomes +$$ +E(X) = \int_0^1 xdx = \frac{1}{2}[x^2]_0^1 = \frac{1}{2} +$$ +We should, therefore, expect the mean of the generated random number sequence to roughly equal $\frac{1}{2}$. + +#### Median + +To find the median of the distribution, we need to find the point at which the cumulative density function (CDF) is equal to .5. +$$ +\int_0^{Median(X)} f(x)dx = \frac{1}{2} +$$ +$$ +\int_0^{Median(X)} dx = \frac{1}{2} +$$ + +$$ +[X]_0^{Median(X)} = \frac{1}{2} +$$ + +$$ +Median(X) = \frac{1}{2} +$$ + +This shows us that the median of the distribution should be roughly equal to $\frac{1}{2}$ as well. + +#### Analysis of Uniform Distribution Fit + +The histogram of a uniform distribution of data should look rectangular in shape. This means that the counts of all the sub-intervals should be about the same. + +Another way to test whether or not the distribution is a good fit is to use what is called a Quantile-Quantile plot (Q-Q Plot). This is a probability plot that compares the quantiles from the theoretical distribution, this is the uniform distribution, to that of the sample. + +For a precise Q-Q Plot, we need a lot of quantiles to compare. In this lab, we will compare 100 different quantiles. The quantiles from the theoretical distribution can be easily derived from the fact that all value ranges are equally probable. The theoretical quantiles in this case is 0.01, 0.02, ..., 0.98, 0.99, 1. The sample quantiles are obtianed by receiving 100 observations from `runif` or the LCM. + +In the Q-Q plot, a good fit is shown when the points hug closely to the Q-Q line. It is also important to have symmetry in the points. This means that the points are ending on opposite sides of the Q-Q line. + +For sake of exploration, we will use 5 different seed values for the linear congruential method (while making sure that the seed values are co-prime). We will then use the results of these and compare LCM to how the standard `runif` method generates random numbers. + +### Exponential Distribution + +#### Probability Mass Function and the Cumulative Density Function + +The exponential distribution is a type of continuous distribution that is defined by the following PMF +$$ +f(x) = \lambda e^{-\lambda t} +$$ +We can find the CDF by taking the integral of the PMF. +$$ +F(x) = \int f(x)dx = \lambda \int e^{-\lambda x} dx = \lambda * (\frac{-1}{\lambda}) e^{-\lambda x} + C = -e^{-\lambda x} + C +$$ +One of the conditions for the cumulative density function is that as $x \to \infty$, $F(x) \to 1$. +$$ +1 = \lim_{x \to \infty} (-e^{-\lambda x} + C) = \lim_{x \to \infty} (-e^{-\lambda x}) + lim_{x \to \infty} ( C) = \lim_{x \to \infty}(-e^{\lambda x}) + C +$$ +This shows that $C = 1$, since $lim_{x \to \infty} (-e^{-\lambda x})$ is equal to 0. + +Substituting $C​$ gives us the following. +$$ +F(x) = 1 - e^{-\lambda x} +$$ + +#### Expected Value + +We can find the expected value using the formula described in the previous Expected Value section. Reflected in the bounds of integration is the domain of the exponential distribution $[0, \infty)$. +$$ +E(X) = \lim_{a \to \infty}\int_0^a x \lambda e^{-\lambda x} dx +$$ +The integral above features a product of two functions. So as an aside, we will derive a formula so we can take the integral above. + +The total derivative is defined as +$$ +d(uv) = udv + vdu +$$ + + +After taking the integral of both sides, we can solve for a formula that gives the following +$$ +\int d(uv) = \int udv + \int vdu +$$ + +$$ +\int udv = uv - \int vdu +$$ + +The formula above is called *Integration by Parts*. We will make use of this formula by defining $u = \lambda x$ and $dv = e^{-\lambda x} dx$ + +This implies that $du = \lambda dx$ and $v= -\frac{1}{\lambda}e^{-\lambda x}$ +$$ +E(X) = -\lim_{a \to \infty}[\lambda x \frac{1}{\lambda}e^{-\lambda x}]_0^a - \lim_{b \to \infty}\int_0^b -\frac{1}{\lambda}e^{-\lambda x}\lambda dx +$$ + +$$ +E(X) = -\lim_{a \to \infty} [xe^{-\lambda x}]_0^a - \lim_{b \to \infty}\int_0^b -e^{-\lambda x}dx +$$ + +$$ +E(X) = -\lim_{a \to \infty}(ae^{-\lambda a}) - \lim_{b \to \infty}[\frac{1}{\lambda}e^{-\lambda x}]_0^b +$$ + +$$ +E(X) = 0 - \frac{1}{\lambda}[\lim_{b \to \infty}(e^{-\lambda b}) - e^{-0\lambda}] +$$ + +$$ +E(X) = -\frac{1}{\lambda}(-1) = \frac{1}{\lambda} +$$ + +For the purposes of this lab, we will make the rate ($\lambda$) equal to 3. Which means we should expect our mean to be roughly equal to $\frac{1}{3}$. + +#### Median + +The median can be found by setting the CDF equal to $\frac{1}{2}$ +$$ +1- e^{-\lambda Median(X)} = \frac{1}{2} +$$ + +$$ +e^{-\lambda Median(X)} = \frac{1}{2} +$$ + +$$ +-\lambda Median(X) = \ln(\frac{1}{2}) +$$ + +$$ +Median(X) = \frac{\ln(2)}{\lambda} +$$ + +This shows that we should expect our median to be around $\frac{\ln(2)}{3} \approx 0.231$. + +### Inverse Transform Sampling + +Once we have a uniform distribution of values, we can then use these values to map to an exponential distribution. This is done through a technique called inverse transform sampling, the technique works as follows: + +1. Generate a random number u from the standard uniform distribution +2. Compute the value of X such that F(X) = u +3. The value of X belongs to the distribution of F + +Using these steps, we'll derive the exponential transform below. +$$ +F(X) = 1 - e^{-\lambda x} = u +$$ +Then proceeding to solve for X, we obtain the following. +$$ +e^{-\lambda X} = 1 - u +$$ + +$$ +-\lambda X = \ln(1 - u) +$$ + +$$ +X = \frac{-\ln(1 - u)}{\lambda} +$$ + +With this formula, we can now find values for X which is a random variable that follows an exponential distribution given random uniform data $u$. + +In this lab, we are looking at the exponential distribution with a rate of 3. Therefore, the probability mass function, the cumulative distribution function, and the exponential transform can be redefined as these respectively. +$$ +f(x) = 3e^{-3x} +$$ + +$$ +F(x) = 1 - e^{-3x} +$$ + +$$ +X = \frac{-\ln(1 - u)}{3} +$$ + +### R Code + +The R code makes use of the concepts above. The purpose of this code is to output the summary statistics, histograms, and Q-Q plots are used to compare the different methods. + +First the LCM is executed four times with three different seed values. The LCM is used to create a uniform distribution of data that is then compared to the standard `runif` function in the R language. + +Then, transformations of a LCM, `runif`, are executed and compared with the standard `rexp` to create an exponential distribution of data with $\lambda = 3$. + + + +## Results + +### Uniform Distribution + +For a small sample of 100 values, the data seems evenly distributed for all seeds and methods used. The peaks and troughs are more pronounced in the LCM methods suggesting that the `runif` command creates more evenly distributed data than the LCM. + +Deviations from the mean and median are lowest for the LCM rather than the standard `runif` command with the exception of the LCM with the seed of 93463. + +The Q-Q plots for all of the methods follow the Q-Q Line tightly and appear symmetric. + +### Exponential Distribution + +A bin size of 20 is used to make the histograms easily comparable to each other. One interesting thing to note is that in Figure XI, there is an observation located far out from the rest of the data. For the purpose of a histogram, which is to show us the shape of the distribution, this one far observation skews what we can see. Therefore the next figure, Figure XII has that single outlier removed and shows the histogram of the rest of the data. + +All of the histograms appear exponential in shape. Looking at the Q-Q plots, the LCM transformation and the `rexp` distribution of data fit closely to the QQ-Line. All of the Q-Q Plots have the points getting further away from the line as you get higher up in the percentiles. The `runif` transformation quantiles diverge from the line after about the 50th percentile. + +Deviations from the mean and median were about the same for both transformed techniques (`runif` and LCM). The `rexp` command did better when it came to the deviation from the mean, but performed worse when it came to deviation from the median. + +## Conclusion + +The linear congruential methods performed better when it came to simulating the distribution than the standard R functions. It more accurately captured the median for both the standard uniform data, and the exponential data. Against the `runif` command, it also performed better at simulating the mean. + +This can especially be seen when comparing the two transform techniques. The transformed LCM distribution of data followed the Q-Q line more tightly than the transformed `runif`. + +I speculate that this is due to the seed value used. The Mersenne-Twist method performs better when the seed value doesn't have many zeros in it. Since the seed value is determined by the system time and process id, we don't know for sure if it's a proper input for the Mersenne-Twist. For the LCM, seeds were properly tested to make sure that it was co-prime with one of its parameters. This condition allowed proper seeds to work well with the LCM. + +Further research can be done on standardizing the seed values used across all the different pseudo random number generators and looking at the 6 other pseudo RNG that comes built into R. Changing the seed and random number generator can be achieved through the `set.seed` function. + +## Appendix + +### Figures + +#### Figure I, Histogram of LCM Random Data with seed 55555 + +![](file:///home/rozek/Pictures/stat381lab2/hist55555.png) + +#### Figure II, Q-Q Plot of LCM Random Data with seed 55555 + +![qqplot55555](/home/rozek/Pictures/stat381lab2/qqplot55555.png) + +#### Figure III, Histogram of LCM Random Data with seed 93463 + +![hist93463](/home/rozek/Pictures/stat381lab2/hist93463.png) + +#### Figure IV, Q-Q Plot of LCM Random Data with seed 93463 + +![q93463](/home/rozek/Pictures/stat381lab2/q93463.png) + +#### Figure V, Histogram of LCM Random Data with seed 29345 + +![hist29345](/home/rozek/Pictures/stat381lab2/hist29345.png) + +#### Figure VI, Q-Q Plot of LCM Random Data with seed 29345 + +![q29345](/home/rozek/Pictures/stat381lab2/q29345.png) + + + +#### Figure VII, Histogram of LCM Random Data with seed 68237 + +![hist68237](/home/rozek/Pictures/stat381lab2/hist68237.png) + +#### Figure VIII, Q-Q Plot of LCM Random Data with seed 68237 + +![q68237](/home/rozek/Pictures/stat381lab2/q68237.png) + +#### Figure IX, Histogram of R Random Uniform Data + +![histunif](/home/rozek/Pictures/stat381lab2/histunif.png) + +#### Figure X, Q-Q Plot of R Random Uniform Data + +![qunif](/home/rozek/Pictures/stat381lab2/qunif.png) + +#### Figure XI, Histogram of Exponential Data from LCM Random + +![histexplcm](/home/rozek/Pictures/stat381lab2/histexplcm.png) + +#### Figure XII, Histogram of Exponential Data from LCM Random without Outlier Above 2 + +![histexplcm_nooutlier](/home/rozek/Pictures/stat381lab2/histexplcm_nooutlier.png) + +#### Figure XIII, Q-Q Plot of Exponential Data from LCM Rnadom + +![qexplcm](/home/rozek/Pictures/stat381lab2/qexplcm.png) + +#### Figure XIV, Histogram of Exponential Data from R Random Uniform + +![histexpunif](/home/rozek/Pictures/stat381lab2/histexpunif.png) + +#### Figure XV, Q-Q Plot of Exponential Data from R Random Uniform + +![qexpunif](/home/rozek/Pictures/stat381lab2/qexpunif.png) + +#### Figure XVI, Histogram of R Generated Exponential Data + +![histexp](/home/rozek/Pictures/stat381lab2/histexp.png) + +#### Figure XVII, Q-Q Plot of R Generated Exponential Data + +![qexp](/home/rozek/Pictures/stat381lab2/qexp.png) + +### Tables + +#### Table I, Uniform Distribution Sample Data + +| Method | Mean ($\bar{x}$) | Median ($\tilde{x}$) | $\mu - \bar{x}$ | $m - \tilde{x}$ | +| ------------------- | ---------------- | -------------------- | --------------- | --------------- | +| LCM with seed 55555 | 0.505 | 0.521 | -0.005 | -0.021 | +| LCM with seed 93463 | 0.452 | 0.402 | 0.048 | 0.098 | +| LCM with seed 29345 | 0.520 | 0.502 | -0.020 | -0.002 | +| LCM with seed 68237 | 0.489 | 0.517 | 0.011 | -0.017 | +| R Random Uniform | 0.480 | 0.471 | 0.020 | 0.029 | + +#### Table II, Exponential Distribution Sample Data + +| Method | Mean | Median | $\mu - \bar{x}$ | $m - \tilde{x}$ | +| --------------- | ----- | ------ | --------------- | --------------- | +| LCM Transform | 0.380 | 0.246 | -0.047 | -0.015 | +| RUnif Transform | 0.283 | 0.218 | 0.050 | 0.013 | +| R Exponential | 0.363 | 0.278 | -0.030 | -0.047 | + +### R Code + +```R +library(ggplot2) +linear_congruential = function(seed) { + a = 69069 + c = 0 + m = 2^31 + x = numeric(100) + x[1] = seed + for (i in 2:100) { + x[i] = (a * x[i-1] + c) %% m + } + xnew = x / (max(x) + 1) + xnew +} + +gcd = function(x,y) { + r = x %% y; + return(ifelse(r, gcd(y, r), y)) +} +check_seed = function(seed) { + if (gcd(seed, 2^31) == 1) { + print(paste("The seed value of", seed, "is co-prime")) + } else { + print(paste("The seed value of", seed, "is NOT co-prime")) + } +} + +check_data = function(data, distribution, title) { + print(paste("Currently looking at", title)) + print(summary(data)) + print(ggplot(data.frame(data), aes(x = data)) + + geom_histogram(fill = 'white', color = 'black', bins = 10) + + xlab("Date") + + ylab("Frequency") + + ggtitle(paste("Histogram of", title)) + + theme_bw()) + uqs = (1:100) / 100 + if (distribution == "Uniform") { + qqplot(data, uqs, pch = 1, col = '#001155', main = paste("QQ Plot of", title), xlab = "Sample Data", ylab = "Theoretical Data") + qqline(uqs, distribution = qunif, col="red", lty=2) + } else if (distribution == "Exponential") { + eqs = -log(1-uqs) / 3 + qqplot(data, eqs, pch = 1, col = '#001155', main = paste("QQ Plot of", title), xlab = "Sample Data", ylab = "Theoretical Data") + qqline(eqs, distribution=function(p) { qexp(p, rate = 3)}, col="#AA0000", lty=2) + } +} + +seed1 = 55555 +seed2 = 93463 +seed3 = 29345 +seed4 = 68237 + +check_seed(seed1) +lin_cong = linear_congruential(seed1) +check_data(lin_cong, "Uniform", paste("LCM Random Data with seed", seed1)) + +check_seed(seed2) +lin_cong2 = linear_congruential(seed2) +check_data(lin_cong2, "Uniform", paste("LCM Random Data with seed", seed2)) + +check_seed(seed3) +lin_cong3 = linear_congruential(seed3) +check_data(lin_cong3, "Uniform", paste("LCM Random Data with seed", seed3)) + +check_seed(seed4) +lin_cong4 = linear_congruential(seed4) +check_data(lin_cong4, "Uniform", paste("LCM Random Data with seed", seed4)) + +# Using the standard built-in R function +unif = runif(100, 0, 1) +check_data(unif, "Uniform", "R Random Uniform Data") + +# Building exponential from linear congruence method +exp1 = -log(1 - lin_cong) / 3 +check_data(exp1, "Exponential", "Exponential Data from LCM Random") + +# Building exponential from runif +exp2 = -log(1 - unif) / 3 +check_data(exp2, "Exponential", "Exponential Data from R Random Uniform") + +# Building exponential from rexp +exp3 = rexp(100, rate = 3) +check_data(exp3, "Exponential", "R Generated Exponential Data") +``` + diff --git a/content/notes/stat381/randomwalk.md b/content/notes/stat381/randomwalk.md new file mode 100644 index 0000000..6c78179 --- /dev/null +++ b/content/notes/stat381/randomwalk.md @@ -0,0 +1,551 @@ +# Random Walk + +## Introduction + +This lab features a random walk simulation that answers the following question: Given the radius of a circular room, how many random steps does it take to reach to reach the wall from the center? To explore this, we will look at the distribution of steps required and describe it in terms of a discrete probability distribution. Later on, we will look at the radius parameter and find relationships between it and the different summary statistics that we compute (mean, median, range, variance, skewness). + +The paper will start off with the methods used in this lab. The programming language R was used and a simulation was created to simulate a random walk according to the description above. It will also discuss the methods used to find the discrete probability distribution that best fits the data and how the relationship between the radii and the summary statistics were found using regression. + +After discussing the methods, the paper goes into the results. The discrete probability distribution of the data is revealed and the equations of the different summary statistics based on a regression of the radius is shared. + +## Methods + +### Obtaining the distribution of steps required + +The simulation written performs the following steps given the size of a room: + +1. Start off in the center of the room +2. Calculate a random angle $\theta$ +3. Step in the X direction by $cos(\theta)$ +4. Step in the Y direction by $sin(\theta)$ +5. Repeat steps 2-4 until the wall is reached + +The number of steps required is then recorded into a vector and the simulation is performed 999 more times. This gives us the distribution of steps required to reach the wall given the room size. + +### Computing summary statistics + +Given the distribution vector pertaining to the room size, we then find the following information: + +- Measures of Central Tendency: Mean & Median +- Measures of Variation: Variance & Range +- Skewness & Shape of Histogram + +For every room size selected, a total of three trials of 1000 simulations each is conducted. + +### Fitting the data to a distribution + +Since the simulation counts the steps required before reaching the walls of the room, it describes the process of a geometric distribution. To confirm the suspicion, the function `fitdistr` inside the package `MASS` was used to find the parameter (probability) of the geometric distribution to best fit the simulation data. In this case the simulation data used is of room size 100. + +The probability density histogram of the data is then shown with the overlay of the geometric distribution that best fit the data. + +Another more robust way to visually see the goodness of fit of the distribution is to use what is called a Quantile-Quantile Plot (Q-Q Plot), Using the quantiles from the theoretical distribution, we compare it to the quantiles of the simulated data and check to see that it follows the Q-Q line closely. + +### Finding relationships between the radii and the summary statistics + +From the simulations performed, vectors have been saved containing the summary statistics for the different room sizes. Vectors are then created from these vectors as columns inside a data frame. Having this data frame allows us to use `ggplot` to graph the data using scatter plots. + +`ggplot` was used as opposed to the conventional `base` package since it allows us to add layers to the graphs, which was used to show the geometric distribution on top of the density histogram in the previous section. `ggplot` is also aesthetically more pleasing as it decreases the margins and makes smart choices on the shadings of the axes on the graph. + +After plotting the data, regressions are then taken with respect to different polynomial degrees of radii and analyzed for best fit using the adjusted r squared value as a means for comparison. + +The adjusted r squared value is a good comparator since it tells us a proportion of how much the variation in the data is accounted for by the model. + +## Results + +The shape of the distribution matches the geometric distribution as shown in Figure IX & X. Figure IX shows how the probability density histogram nicely fits the overlay of the geometric distribution with the fitted parameters. The description of the problem closely matches the description of the geometric probability distribution and both distributions are skewed right. These observations increase our confidence that the distribution is a good fit. This can further be verified with the Q-Q Plot. + +The Q-Q Plot in Figure X shows how the theoretical quantiles compare with the quantiles from the distribution. Since the observed sample quantiles start off in one side of the Q-Q line and ends up on the other side at the end, we can say that the data is not skewed with respect to the theoretical distribution. This along with the fact that the sample quantiles closely fit the Q-Q line supports the proposition that the geometric distribution is a good fit for the steps required in the random walk. + +Regressions were then performed for each summary statistic and the models that had the lowest degree polynomial with respect to radii and with relatively small standard error were chosen. + +For the mean, quadratic regression was performed and it produces the following model +$$ +\mu(Steps) = -31.409 + 7.800(radii) + 0.837(radii^2) +$$ +With this model, the adjusted $r^2$ value is 99.938%, which tells us that 99.938% of the variation in means is accounted for by the quadratic regression above. It's fit to the observed values can be seen in Figure XI. + +For the median, quadratic regression was performed and produces the following model +$$ +\widetilde{Steps} = -19.525 + 5.096(radii) + 0.687(radii^2) +$$ +The model above has an adjusted $r^2$ value of 99.957% which tells us that 99.957% of the variation in medians is accounted for by the regression above. It's fit to the observed values can be seen in Figure XIII. + +For the range, the quadratic regression performed creates the following model +$$ +Range(Steps) = 63.873 - 9.073(radii) + 5.572(radii^2) +$$ +The model has an adjusted $r^2$ value of 99.278% which tells us that 99.278% of the variation in the ranges of steps is accounted for by the regression above. It's fit to the observed values can be seen in Figure XV. + +For the variance, the cubic regression performed creates the following model +$$ +\sigma^2(Steps) = -88471.866 + 32256.076(radii) - 2418.835(radii^2) + 61.650(radii^3) +$$ +The model has an adjusted $r^2$ value of 99.779% which tells us that 99.779% of the variation in the variations of steps is accounted for by the regression above. It's fit to the observed values can be seen in Figure XVII + +Looking at the scatter plot of radii vs skewness of steps shown in Figure XVIII, there appears to be no relationship between the radii and skewness of steps. What the scatter plot suggests that the skewness is uniformly distributed. + + + +## Conclusions + +In summation, the distribution of steps required to reach the end of the wall follow a geometric distribution. This was backed up using the probability density histogram and the Q-Q Plot. + +Most of the summary statistics follow a quadratic regression while the variation follows a cubic regression. Skewness are uniformly distributed across the different simulations. + +In other words, the mean, median, and range follow a function that is a second degree polynomial based on the size of the room ($r^2$) and the variation follows a function that is a third degree polynomial based on the size of the room $(r^3)$ + + + +## Appendix + +### Tables + +#### Table I, Summary Statistics for Room Radius of 2 + +| Trial | Mean | Median | Variance | Range | Skewness | +| ----- | ----- | ------ | -------- | ------ | -------- | +| 1 | 5.827 | 5.000 | 13.471 | 36.000 | 2.446 | +| 2 | 5.761 | 5.000 | 10.635 | 22.000 | 1.780 | +| 3 | 5.805 | 5.000 | 11.430 | 21.000 | 1.882 | + + + +#### Table II, Summary Statistics for Room Radius of 3 + +| Trial | Mean | Median | Variance | Range | Skewness | +| ----- | ------ | ------ | -------- | ------ | -------- | +| 1 | 11.566 | 9.000 | 59.055 | 60.000 | 1.854 | +| 2 | 11.940 | 10.000 | 74.487 | 68.000 | 2.467 | +| 3 | 11.242 | 9.000 | 53.417 | 48.000 | 1.922 | + + + +#### Table III, Summary Statistics for Room Radius of 4 + +| Trial | Mean | Median | Variance | Range | Skewness | +| ----- | ------ | ------ | -------- | ------- | -------- | +| 1 | 19.306 | 15.000 | 171.688 | 90.000 | 1.721 | +| 2 | 18.127 | 15.000 | 143.284 | 74.000 | 1.712 | +| 3 | 18.993 | 15.000 | 180.892 | 111.000 | 2.089 | + + + +#### Table IV, Summary Statistics for Room Radius of 5 + +| Trial | Mean | Median | Variance | Range | Skewness | +| ----- | ------ | ------ | -------- | ------- | -------- | +| 1 | 29.272 | 23.000 | 405.817 | 150.000 | 1.737 | +| 2 | 28.382 | 22.000 | 402.801 | 146.000 | 1.862 | +| 3 | 27.891 | 22.000 | 390.221 | 211.000 | 2.308 | + + + +#### Table V, Summary Statistics for Room Radius of 10 + +| Trial | Mean | Median | Variance | Range | Skewness | +| ----- | ------- | ------ | -------- | ------- | -------- | +| 1 | 110.234 | 87.000 | 6070.976 | 547.000 | 1.780 | +| 2 | 109.594 | 88.000 | 5928.037 | 542.000 | 1.864 | +| 3 | 108.398 | 86.000 | 6469.467 | 621.000 | 2.191 | + + + +#### Table VI, Summary Statistics for Room Radius of 25 + +| Trial | Mean | Median | Variance | Range | Skewness | +| ----- | ------- | ------- | -------- | ----- | -------- | +| 1 | 623.260 | 492.000 | 197161.8 | 3262 | 1.965 | +| 2 | 637.890 | 511.000 | 212826.6 | 3394 | 2.009 | +| 3 | 653.661 | 528.5 | 211126.2 | 3694 | 1.841 | + + + +#### Table VII, Summary Statistics for Room Radius of 50 + +| Trial | Mean | Median | Variance | Range | Skewness | +| ----- | --------- | ------ | -------- | ----- | -------- | +| 1 | 2507.935 | 1939.0 | 3231980 | 11471 | 1.726 | +| 2 | 24675.615 | 1992.0 | 3248443 | 14150 | 2.060 | +| 3 | 2488.795 | 2001.5 | 3038915 | 14689 | 1.843 | + + + +#### Table VIII, Summary Statistics for Room Radius of 100 + +| Trial | Mean | Median | Variance | Range | Skewness | +| ----- | -------- | ------ | -------- | ----- | -------- | +| 1 | 8983.406 | 7257.0 | 38271895 | 52549 | 2.027 | +| 2 | 9372.917 | 7537.0 | 41658620 | 51810 | 1.867 | +| 3 | 8974.549 | 7294.5 | 41868765 | 60326 | 2.420 | + + + +### Figures + +#### Figure I, Histogram of Room Radius 2 + +![img]() + + + + + +#### Figure II, Histogram of Room Radius 3 + +![img]() + + + + + +#### Figure III, Histogram of Radius 4 + +![img]() + + + + + +#### Figure IV, Histogram of Radius 5 + +![img]() + + + + + +#### Figure V, Histogram of Radius 10 + +![img]() + + + + + +#### Figure VI, Histogram of Radius 25 + +![img]() + + + + + +#### Figure VII, Histogram of Radius 50 + +![img]() + + + + + +#### Figure VIII, Histogram of Radius 100 + +![img]() + + + + + +#### Figure IX, Probability Density Histogram + +![img]() + + + + + +#### Figure X, QQ-Plot of Theoretical vs Sample Data + +![img]() + + + + + +#### Figure XI, Scatterplot of Radii vs Mean Steps + +![img]() + + + + + +#### Figure XII, Scatterplot with Quadratic Regression of Radii vs Mean Steps + +![img]() + + + + + +#### Figure XIII, Scatterplot of Radii vs Median Steps + +![img]() + + + + + +#### Figure XIV, Scatterplot with Quadratic Regression of Radii vs Median Steps + +![img]() + + + + + +#### Figure XV, Scatterplot of Radii vs Range of Steps + +![img]() + + + + + +#### Figure XVI, Scatterplot with Quadratic Regression of Radii vs Range of Steps + +![img]() + + + + + +#### Figure XVII, Scatterplot of Radii vs Variance of Steps + +![img]() + + + + + +#### Figure XVIII, Scatterplot with Cubic Regression of Radii vs Variance of Steps + +![img]() + + + + + +#### Figure XIX, Scatterplot of Radii vs Skewness + +![img]() + + + + + +### R Code + +```R +rm(list=ls()) +library(moments) +library(ggplot2) + +simulateRoom = function(r) { + n = 1000 + results = numeric(n) + x = 0 + y = 0 + dist = 0 + num = 0 + for (i in 1:n) { + while(dist < r) { + deg = runif(1, min=0, max=360) + newx = cos(deg) + newy = sin(deg) + x = x + newx + y = y + newy + num = num+ 1 + dist=(x^2 + y^2)^0.5 + } + results[i] = num + x= 0 + y = 0 + dist = 0 + num = 0 + i = i + 1 + } + return(results) +} + +repetitions = 3 +radii = c(2, 3, 4, 5, 10, 25, 50, 100) + +median_stepcount = c() +mean_stepcount = c() +variance_stepcount = c() +range_stepcount = c() +skewness_stepcount = c() +for (r in radii) { + room_data = data.frame() + print(paste("Currently simulating r =", r)) + for (i in 1:repetitions) { + simulation = simulateRoom(r) + + ## Summary Statistics + variance = var(simulation) + skewness_ = skewness(simulation) + range_data = range(simulation) + + room_data_temp = data.frame(i, mean(simulation), median(simulation), variance, range_data[2] - range_data[1], skewness_) + names(room_data_temp) = c("Trial", "Mean", "Median", "Variance", "Range", "Skewness") + room_data = rbind(room_data, room_data_temp) + + median_stepcount = c(median_stepcount, median(simulation)) + mean_stepcount = c(mean_stepcount, mean(simulation)) + variance_stepcount = c(variance_stepcount, variance) + range_stepcount = c(range_stepcount, range_data[2] - range_data[1]) + skewness_stepcount = c(skewness_stepcount, skewness_) + + simulation = data.frame(simulation) + print(ggplot(simulation, aes(x = simulation)) + + geom_histogram(color = 'black', fill = 'white') + + xlab("Steps") + + ylab("Count") + + ggtitle(paste("Distribution of r =", r)) + + theme_bw()) + } + print(room_data) +} + +## Show the probability distribution +library(MASS) +distribution = fitdistr(simulation$simulation, "geometric") +probability_simulation = data.frame(simulation, + rgeom(1:1000, distribution$estimate['prob'])) +names(probability_simulation) = c("simulation", "geometric") +ggplot(data = probability_simulation, aes(x = simulation)) + + geom_histogram(aes(y = ..density..), color = 'black', fill = 'white') + + geom_density(aes(x = geometric), fill = '#0000AA', alpha = .5) + + xlab("Steps") + + ylab("Probability Density") + + ggtitle("Probability Density Histogram with Geometric Overlay") + + theme_bw() + +## Calculate QQ Plot of Geometric Distribution and Sample +yquantiles = quantile(simulation$simulation, c(0.25, 0.75)) +xquantiles = qgeom(prob = distribution$estimate['prob'], c(0.25, 0.75)) +slope = diff(yquantiles) / diff(xquantiles) +intercept = yquantiles[1] - slope * xquantiles[1] +ggplot() + aes(sample=simulation$simulation) + + stat_qq(distribution=qgeom, dparams = distribution$estimate['prob']) + + geom_abline(intercept=intercept, slope=slope) + + ggtitle("QQ Plot of Geometric Distribution") + + xlab("Theoretical Quantiles") + + ylab("Sample Quantiles") + + theme_bw() + + +## Create a dataframe +room_simulation_data = data.frame(as.vector(sapply(radii, function(x) { rep(x, repetitions)})), mean_stepcount, median_stepcount, range_stepcount, skewness_stepcount, variance_stepcount) +names(room_simulation_data) = c("radii", "mean_stepcount", "median_stepcount", "range_stepcount", "skewness_stepcount", "variance_stepcount") +######### ANALYSIS OF MEANS +ggplot(room_simulation_data, aes(x = radii, y = mean_stepcount)) + + geom_point(shape = 21, size = 2) + + xlab("Radii") + + ylab("Mean Steps") + + ggtitle("Radii vs Mean Steps") + + theme_bw() + +## Quadratic Regression of Means +quadratic_mean_model = lm(mean_stepcount ~ poly(radii, 2, raw = T), data = room_simulation_data) +quadratic_mean_model_summary = summary(quadratic_mean_model) +ggplot(room_simulation_data, aes(x = radii, y = mean_stepcount)) + + geom_point(shape = 21, size = 2) + + geom_smooth(method = "lm", formula = y ~ poly(x, 2, raw = T), se = T) + + xlab("Radii") + + ylab("Mean Steps") + + ggtitle("Radii vs Mean Steps") + + theme_bw() + +## Analysis of Quadratic Regression of Means +quadratic_mean_coefficients = as.vector(quadratic_mean_model$coefficients) +print(paste("The quadratic regression equation is: Mean Steps =", quadratic_mean_coefficients[1], "+", quadratic_mean_coefficients[2], "radii", quadratic_mean_coefficients[3], "radii^2")) +print(paste(quadratic_mean_model_summary$adj.r.squared * 100, "% of the variation of the means is accounted for by the Quadratic Model", sep = "")) + + +######### ANALYSIS OF MEDIANS +ggplot(room_simulation_data, aes(x = radii, y = median_stepcount)) + + geom_point(shape = 21, size = 2) + + xlab("Radii") + + ylab("Median Steps") + + ggtitle("Radii vs Median Steps") + + theme_bw() + +## Quadratic Regression of Medians +quadratic_median_model = lm(median_stepcount ~ poly(radii, 2, raw = T), data = room_simulation_data) +quadratic_median_model_summary = summary(quadratic_median_model) +ggplot(room_simulation_data, aes(x = radii, y = median_stepcount)) + + geom_point(shape = 21, size = 2) + + geom_smooth(method = "lm", formula = y ~ poly(x, 2, raw = T), se = T) + + xlab("Radii") + + ylab("Median Steps") + + ggtitle("Radii vs Median Steps") + + theme_bw() + +## Analysis of Quadratic Regression of Medians +quadratic_median_coefficients = as.vector(quadratic_median_model$coefficients) +print(paste("The Quadratic Regression Equation is: Median Steps =", quadratic_median_coefficients[1], "+", quadratic_median_coefficients[2], "radii", quadratic_median_coefficients[3], "radii^2")) +print(paste(quadratic_median_model_summary$adj.r.squared * 100, "% of the variation of the medians is accounted for by the Quadratic Model", sep = "")) + + +######### ANALYSIS OF RANGES +ggplot(room_simulation_data, aes(x = radii, y = range_stepcount)) + + geom_point(shape = 21, size = 2) + + xlab("Radii") + + ylab("Range of Steps") + + ggtitle("Radii vs Range Steps") + + theme_bw() + +## Quadratic Regression of Ranges +quadratic_range_model = lm(range_stepcount ~ poly(radii, 2, raw = T), data = room_simulation_data) +quadratic_range_model_summary = summary(quadratic_range_model) +ggplot(room_simulation_data, aes(x = radii, y = range_stepcount)) + + geom_point(shape = 21, size = 2) + + geom_smooth(method = "lm", formula = y ~ poly(x, 2, raw = T), se = T) + + xlab("Radii") + + ylab("Range of Steps") + + ggtitle("Radii vs Range of Steps") + + theme_bw() + +## Analysis of Quadratic Regression of Ranges +quadratic_range_coefficients = as.vector(quadratic_range_model$coefficients) +print(paste("The Quadratic Regression Equation is: Range of Steps =", quadratic_range_coefficients[1], "+", quadratic_range_coefficients[2], "radii", quadratic_range_coefficients[3], "radii^2")) +print(paste(quadratic_range_model_summary$adj.r.squared * 100, "% of the variation of the ranges is accounted for by the Quadratic Model", sep = "")) + + + +######### ANALYSIS OF SKEWNESS +ggplot(room_simulation_data, aes(x = radii, y = skewness_stepcount)) + + geom_point(shape = 21, size = 2) + + xlab("Radii") + + ylab("Skewness") + + ggtitle("Radii vs Skewness Steps") + + theme_bw() + + +######### ANALYSIS OF VARIANCES +ggplot(room_simulation_data, aes(x = radii, y = variance_stepcount)) + + geom_point(shape = 21, size = 2) + + xlab("Radii") + + ylab("Variance of Steps") + + ggtitle("Radii vs Variance Steps") + + theme_bw() + +## Cubic Regression of Variance +cubic_variance_model = lm(variance_stepcount ~ poly(radii, 3, raw = T), data = room_simulation_data) +cubic_variance_model_summary = summary(cubic_variance_model) +ggplot(room_simulation_data, aes(x = radii, y = variance_stepcount)) + + geom_point(shape = 21, size = 2) + + geom_smooth(method = "lm", formula = y ~ poly(x, 3, raw = T), se = T) + + xlab("Radii") + + ylab("Variance of Steps") + + ggtitle("Radii vs Variance of Steps") + + theme_bw() + +## Analysis of Cubic Regression +cubic_variance_coefficients = as.vector(cubic_variance_model$coefficients) +print(paste("The Cubic Regression Equation is: Variance of Steps =", cubic_variance_coefficients[1], "+", cubic_variance_coefficients[2], "radii", cubic_variance_coefficients[3], "radii^2", cubic_variance_coefficients[4], "radii^3")) +print(paste(cubic_variance_model_summary$adj.r.squared * 100, "% of the variation of the variations is accounted for by the Cubic Model", sep = "")) +``` + diff --git a/content/presentations.md b/content/presentations.md new file mode 100644 index 0000000..4d61e2c --- /dev/null +++ b/content/presentations.md @@ -0,0 +1,29 @@ +--- +title: Presentations +description: This is a page of presentations I was a part of. +--- + +## Expedited Learning via Interactive Demonstrations + +On December 4, 2019, I gave a defense on my honors research in the incorporation of demonstration data throughout a reinforcement learning algorithm. I have shown that this technique expedites the learning process. + +[Slides PPTX](/files/research/ExpeditedLearningInteractiveDemo.pptx) + +## Building a Linux Cluster + +In June 2019, Stefano Coronado and I were volunteered to give a talk at the Fredericksburg Linux Users group on our experiences building a Beowulf cluster for our University. + +[Slides PDF](/files/slides/buildinglinuxcluster.pdf) + +## Embezzlement of Parking Meter Funds: A Computational Approach to Hypothesis Testing + +I was invited to give a talk to the Data Science Group at the University of Mary Washington called the Data Mavens. It was a 25 minute presentation on the bootstrap resampling technique with code on how to get started. + +[Slides PDF](/files/slides/embezzlement.pdf) + +## Similyrics: A Music Recommendation Engine Based on Lyrics +At the VCU RamHacks hackathon, Clare Arrington, Harrison Crosse, and I demoed our product Similyrics. It's a web application that takes your favorite song, grabs the lyrics, and finds a song from a database that closely matches to the song you have chosen lyric wise. + +[Slides PDF](/files/slides/similyrics.pdf) + + diff --git a/content/projects/mathio.md b/content/projects/mathio.md new file mode 100644 index 0000000..99aa6eb --- /dev/null +++ b/content/projects/mathio.md @@ -0,0 +1,22 @@ +--- +id: 1609 +title: Math I/O +date: 2016-10-23T23:33:41+00:00 +author: rozek_admin +layout: revision +guid: http://brandonrozek.com/2016/10/362-revision-v1/ +permalink: /2016/10/362-revision-v1/ +--- +Screenshot of the Math I/O Website + +### [Math I/O](http://math-io.com) {.project-title} + +Math I/O is a website I founded with [David Thames](http://davidcthames.com) and Stephen Shamaiengar. The goal of this website is to help reinforce high school level math concepts in the form of enjoyable games. Most of the games are made using HTML5 Canvas and Javascript. You can check them out [here](http://math-io.com/). + + + +I ran Math I/O for a year until I moved away from the area. During that year, I worked on the Darts game, Speed Transformations, and Theta. I then took about a year off to get adjusted to my new place when I moved. + +While I was away, Math I/O gained many new people, making it hard for them to work as one large group. David then decided to split the group up into smaller teams, inviting me to come back and lead one. I never ran a team remotely before, so I was excited to see how it would be like. + +The team I lead are mostly full of people starting out in programming. To help them out, I started giving lectures once a week to introduce concepts, and posted them here on my writings page. We would then practice these concepts while making a new game during the meetings. I couldn’t ask for a better team, their enthusiasm drives me to keep working at Math I/O. \ No newline at end of file diff --git a/content/projects/sentenceworthy.md b/content/projects/sentenceworthy.md new file mode 100644 index 0000000..8fd70a4 --- /dev/null +++ b/content/projects/sentenceworthy.md @@ -0,0 +1,20 @@ +--- +id: 1608 +title: Sentence Worthy +date: 2016-10-23T23:33:11+00:00 +author: rozek_admin +layout: revision +guid: http://brandonrozek.com/2016/10/360-revision-v1/ +permalink: /2016/10/360-revision-v1/ +--- +SentenceWorthy + +### [Sentence Worthy](http://sentenceworthy.com) {.project-title} + +Sentence Worthy is a side project created by [Tori Dayton](http://toridayton.com) and I. We combine both of our passions, writing and photography, and make something for others to enjoy. Have a look at our [creation](http://sentenceworthy.com). + + + +I am the main developer and photographer of this site. I head out every so often and take pictures of whatever interests me. Then, I email Tori my choice picks and she tells me what she wants to do with the pictures and what ideas she has for them. I then edit the picture with her ideas in mind. After we go back and forth on the picture edits, Tori sends me a one sentence story she made that goes along with the picture. The picture and story then get published together onto the website. Hence the tagline, every picture is worth a sentence. + + \ No newline at end of file diff --git a/content/projects/toridayton.md b/content/projects/toridayton.md new file mode 100644 index 0000000..eaa2d11 --- /dev/null +++ b/content/projects/toridayton.md @@ -0,0 +1,18 @@ +--- +id: 1607 +title: ToriDayton.com +date: 2016-10-23T23:32:34+00:00 +author: rozek_admin +layout: revision +guid: http://brandonrozek.com/2016/10/364-revision-v1/ +permalink: /2016/10/364-revision-v1/ +--- +Screenshot of Tori Dayton's website + +### [Tori Dayton](http://toridayton.com) {.project-title} + +Tori Dayton is a great friend and poet, this is the site I made for her to showcase her writings. It’s the first WordPress project I worked on and it set the tone for all the future ones I did. Check out her [writings!](http://toridayton.com/work) I’m a fan of her work. (Not biased at all) + + + +Fun Fact: I also worked on the [Tori Bot](http://toridayton.com/category/tori-bot/) on the site. Tori Bot takes existing poems and tries to generate a new one using the [Natural Language Toolkit](http://www.nltk.org/) library made for Python. \ No newline at end of file diff --git a/content/research.md b/content/research.md new file mode 100644 index 0000000..7d0e3f7 --- /dev/null +++ b/content/research.md @@ -0,0 +1,77 @@ +--- +Title: Research +Description: A list of my research Projects +--- + +[Quick List of Publications](publications) + +## Computer Science / Data Science Research + +### Reinforcement Learning + +**Deep Reinforcement Learning:** With Dr. Ron Zacharski I focused more on a particular instance of Reinforcement Learning where deep neural networks are used. During this time, I built out a Reinforcement Learning library written in PyTorch. This library helps me have a test bed for trying out different algorithms and attempts to create my own. + +One particular problem I'm fascinated by is how to make Reinforcement Learning algoirthms more sample efficient. This means, how can we make it so that it learns more from every observation or make it so that we can achieve our goal quicker? + +[RL Library on Github](https://github.com/brandon-rozek/rltorch) + +[Interactive Demonstrations Library](https://github.com/brandon-rozek/gyminteract) + +[Honors Thesis](/files/research/honorsthesis.pdf) + +[Honors Defense](/files/research/ExpeditedLearningInteractiveDemo.pptx) + +[QEP Algorithm Slides](/files/research/QEP.pptx) + +[More...](deepreinforcementlearning) + +**Reinforcement Learning:** Studied the fundamentals of reinforcement learning with Dr. Stephen Davies. We went over the fundamentals such as value functions, policy functions, how we can describe our environment as a markov decision processes, etc. + +[Notes and Other Goodies](reinforcementlearning) + +[Github Code](https://github.com/brandon-rozek/ReinforcementLearning) + + +### Symbolic Methods +Worked with Dr. Andrew Marshall under an ONR grant in collaboration with University at Albany, Clarkson University, and the Naval Research lab in order to automatically generated and verify cryptographic algorithms. + +During that time period I built a free algebra library, rewrite library, parts of the crypto tool, and dabbled in Unification algorithms. We're hoping to open source the code base by 2021. (Ping me if its past due) + +Currently I'm an external collaborator focused on strengthing the rewrite library. My dream is to slowly work towards building an easy to use theorem prover. + +### Programming Languages + +Studying the design of programming languages. So far I made an implementation of the SLOTH programming language, experimenting with what I want my own programming language to be syntatically and paradigm wise. + +[SLOTH Code](https://github.com/brandon-rozek/SLOTH) + +Before this study, I worked though a book called "Build your own Lisp" and my implementation of a lisp like language is below. + +[Lispy Code](https://github.com/brandon-rozek/lispy) + +### Other + +**Competitive Programming:** Studying algorithms and data structures necessary for competitive programming. Attended ACM ICPC in November 2018/2019 with a team of two other students. + +## Math/Statistics Research + +Worked on an independent study on the topic of **Cluster Analysis**. This is where you try to group similar observations without knowing what the labels are. +I studied under the guidance of Dr. Melody Denhere, the link below gives you more of a description of the project along with my course notes. + +[Cluster Analysis Spring 2018](clusteranalysis) + +## Physics Research + +For the two projects below, I worked on Quantum Research in a physics lab with a fellow student Hannah Killian and an advisor Dr. Hai Nguyen. I mostly assisted with the software support for the project and assisted in the mathematics in whatever way I can. + +[Modeling Population Dynamics of Incoherent and Coherent Excitation](/files/research/modellingpopulationdynamics.pdf) + +[Coherent Control of Atomic Population Using the Genetic Algorithm](/files/research/coherentcontrolofatomicpopulation.pdf) + + +In order to circumvent the frustrations I had with simulation code taking a while, I applied and received funding to build out a Beowulf cluster for the Physics department. Dr. Maia Magrakvilidze was the advisor for this project. + +[High Performance Cluster for Research and Education Report (nicknamed LUNA-C)](/files/research/LUNAC.pdf) + +[LUNA-C Poster](/files/research/LUNACposter.pdf) + diff --git a/content/research/_index.md b/content/research/_index.md new file mode 100644 index 0000000..e69de29 diff --git a/content/research/clusteranalysis.md b/content/research/clusteranalysis.md new file mode 100644 index 0000000..9eebd18 --- /dev/null +++ b/content/research/clusteranalysis.md @@ -0,0 +1,22 @@ +--- +Title: Cluster Analysis +Description: A study of grouping observations +--- + +# Cluster Analysis +Cluster Analysis is the art of finding inherent structures in data to form groups of similar observations. This has a myriad of applications from recommendation engines to social network analysis. + +This is an independent study, meaning that I will be studying this topic under the direction of a professor, in this case being Dr. Denhere. + +I have provided a list of topics that I wish to explore in a [syllabus](syllabus) + +Dr. Denhere likes to approach independent studies from a theoretical and applied sense. Meaning, I will learn the theory of the different algorithms, and then figure out a way to apply them onto a dataset. + +## Readings +There is no definitive textbook for this course. Instead I and Dr. Denhere search for materials that we think best demonstrates the topic at hand. + +I have created a [Reading Page](readings) to keep track of the different reading materials. + + +## Learning Notes +I like to type of the content I learn from different sources. A [notes page](notes) is created to keep track of the content discussed each meeting. diff --git a/content/research/clusteranalysis/notes.md b/content/research/clusteranalysis/notes.md new file mode 100644 index 0000000..5102309 --- /dev/null +++ b/content/research/clusteranalysis/notes.md @@ -0,0 +1,43 @@ +# Lecture Notes for Cluster Analysis + +[Lecture 1: Measures of Similarity](lec1) + +[Lecture 2.1: Distance Measures Reasoning](lec2-1) + +[Lecture 2.2: Principle Component Analysis Pt. 1](lec2-2) + +Lecture 3: Discussion of Dataset + +[Lecture 4: Principal Component Analysis Pt. 2](lec4) + +[Lecture 4.2: Revisiting Measures](lec4-2) + +[Lecture 4.3: Cluster Tendency](lec4-3) + +[Lecture 5: Introduction to Connectivity Based Models](lec5) + +[Lecture 6: Agglomerative Methods](lec6) + +[Lecture 7: Divisive Methods Part 1: Monothetic](lec7) + +[Lecture 8: Divisive Methods Part 2: Polythetic](lec8) + +[Lecture 9.1: CURE and TSNE](lec9-1) + +[Lecture 9.2: Cluster Validation Part I](lec9-2) + +[Lecture 10.1: Silhouette Coefficient](lec10-1) + +[Lecture 10.2: Centroid-Based Clustering](lec10-2) + +[Lecture 10.3: Voronoi Diagrams](lec10-3) + +[Lecture 11.1: K-means++](lec11-1) + +[Lecture 11.2: K-medoids](lec11-2) + +[Lecture 11.3: K-medians](lec11-3) + +[Lecture 12: Introduction to Density Based Clustering](lec12) + + diff --git a/content/research/clusteranalysis/notes/lec1.md b/content/research/clusteranalysis/notes/lec1.md new file mode 100644 index 0000000..5b61503 --- /dev/null +++ b/content/research/clusteranalysis/notes/lec1.md @@ -0,0 +1,331 @@ +# Measures of similarity + +To identify clusters of observations we need to know how **close individuals are to each other** or **how far apart they are**. + +Two individuals are 'close' when their dissimilarity of distance is small and their similarity large. + +Special attention will be paid to proximity measures suitable for data consisting of repeated measures of the same variable, for example taken at different time points. + +## Similarity Measures for Categorical Data + +Measures are generally scaled to be in the interval $[0, 1]$, although occasionally they are expressed as percentages in the range $0-100\%$ + +Similarity value of unity indicates that both observations have identical values for all variables + +Similarity value of zero indicates that the two individuals differ maximally for all variables. + +### Similarity Measures for Binary Data + +An extensive list of similarity measures for binary data exist, the reason for such is that a large number of possible measures has to do with the apparent uncertainty as to how to **deal with the count of zero-zero matches** + +In some cases, zero-zero matches are equivalent to one-one matches and therefore should be included in the calculated similarity measure + +Example: Gender, where there is no preference as to which of the two categories should be coded as zero or one + +In other cases the inclusion or otherwise of the matches is more problematic + +Example: When the zero category corresponds to the genuine absence of some property, such as wings in a study of insects + +The question that then needs to be asked is do the co-absences contain useful information about the similarity of the two objects? + +Attributing a high degree of similarity to a pair of individuals simply because they both lack a large number of attributes may not be sensible in many situations + +The following table below will help when it comes to interpreting the measures + +![img](file:///home/rozek/Documents/Spring2018/Cluster%20Analysis/BinaryOutcomeTable.png?lastModify=1516246712) + +Measure that ignore the co-absence (lack of both objects having a zero) are Jaccard's Coefficient (S2), Sneath and Sokal (S4) + +When co-absences are considered informative, the simple matching coefficient (S1) is usually employed. + +Measures S3 and S5 are further examples of symmetric coefficients that treat positive matches (a) and negative matches (d) in the same way. + +![BinarySimilarityMeasures](/home/rozek/Documents/Spring2018/Cluster Analysis/BinarySimilarityMeasures.png) + +### Similarity Measures for Categorical Data with More Than Two Levels + +Categorical data where the variables have more than two levels (for example, eye color) could be dealt with in a similar way to binary data, with each level of a variable being regarded as a single binary variable. + +This is not an attractive approach, however, simply because of the large number of ‘negative’ matches which will inevitably be involved. + +A superior method is to allocate a score of zero or one to each variable depending on whether the two observations are the same on that variable. These scores are then averaged over all p variables to give the required similarity coefficient as +$$ +s_{ij} = \frac{1}{p}\sum_{k = 1}^p{s_{ik}} +$$ + +### Dissimilarity and Distance Measures for Continuous Data + +A **metric** on a set $X$ is a distance function +$$ +d : X \times X \to [0, \infty) +$$ +where $[0, \infty)$ is the set of non-negative real numbers and for all $x, y, z \in X$, the following conditions are satisfied + +1. $d(x, y) \ge 0$ non-negativity or separation axiom + 1. $d(x, y) = 0 \iff x = y$ identity of indiscernibles +2. $d(x, y) = d(y, x)$ symmetry +3. $d(x, z) \le d(x, y) + d(y, z)$ subadditivity or triangle inequality + +Conditions 1 and 2 define a positive-definite function + +All distance measures are formulated so as to allow for differential weighting of the quantitative variables $w_k$ denotes the nonnegative weights of $p$ variables + +![continuousdissimilaritymeasures](/home/rozek/Documents/Spring2018/Cluster Analysis/continuousdissimilaritymeasures.png) + +Proposed dissimilarity measures can be broadly divided into distance measures and correlation-type measures. + +#### Distance Measures + +#####$L^p$ Space + +The Minkowski distance is a metric in normed vector space which can be considered as a generalization of both the Euclidean distance and the Manhattan distance +$$ +D(X, Y) = (\sum_{i = 1}^n{w_i^p|x_i - y_i|^p})^{\frac{1}{p}} +$$ +This is a metric for $p > 1$ + +######Manhattan Distance + +This is the case in the Minkowski distance when $p = 1$ +$$ +d(X, Y) = \sum_{i = 1}^n{w_i|x_i - y_i|} +$$ +Manhattan distance depends on the rotation of the coordinate system, but does not depend on its reflection about a coordinate axis or its translation +$$ +d(x, y) = d(-x, -y) +$$ + +$$ +d(x, y) = d(x + a, y + a) +$$ + +Shortest paths are not unique in this metric + +######Euclidean Distance + +This is the case in the Minkowski distance when $p = 2$. The Euclidean distance between points X and Y is the length of the line segment connection them. +$$ +d(X, Y) = \sqrt{\sum_{i = 1}^n{w_i^2(x_i - y_i)^2}} +$$ +There is a unique path in which it has the shortest distance. This distance metric is also translation and rotation invariant + +######Squared Euclidean Distance + +The standard Euclidean distance can be squared in order to place progressively greater weight on objects that are farther apart. In this case, the equation becomes +$$ +d(X, Y) = \sum_{i = 1}^n{w_i^2(x_i - y_i)^2} +$$ +Squared Euclidean Distance is not a metric as it does not satisfy the [triangle inequality](https://en.wikipedia.org/wiki/Triangle_inequality), however, it is frequently used in optimization problems in which distances only have to be compared. + +######Chebyshev Distance + +The Chebyshev distance is where the distance between two vectors is the greatest of their differences along any coordinate dimension. + +It is also known as **chessboard distance**, since in the game of [chess](https://en.wikipedia.org/wiki/Chess) the minimum number of moves needed by a [king](https://en.wikipedia.org/wiki/King_(chess)) to go from one square on a [chessboard](https://en.wikipedia.org/wiki/Chessboard) to another equals the Chebyshev distance +$$ +d(X, Y) = \lim_{p \to \infty}{(\sum_{i = 1}^n{|x_i - y_i|^p})}^\frac{1}{p} +$$ + +$$ += max_i(|x_i - y_i|) +$$ + +Chebyshev distance is translation invariant + +##### Canberra Distance Measure + +The Canberra distance (D4) is a weighted version of the $L_1$ Manhattan distance. This measure is very sensitive to small changes close to $x_{ik} = x_{jk} = 0$. + +It is often regarded as a generalization of the dissimilarity measure for binary data. In this context the measure can be divided by the number of variables, $p$, to ensure a dissimilarity coefficient in the interval $[0, 1]$ + +It can then be shown that this measure for binary variables is just one minus the matching coefficient. + +### Correlation Measures + +It has often been suggested that the correlation between two observations can be used to quantify the similarity between them. + +Since for correlation coefficients we have that $-1 \le \phi_{ij} \le 1$ with the value ‘1’ reflecting the strongest possible positive relationship and the value ‘-1’ the strongest possible negative relationship, these coefficients can be transformed into dissimilarities, $d_{ij}$, within the interval $[0, 1]$ + +The use of correlation coefficients in this context is far more contentious than its noncontroversial role in assessing the linear relationship between two variables based on $n$ observations. + +When correlations between two individuals are used to quantify their similarity the rows of the data matrix are standardized, not its columns. + +**Disadvantages** + +When variables are measured on different scales the notion of a difference between variable values and consequently that of a mean variable value or a variance is meaningless. + +In addition, the correlation coefficient is unable to measure the difference in size between two observations. + +**Advantages** + +However, the use of a correlation coefficient can be justified for situations where all of the variables have been measured on the same scale and precise values taken are important only to the extent that they provide information about the subject's relative profile + +Example: In classifying animals or plants, the absolute size of the organisms or their parts are often less important than their shapes. In such studies the investigator requires a dissimilarity coefficient that takes the value zero if and only if two individuals' profiles are multiples of each other. The angular separation dissimilarity measure has this property. + +**Further considerations** + +The Pearson correlation is sensitive to outliers. This has prompted a number of suggestions for modifying correlation coefficients when used as similarity measures; for example, robust versions of correlation coefficients such as *jackknife correlation* or altogether more general association coefficients such as *mutual information distance measure* + +####Mahalanobis (Maximum) Distance [Not between 2 observations] + +Mahalanobis distance is a measure of distance between a point P and a distribution D. It is a multi-dimensional generalization of the idea of measuring how many standard deviations away P is from the mean of D + +Mahalanobis distance is unitless and scale-invariant and takes into account the correlations of the data set +$$ +D(\vec{x}) = \sqrt{(\vec{x} - \vec{\mu})^T S^{-1}(\vec{x}-\vec{\mu})} +$$ +Where $\mu$ is a set of mean observations and $S$ is the covariance matrix + +If the covariance matrix is diagonal then the resulting distance measure is called a normalized Euclidean distance. +$$ +d(\vec{x}, \vec{y}) = \sqrt{\sum_{i = 1}^N{\frac{(x_i - y_i)^2}{s^2_i}}} +$$ +Where $s_i$ is the standard deviation of the $x_i$ and $y_i$ over the sample set + +####Discrete Metric + +This metric describes whether or not two observations are equivalent +$$ +\rho(x, y) = \begin{cases} + 1 & x \not= y \\ + 0 & x = y + \end{cases} +$$ + +## Similarity Measures for Data Containing both Continuous and Categorical Variables + +There are a number of approaches to constructing proximities for mixed-mode data, that is, data in which some variables are continuous and some categorical. + +1. Dichotomize all variables and use a similarity measure for binary data +2. Rescale all the variables so that they are on the same scale by replacing variable values by their ranks among the objects and then using a measure for continuous data +3. Construct a dissimilarity measure for each type of variable and combine these, either with or without differential weighting into a single coefficient. + +Most general-purpose statistical software implement a number of measurs for converting two-mode data matrix into a one-mode dissimilarity matrix. + +R has `cluster`, `clusterSim`, or `proxy` + +### Proximity Measures for Structured Data + +We'll be looking at data that consists of repeated measures of the same outcome variable but under different conditions. + +The simplest and perhaps most commonly used approach to exploiting the reference variable is in the construction of a reduced set of relevant summaries per object which are then used as the basis for defining object similarity. + +Here we will look at some approaches for choosing summary measures and resulting proximity measures for the most frequently encountered reference vectors (e.g. time, experimental condition, and underlying factor) + +Structured data arise when the variables can be assumed to follow a known *factor model*. Under *confirmatory factor analysis model* each variable or item can be allocated to one of a set of underlying factors or concepts. The factors cannot be observed directly but are 'indicated' by a number of items that are all measured on the same scale. + +Note that the summary approach, while typically used with continuous variables, is not limited to variables on an interval scale. The same principles can be applied to dealing with categorical data. The difference is that summary measures now need to capture relevant aspects of the distribution of categorical variables over repeated measures. + +Rows of **$X$** which represent ordered lists of elements, that is all the variables provide a categorical outcome and these variables can be aligned in one dimension, are more generally referred to as *sequences*. *Sequence analysis* is an area of research that centers on problems of events and actions in their temporal context and includes the measurements of similarities between sequences. + +The most popular measure of dissimilarity between two sequences is the Levenhstein distance and counts the minimum number of operations needed to transform one sequence of categories into another, where an operation is an insertion, a deletion, or a substitution of a single category. Each operation may be assigned a penalty weight (a typical choice would be to give double the penalty to a substitution as opposed to an insertion or deletion. The measure is sometimes called the 'edit distance' due to its application in spell checkers. + +Optimal matching algorithms (OMAs) need to be employed to find the minimum number of operations required to match one sequence to another. One such algorithm for aligning sequences is the Needleman-Wunsch algorithm, which is commonly used in bioinformatics to align proteins. + +The *Jary similarity measure* is a related measure of similarity between sequences of categories often used to delete duplicates in the area of record linkage. + +## Inter-group Proximity Measures + +In clustering applications, it becomes necessary to consider how to measure the proximity between groups of individuals. + +1. The proximity between two groups might be defined by a suitable summary of the proximities between individuals from either group +2. Each group might be described by a representative observation by choosing a suitable summary statistic for each variable, and the inter group proximity defined as the proximity between the representative observations. + +### Inter-group Proximity Derived from the Proximity Matrix + +For deriving inter-group proximities from a matrix of inter-individual proximities, there are a variety of possibilities + +- Take the smallest dissimilarity between any two individuals, one from each group. This is referred to as *nearest-neighbor distance* and is the basis of the clustering technique known as *single linkage* +- Define hte intergroup distance as the largest distance between any two individuals, one from each group. This is known as the *furthest-neighbour distance* and constitute the basis of *complete linkage* cluster method. +- Define as the average dissimiliarity between individuals from both groups. Such a measure is used in *group average clustering* + +### Inter-group Proximity Based on Group Summaries for Continuous Data + +One method for constructing inter-group dissimilarity measures for continuous data is to simply substitute group means (also known as the centroid) for the variable values in the formulae for inter-individual measures + +More appropriate, however, might be measures which incorporate in one way or another, knowledge of within-group variation. One possibility is to use Mahallanobis's generalized distance. + +####Mahalanobis (Maximum) Distance + +Mahalanobis distance is a measure of distance between a point P and a distribution D. It is a multi-dimensional generalization of the idea of measuring how many standard deviations away P is from the mean of D + +Mahalanobis distance is unitless and scale-invariant and takes into account the correlations of the data set +$$ +D(\vec{x}) = \sqrt{(\vec{x} - \vec{\mu})^T S^{-1}(\vec{x}-\vec{\mu})} +$$ +Where $\mu$ is a set of mean observations and $S$ is the covariance matrix + +If the covariance matrix is diagonal then the resulting distance measure is called a normalized Euclidean distance. +$$ +d(\vec{x}, \vec{y}) = \sqrt{\sum_{i = 1}^N{\frac{(x_i - y_i)^2}{s^2_i}}} +$$ +Where $s_i$ is the standard deviation of the $x_i$ and $y_i$ over the sample set + +Thus, the Mahalanobis distance incraeses with increasing distances between the two group centers and with decreasing within-group variation. + +By also employing within-group correlations, the Mahalanobis distance takes account the possibly non-spherical shapes of the groups. + +The use of Mahalanobis implies that the investigator is willing to **assume** that the covariance matrices are at least approximately the same in the two groups. When this is not so, this measure is an inappropriate inter-group measure. Other alternatives exist such as the one proposed by Anderson and Bahadur + +equation + +Another alternative is the *normal information radius* suggested by Jardine and Sibson + +equation + +### Inter-group Proximity Based on Group Summaries for Categorical Data + +Approaches for measuring inter-group dissimilarities between groups of individuals for which categorical variables have been observed have been considered by a number of authors. Balakrishnan and Sanghvi (1968), for example, proposed a dissimilarity index of the form + +![equation](http://proquest.safaribooksonline.com.ezproxy.umw.edu/getfile?item=cjlhZWEzNDg0N2R0cGMvaS9zMG1nODk0czcvN3MwczMwL2UwLXMzL2VpL3RtYTBjMGdzY2QwLmkyLWdtaWY-) + +where $p_{Akl}$ and $p_{Bkl}$ are the proportions of the lth category of the kth variable in group A and B respectively, ![img](http://proquest.safaribooksonline.com.ezproxy.umw.edu/getfile?item=cjlhZWEzNDg0N2R0cGMvaS9zMG1nODk0czcvN3MwczNmL2VnMi8zbGVpL3RtYTBjbmdzaWUuMGlpbg--), ck + 1 is the number of categories for the kth variable and p is the number of variables. + +Kurczynski (1969) suggested adapting the generalized Mahalanobis distance, with categorical variables replacing quantitative variables. In its most general form, this measure for inter-group distance is given by + +![equation](http://proquest.safaribooksonline.com.ezproxy.umw.edu/getfile?item=cjlhZWEzNDg0N2R0cGMvaS9zMG1nODk0czcvN3MwczMxL2UwLXMzL2VpL3RtYTBjMGdzY2QwLmkyLWdtaWY-) + +where ![img](http://proquest.safaribooksonline.com.ezproxy.umw.edu/getfile?item=cjlhZWEzNDg0N2R0cGMvaS9zMG1nODk0czcvN3MwczNmL2VnMy8zbGVpL3RtYTBjbmdzaWUuMGlpbg--) contains sample proportions in group A and ![img](http://proquest.safaribooksonline.com.ezproxy.umw.edu/getfile?item=cjlhZWEzNDg0N2R0cGMvaS9zMG1nODk0czcvN3MwczNmL2VnNC8zbGVpL3RtYTBjbmdzaWUuMGlpbg--) is defined in a similar manner, and ![img](http://proquest.safaribooksonline.com.ezproxy.umw.edu/getfile?item=cjlhZWEzNDg0N2R0cGMvaS9zMG1nODk0czcvN3MwczNmL2VnNS8zbGVpL3RtYTBjbmdzaWUuMGlpbg--) is the m × m common sample covariance matrix, where ![img](http://proquest.safaribooksonline.com.ezproxy.umw.edu/getfile?item=cjlhZWEzNDg0N2R0cGMvaS9zMG1nODk0czcvN3MwczNmL2VnNi8zbGVpL3RtYTBjbmdzaWUuMGlpbg--). + +## Weighting Variables + +To weight a variable means to give it greater or lesser importance than other variables in determining the proximity between two objects. + +The question is 'How should the weights be chosen?' Before we discuss this question, it is important to realize that the selection of variables for inclusion into the study already presents a form of weighting, since the variables not included are effectively being given the weight $0$. + +The weights chosen for the variables reflect the importance that the investigator assigns the variables for the classification task. + +There are several approaches to this + +- Authors obtain perceived dissimilarities between selected objects, they then model the dissimilarities using the underlying variables and weights that indicate their relative importance. The weights that best fit the perceived dissimilarities are then chosen. +- Define the weights to be inversely proportion to some measure of variability in this variable. This choice of weights implies that the importance of a variable decreases when its variability increases. + - For a continous variable, the most commonly emplyed weight is either the reciprocal of its standard deviation or the reciprocal of its range + - Employing variability weights is equivalent to what is commonly referred to as *standardizing* the variables. +- Construct weights from the data matrix using *variable section*. In essence, such procedures proceed in an iterative fashion to identify variables which, when contributing to a cluster algorithm, lead to internally cohesive and externally isolated clusters and, when clustered singly, produce reasonable agreement. + +The second approach assumed the importance of a variable to be inversely proportional to the total variability of that variable. The total variability of a variable comprises variation both within and between groups which may exist within the set of individuals. The aim of cluster analysis is typically to identify such groups. Hence it can be argued that the importance of a variable should not be reduced because of between-group variation (on the contrary, one might wish to assign more importance to a variable that shows larger between-group variation.) + +Gnanadesikan et al. (1995) assessed the ability of squared distance functions based on data-determined weights, both those described above and others, to recover groups in eight simulated and real continuous data sets in a subsequent cluster analysis. Their main findings were: + +1. Equal weights, (total) standard deviation weights, and range weights were generally ineffective, but range weights were preferable to standard deviation weights. +2. Weighting based on estimates of within-cluster variability worked well overall. +3. Weighting aimed at emphasizing variables with the most potential for identifying clusters did enhance clustering when some variables had a strong cluster structure. +4. Weighting to optimize the fitting of a hierarchical tree was often even less effective than equal weighting or weighting based on (total) standard deviations. +5. Forward variable selection was often among the better performers. (Note that all-subsets variable selection was not assessed at the time.) + +## Standardization + +In many clustering applications, the variables describing the objects to be clustered will not be measured in the same units. A number of variability measures have been used for this purpose + +- When standard deviations calculated from the complete set of objects to be clustered are used, the technique is often referred to as *auto-scaling, standard scoring, or z-scoring*. +- Division by the median absolute deviations or by the ranges. + +The second is shown to outperform auto-scaling in many clustering applications. As pointed out in the previous section, standardization of variables to unit variance can be viewed as a special case of weighting. + +## Choice of Proximity Measure + +Firstly, the nature of the data should strongly influence the choice of the proximity measure. + +Next, the choice of measure should depend on the scale of the data. Similarity coefficients should be used when the data is binary. For continuous data, distance of correlation-type dissimilarity measure should be used according to whether 'size' or 'shape' of the objects is of interest. + +Finally, the clustering method to be used might have some implications for the choice of the coefficient. For example, making a choice between several proximity coefficients with similar properties which are also known to be monotonically related can be avoided by employing a cluster method that depends only on the ranking of the proximities, not their absolute values. \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec10-1.md b/content/research/clusteranalysis/notes/lec10-1.md new file mode 100644 index 0000000..a984b48 --- /dev/null +++ b/content/research/clusteranalysis/notes/lec10-1.md @@ -0,0 +1,46 @@ +# Silhouette + +This technique validates the consistency within clusters of data. It provides a succinct graphical representation of how well each object lies in its cluster. + +The silhouette ranges from -1 to 1 where a high value indicates that the object is consistent within its own cluster and poorly matched to neighboring clustesr. + +A low or negative silhouette value can mean that the current clustering configuration has too many or too few clusters. + +## Definition + +For each datum $i$, let $a(i)$ be the average distance of $i$ with all other data within the same cluster. + +$a(i)$ can be interpreted as how well $i$ is assigned to its cluster. (lower values mean better agreement) + +We can then define the average dissimilarity of point $i$ to a cluster $c$ as the average distance from $i$ to all points in $c$. + +Let $b(i)$ be the lowest average distance of $i$ to all other points in any other cluster in which i is not already a member. + +The cluster with this lowest average dissimilarity is said to be the neighboring cluster of $i$. From here we can define a silhouette: +$$ +s(i) = \frac{b(i) - a(i)}{max\{a(i), b(i)\}} +$$ +The average $s(i)$ over all data of a cluster is a measure of how tightly grouped all the data in the cluster are. A silhouette plot may be used to visualize the agreement between each of the data and its cluster. + +![img](https://upload.wikimedia.org/wikipedia/commons/thumb/f/fd/Silhouette-plot-orange.png/800px-Silhouette-plot-orange.png) + +### Properties + +Recall that $a(i)$ is a measure of how dissimilar $i$ is to its own cluster, a smaller value means that it's in agreement to its cluster. For $s(i)$ to be close to 1, we require $a(i) << b(i)$ . + +If $s(i)$ is close to negative one, then by the same logic we can see that $i$ would be more appropriate if it was clustered in its neighboring cluster. + +$s(i)$ near zero means that the datum is on the border of two natural clusters. + +## Determining the number of Clusters + +This can also be used in helping to determine the number of clusters in a dataset. The ideal number of cluster is one that produces the highest silhouette value. + +Also a good indication that one has too many clusters is if there are clusters with the majority of observations being under the mean silhouette value. + +https://kapilddatascience.wordpress.com/2015/11/10/using-silhouette-analysis-for-selecting-the-number-of-cluster-for-k-means-clustering/ + +![plot_kmeans_silhouette_analysis_004](https://kapilddatascience.files.wordpress.com/2015/11/plot_kmeans_silhouette_analysis_004.png?w=660&h=257) + + + diff --git a/content/research/clusteranalysis/notes/lec10-2.md b/content/research/clusteranalysis/notes/lec10-2.md new file mode 100644 index 0000000..ec85b61 --- /dev/null +++ b/content/research/clusteranalysis/notes/lec10-2.md @@ -0,0 +1,54 @@ + # Centroid-based Clustering + +In centroid-based clustering, clusters are represented by some central vector which may or may not be a member of the dataset. In practice, the number of clusters is fixed to $k$ and the goal is to solve some sort of optimization problem. + +The similarity of two clusters is defined as the similarity of their centroids. + +This problem is computationally difficult so there are efficient heuristic algorithms that are commonly employed. These usually converge quickly to a local optimum. + +## K-means clustering + +This aims to partition $n$ observations into $k$ clusters in which each observation belongs to the cluster with the nearest mean which serves as the centroid of the cluster. + +This technique results in partitioning the data space into Voronoi cells. + +### Description + +Given a set of observations $x$, k-means clustering aims to partition the $n$ observations into $k$ sets $S$ so as to minimize the within-cluster sum of squares (i.e. variance). More formally, the objective is to find +$$ +argmin_s{\sum_{i = 1}^k{\sum_{x \in S_i}{||x-\mu_i||^2}}}= argmin_{s}{\sum_{i = 1}^k{|S_i|Var(S_i)}} +$$ +where $\mu_i$ is the mean of points in $S_i$. This is equivalent to minimizing the pairwise squared deviations of points in the same cluster +$$ +argmin_s{\sum_{i = 1}^k{\frac{1}{2|S_i|}\sum_{x, y \in S_i}{||x-y||^2}}} +$$ + +### Algorithm + +Given an initial set of $k$ means, the algorithm proceeds by alternating between two steps. + +**Assignment step**: Assign each observation to the cluster whose mean has the least squared euclidean distance. + +- Intuitively this is finding the nearest mean +- Mathematically this means partitioning the observations according to the Voronoi diagram generated by the means + +**Update Step**: Calculate the new means to be the centroids of the observations in the new clusters + +The algorithm is known to have converged when assignments no longer change. There is no guarantee that the optimum is found using this algorithm. + +The result depends on the initial clusters. It is common to run this multiple times with different starting conditions. + +Using a different distance function other than the squared Euclidean distance may stop the algorithm from converging. + +### Initialization methods + +Commonly used initialization methods are Forgy and Random Partition. + +**Forgy Method**: This method randomly chooses $k$ observations from the data set and uses these are the initial means + +This method is known to spread the initial means out + +**Random Partition Method**: This method first randomly assigns a cluster to each observation and then proceeds to the update step. + +This method is known to place most of the means close to the center of the dataset. + diff --git a/content/research/clusteranalysis/notes/lec10-3.md b/content/research/clusteranalysis/notes/lec10-3.md new file mode 100644 index 0000000..c68221f --- /dev/null +++ b/content/research/clusteranalysis/notes/lec10-3.md @@ -0,0 +1,18 @@ +# Voronoi Diagram + +A Voronoi diagram is a partitioning of a plan into regions based on distance to points in a specific subset of the plane. + +The set of points (often called seeds, sites, or generators) is specified beforehand, and for each seed there is a corresponding region consisting of all points closer to that seed than any other. + +Different metrics may be used and often result in different Voronoi diagrams + +**Euclidean** + +![](https://upload.wikimedia.org/wikipedia/commons/thumb/5/54/Euclidean_Voronoi_diagram.svg/382px-Euclidean_Voronoi_diagram.svg.png) + +**Manhattan** + +![](https://upload.wikimedia.org/wikipedia/commons/thumb/6/6d/Manhattan_Voronoi_Diagram.svg/382px-Manhattan_Voronoi_Diagram.svg.png) + + + diff --git a/content/research/clusteranalysis/notes/lec11-1.md b/content/research/clusteranalysis/notes/lec11-1.md new file mode 100644 index 0000000..99473f2 --- /dev/null +++ b/content/research/clusteranalysis/notes/lec11-1.md @@ -0,0 +1,18 @@ +# K-means++ + +K-means++ is an algorithm for choosing the initial values or seeds for the k-means clustering algorithm. This was proposed as a way of avoiding the sometimes poor clustering found by a standard k-means algorithm. + +## Intuition + +The intuition behind this approach involves spreading out the $k$ initial cluster centers. The first cluster center is chosen uniformly at random from the data points that are being clustered, after which each subsequent cluster center is chosen from the remaining data points with probability proportional to its squared distance from the point's closest existing cluster center. + +## Algorithm + +The exact algorithm is as follows + +1. Choose one center uniformly at random from among data points +2. For each data point $x$, compute $D(x)$, the distance between $x$ and the nearest center that has already been chosen. +3. Choose one new data point at random as a new center, using a weighted probability distribution where a point $x$ is chosen with probability proporitonal to $D(x)^2$ +4. Repeat steps 2 and 3 until $k$ centers have been chosen +5. Now that the initial centers have been chosen, proceed using standard k-means clustering + diff --git a/content/research/clusteranalysis/notes/lec11-2.md b/content/research/clusteranalysis/notes/lec11-2.md new file mode 100644 index 0000000..e93639b --- /dev/null +++ b/content/research/clusteranalysis/notes/lec11-2.md @@ -0,0 +1,52 @@ +# K-Medoids + +A medoid can be defined as the object of a cluster whose average dissimilarity to all the objects in the cluster is minimal. + +The K-medoids algorithm is related to k-means and the medoidshift algorithm. Both the k-means and k-medoids algorithms are partition and both attempt to minimize the distance between points in the cluster to it's center. In contrast to k-means, it chooses data points as centers and uses the Manhattan Norm to define the distance between data points instead of the Euclidean. + +This method is known to be more robust to noise and outliers compared to k-means since it minimizes the sum of pairwise dissimilarities instead of the sum of squared Euclidean distances. + +## Algorithms + +There are several algorithms that have been created as an optimization to an exhaustive search. In this section, we'll discuss PAM and Voronoi iteration method. + +### Partitioning Around Medoids (PAM) + +1. Select $k$ of the $n$ data points as medoids +2. Associate each data point to the closes medoid +3. While the cost of the configuration decreases: + 1. For each medoid $m$, for each non-medoid data point $o$: + 1. Swap $m$ and $o$, recompute the cost (sum of distances of points to their medoid) + 2. If the total cost of the configuration increased in the previous step, undo the swap + + + +### Voronoi Iteration Method + +1. Select $k$ of the $n$ data points as medoids +2. While the cost of the configuration decreases + 1. In each cluster, make the point that minimizes the sum of distances within the cluster the medoid + 2. Reassign each point to the cluster defined by the closest medoid determined in the previous step. + + + +### Clustering Large Applications (CLARA + +This is a variant of the PAM algorithm that relies on the sampling approach to handle large datasets. The cost of a particular cluster configuration is the mean cost of all the dissimilarities. + + + +## R Implementations + +Both PAM and CLARA are defined in the `cluster` package in R. + +```R +clara(x, k, metric = "euclidean", stand = FALSE, samples = 5, + sampsize = min(n, 40 + 2 * k), trace = 0, medoids.x = TRUE, + keep.data = medoids.x, rngR = FALSE) +``` + +```R +pam(x, k, metric = "euclidean", stand = FALSE) +``` + diff --git a/content/research/clusteranalysis/notes/lec11-3.md b/content/research/clusteranalysis/notes/lec11-3.md new file mode 100644 index 0000000..20bbebb --- /dev/null +++ b/content/research/clusteranalysis/notes/lec11-3.md @@ -0,0 +1,19 @@ +# K-Medians + +This is a variation of k-means clustering where instead of calculating the mean for each cluster to determine its centroid we are going to calculate the median instead. + +This has the effect of minimizing error over all the clusters with respect to the Manhattan norm as opposed to the Euclidean squared norm which is minimized in K-means + +### Algorithm + +Given an initial set of $k$ medians, the algorithm proceeds by alternating between two steps. + +**Assignment step**: Assign each observation to the cluster whose median has the leas Manhattan distance. + +- Intuitively this is finding the nearest median + +**Update Step**: Calculate the new medians to be the centroids of the observations in the new clusters + +The algorithm is known to have converged when assignments no longer change. There is no guarantee that the optimum is found using this algorithm. + +The result depends on the initial clusters. It is common to run this multiple times with different starting conditions. \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec12.md b/content/research/clusteranalysis/notes/lec12.md new file mode 100644 index 0000000..83dcee3 --- /dev/null +++ b/content/research/clusteranalysis/notes/lec12.md @@ -0,0 +1,56 @@ +# Introduction to Density Based Clustering + +In density-based clustering, clusters are defined as areas of higher density than the remainder of the data sets. Objects in more sparse areas are considered to be outliers or border points. This helps discover clusters of arbitrary shape. + +## DBSCAN + +Given a set of points in space, it groups together points that are closely packed together while marking points that lie alone in low-density regions as outliers. + +### Preliminary Information + +- A point $p$ is a core point if at least k (often referred to as minPts) are within $\epsilon$ of it. Those points are said to be *directly reachable* from $p$. +- A point $q$ is directly reachable from $p$ if point $q$ is within distance $\epsilon$ from point $p$ and $p$ must be a core point +- A point $q$ is reachable from $p$ if there is a path $p_1, \dots, p_n$ with $p_1 = p$ and $p_n = q$ where each $p_{i + 1}$ is directly reachable from $p_i$. (All points on the path must be core points, with the possible exception of $q$) +- All points not reachable from any other points are outliers + +Non core points can be part of a cluster, but they form its "edge", since they cannot be used to reach more points. + +Reachability is not a symmetric relation since, by definition, no point may be reachable from a non-core point, regardless of distance. + +Two points $p$ and $q$ are density-connected if there is a point $o$ such that both $p$ and $q$ are reachable from $o$. Density-connectedness is symmetric. + +A cluster then satisfies two properties: + +1. All points within the cluster are mutually density-connected +2. If a point is density-reachable from any point of the cluster, it is part of the cluster as well. + + +### Algorithm + +1. Find the $\epsilon$ neighbors of every point, and identify the core points with more than $k$ neighbors. +2. Find the connected components of *core* points on the neighborhood graph, ignoring all non-core points. +3. Assign each non-core point to a nearby cluster if the cluster is an $\epsilon$ (eps) neighbor, otherwise assign it to noise. + +###Advantages + +- Does not require one to specify the number of clusters in the data +- Can find arbitrarily shaped clusters +- Has a notion of noise and is robust to outliers + +### Disadvantages + +- Not entirely deterministic: border points that are reachable from more than one cluster can be part of either cluster. +- The quality to DBSCAN depends on the distance measure used. +- Cannot cluster data sets well with large differences in densities. + +### Rule of Thumbs for parameters + +$k$: $k$ must be larger than $(D + 1)$ where $D$ is the number of dimensions in the dataset. Normally $k$ is chosen to be twice the number of dimensions. + +$\epsilon$: Ideally the $k^{th}$ nearest neighbors are at roughly the same distance. Plot the sorted distance of every point to it's $k^{th}$ nearest neighbor + + + +Example of Run Through + +https://www.cse.buffalo.edu/~jing/cse601/fa12/materials/clustering_density.pdf \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec2-1.md b/content/research/clusteranalysis/notes/lec2-1.md new file mode 100644 index 0000000..c7f420f --- /dev/null +++ b/content/research/clusteranalysis/notes/lec2-1.md @@ -0,0 +1,34 @@ +# Why use different distance measures? + +I made an attempt to find out in what situations people use different distance measures. Looking around in the Internet usually produces the results "It depends on the problem" or "I typically just always use Euclidean" + +Which as you might imagine, isn't a terribly useful answer. Since it doesn't give me any examples of which types of problems different distances solve. + +Therefore, let's think about it in a different way. What properties do different distance measures have that make them desirable? + +## Manhattan Advantages + +- The gradient of this function has a constant magnitude. There's no power in the formula +- Unusual values affect distances on Euclidean more since the difference is squared + +https://datascience.stackexchange.com/questions/20075/when-would-one-use-manhattan-distance-as-opposite-to-euclidean-distance + + + +## Mahalanobis Advantages + +Variables can be on different scales. The Mahalanobis formula has a built in variance-covariance matrix which allows you to rescale your variables to make distances of different variables more comparable. + +https://stats.stackexchange.com/questions/50949/why-use-the-mahalanobis-distance#50956 + + + +## Euclidean Disadvantages + +In higher dimensions, the points essentially become uniformly distant from one another. This is a problem observed in most distance metrics but it's more obvious with the Euclidean one. + +https://stats.stackexchange.com/questions/99171/why-is-euclidean-distance-not-a-good-metric-in-high-dimensions/ + + + +Hopefully in this course, we'll discover more properties as to why it makes sense to use different distance measures since it can have a impact on how our clusters are formed. \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec2-2.md b/content/research/clusteranalysis/notes/lec2-2.md new file mode 100644 index 0000000..cb89f91 --- /dev/null +++ b/content/research/clusteranalysis/notes/lec2-2.md @@ -0,0 +1,53 @@ +# Principal Component Analysis Pt. 1 + +## What is PCA? + +Principal component analysis is a statistical procedure that performs an orthogonal transformation to convert a set of variables into a set of linearly uncorrelated variables called principle components. + +Number of distinct principle components equals $min(\# Variables, \# Observations - 1)$ + +The transformation is defined in such a way that the first principle component has the largest possible variance explained in the data. + +Each succeeding component has the highest possible variance under the constraint of having to be orthogonal to the preceding components. + +PCA is sensitive to the relative scaling of the original variables. + +### Results of a PCA + +Results are discussed in terms of *component scores* which is the transformed variables and *loadings* which is the weight by which each original variable should be multiplied to get the component score. + +## Assumptions of PCA + +1. Linearity +2. Large variances are important and small variances denote noise +3. Principal components are orthogonal + +## Why perform PCA? + +- Distance measures perform poorly in high-dimensional space (https://stats.stackexchange.com/questions/256172/why-always-doing-dimensionality-reduction-before-clustering) +- Helps eliminates noise from the dataset (https://www.quora.com/Does-it-make-sense-to-perform-principal-components-analysis-before-clustering-if-the-original-data-has-too-many-dimensions-Is-it-theoretically-unsound-to-try-to-cluster-data-with-no-correlation) +- One initial cost to help reduce further computations + +## Computing PCA + +1. Subtract off the mean of each measurement type +2. Compute the covariance matrix +3. Take the eigenvalues/vectors of the covariance matrix + +## R Code + +```R +pcal = function(data) { + centered_data = scale(data) + covariance = cov(centered_data) + eigen_stuff = eigen(covariance) + sorted_indices = sort(eigen_stuff$values, + index.return = T, + decreasing = T)$ix + loadings = eigen_stuff$values[sorted_indices] + components = eigen_stuff$vectors[sorted_indices,] + combined_list = list(loadings, components) + names(combined_list) = c("Loadings", "Components") + return(combined_list) +} +``` \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec4-2.md b/content/research/clusteranalysis/notes/lec4-2.md new file mode 100644 index 0000000..1cbad20 --- /dev/null +++ b/content/research/clusteranalysis/notes/lec4-2.md @@ -0,0 +1,24 @@ +# Revisiting Similarity Measures + +## Manhatten Distance + +An additional use case for Manhatten distance is when dealing with binary vectors. This approach, otherwise known as the Hamming distance, is the number of bits that are different between two binary vectors. + +## Ordinal Variables + +Ordinal variables can be treated as if they were on a interval scale. + +First, replace the ordinal variable value by its rank ($r_{if}$) Then map the range of each variable onto the interval $[0, 1]$ by replacing the $f_i$ where f is the variable and i is the object by +$$ +z_{if} = \frac{r_{if} - 1}{M_f - 1} +$$ +Where $M_f$ is the maximum rank. + +### Example + +Freshman = $0$ Sophmore = $\frac{1}{3}$ Junior = $\frac{2}{3}$ Senior = $1$ + +$d(freshman, senior) = 1$ + +$d(junior, senior) = \frac{1}{3}$ + diff --git a/content/research/clusteranalysis/notes/lec4-3.md b/content/research/clusteranalysis/notes/lec4-3.md new file mode 100644 index 0000000..b65b103 --- /dev/null +++ b/content/research/clusteranalysis/notes/lec4-3.md @@ -0,0 +1,40 @@ +# Cluster Tendency + +This is the assessment of the suitability of clustering. Cluster Tendency determines whether the data has any inherent grouping structure. + +This is a hard task since there are so many different definitions of clusters (portioning, hierarchical, density, graph, etc.) Even after fixing a cluster type, this is still hard in defining an appropriate null model for a data set. + +One way we can go about measuring cluster tendency is to compare the data against random data. On average, random data should not contain clusters. + +There are some clusterability assessment methods such as Spatial histogram, distance distribution and Hopkins statistic. + +## Hopkins Statistic + +Let $X$ be the set of $n$ data points in $d$ dimensional space. Consider a random sample (without replacement) of $m << n$ data points. Also generate a set $Y$ of $m$ uniformly randomly distributed data points. + +Now define two distance measures $u_i$ to be the distance of $y_i \in Y$ from its nearest neighbor in X and $w_i$ to be the distance of $x_i \in X$ from its nearest neighbor in X + +We can then define Hopkins statistic as +$$ +H = \frac{\sum_{i = 1}^m{u_i^d}}{\sum_{i = 1}^m{u_i^d} + \sum_{i =1}^m{w_i^d}} +$$ + +### Properties + +With this definition, uniform random data should tend to have values near 0.5, and clustered data should tend to have values nearer to 1. + +### Drawbacks + +However, data containing a single Gaussian will also score close to one. As this statistic measures deviation from a uniform distribution. Making this statistic less useful in application as real data is usually not remotely uniform. + + + +## Spatial Histogram Approach + +For this method, I'm not too sure how this works, but here are some key points I found. + +Divide each dimension in equal width bins, and count how many points lie in each of the bins and obtain the empirical joint probability mass function. + +Do the same for the randomly sampled data + +Finally compute how much they differ using the Kullback-Leibler (KL) divergence value. If it differs greatly than we can say that the data is clusterable. \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec4.md b/content/research/clusteranalysis/notes/lec4.md new file mode 100644 index 0000000..984a04f --- /dev/null +++ b/content/research/clusteranalysis/notes/lec4.md @@ -0,0 +1,171 @@ +# Principal Component Analysis Part 2: Formal Theory + +##Properties of PCA + +There are a number of ways to maximize the variance of a principal component. To create an unique solution we should impose a constraint. Let us say that the sum of the square of the coefficients must equal 1. In vector notation this is the same as +$$ +a_i^Ta_i = 1 +$$ +Every future principal component is said to be orthogonal to all the principal components previous to it. +$$ +a_j^Ta_i = 0, i < j +$$ +The total variance of the $q$ principal components will equal the total variance of the original variables +$$ +\sum_{i = 1}^q {\lambda_i} = trace(S) +$$ +Where $S$ is the sample covariance matrix. + +The proportion of accounted variation in each principle component is +$$ +P_j = \frac{\lambda_j}{trace(S)} +$$ +From this, we can generalize to the first $m$ principal components where $m < q$ and find the proportion $P^{(m)}$ of variation accounted for +$$ +P^{(m)} = \frac{\sum_{i = 1}^m{\lambda_i}}{trace(S)} +$$ +You can think of the first principal component as the line of best fit that minimizes the residuals orthogonal to it. + +### What to watch out for + +As a reminder to the last lecture, *PCA is not scale-invariant*. Therefore, transformations done to the dataset before PCA and after PCA often lead to different results and possibly conclusions. + +Additionally, if there are large differences between the variances of the original variables, then those whose variances are largest will tend to dominate the early components. + +Therefore, principal components should only be extracted from the sample covariance matrix when all of the original variables have roughly the **same scale**. + +### Alternatives to using the Covariance Matrix + +But it is rare in practice to have a scenario when all of the variables are of the same scale. Therefore, principal components are typically extracted from the **correlation matrix** $R$ + +Choosing to work with the correlation matrix rather than the covariance matrix treats the variables as all equally important when performing PCA. + +## Example Derivation: Bivariate Data + +Let $R$ be the correlation matrix +$$ +R = \begin{pmatrix} +1 & r \\ +r & 1 +\end{pmatrix} +$$ +Let us find the eigenvectors and eigenvalues of the correlation matrix +$$ +det(R - \lambda I) = 0 +$$ + +$$ +(1-\lambda)^2 - r^2 = 0 +$$ + +$$ +\lambda_1 = 1 + r, \lambda_2 = 1 - r +$$ + +Let us remember to check the condition "sum of the principal components equals the trace of the correlation matrix": +$$ +\lambda_1 + \lambda_2 = 1+r + (1 - r) = 2 = trace(R) +$$ + +###Finding the First Eigenvector + +Looking back at the characteristic equation +$$ +Ra_1 = \lambda a_1 +$$ +We can get the following two formulas +$$ +a_{11} + ra_{12} = (1+r)a_{11} \tag{1} +$$ + +$$ +ra_{11} + a_{12} = (1 + r)a_{12} \tag{2} +$$ + +Now let us find out what $a_{11}$ and $a_{12}$ equal. First let us solve for $a_{11}$ using equation $(1)$ +$$ +ra_{12} = (1+r)a_{11} - a_{11} +$$ + +$$ +ra_{12} = a_{11}(1 + r - 1) +$$ + +$$ +ra_{12} = ra_{11} +$$ + +$$ +a_{12} = a_{11} +$$ + +Where $r$ does not equal $0$. + +Now we must apply the condition of sum squares +$$ +a_1^Ta_1 = 1 +$$ + +$$ +a_{11}^2 + a_{12}^2 = 1 +$$ + +Recall that $a_{12} = a_{11}$ +$$ +2a_{11}^2 = 1 +$$ + +$$ +a_{11}^2 = \frac{1}{2} +$$ + +$$ +a_{11} =\pm \frac{1}{\sqrt{2}} +$$ + +For sake of choosing a value, let us take the principal root and say $a_{11} = \frac{1}{\sqrt{2}}$ + +###Finding the Second Eigenvector + +Recall the fact that each subsequent eigenvector is orthogonal to the first. This means +$$ +a_{11}a_{21} + a_{12}a_{22} = 0 +$$ +Substituting the values for $a_{11}$ and $a_{12}$ calculated in the previous section +$$ +\frac{1}{\sqrt{2}}a_{21} + \frac{1}{\sqrt{2}}a_{22} = 0 +$$ + +$$ +a_{21} + a_{22} = 0 +$$ + +$$ +a_{21} = -a_{22} +$$ + +Since this eigenvector also needs to satisfy the first condition, we get the following values +$$ +a_{21} = \frac{1}{\sqrt{2}} , a_{22} = \frac{-1}{\sqrt{2}} +$$ + +### Conclusion of Example + +From this, we can say that the first principal components are given by +$$ +y_1 = \frac{1}{\sqrt{2}}(x_1 + x_2), y_2 = \frac{1}{\sqrt{2}}(x_1-x_2) +$$ +With the variance of the first principal component being given by $(1+r)$ and the second by $(1-r)$ + +Due to this, as $r$ increases, so does the variance explained in the first principal component. This in turn, lowers the variance explained in the second principal component. + +## Choosing a Number of Principal Components + +Principal Component Analysis is typically used in dimensionality reduction efforts. Therefore, there are several strategies for picking the right number of principal components to keep. Here are a few: + +- Retain enough principal components to account for 70%-90% of the variation +- Exclude principal components where eigenvalues are less than the average eigenvalue +- Exclude principal components where eigenvalues are less than one. +- Generate a Scree Plot + - Stop when the plot goes from "steep" to "shallow" + - Stop when it essentially becomes a straight line. \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec5.md b/content/research/clusteranalysis/notes/lec5.md new file mode 100644 index 0000000..d6f874b --- /dev/null +++ b/content/research/clusteranalysis/notes/lec5.md @@ -0,0 +1,35 @@ +# Introduction to Connectivity Based Models + +Hierarchical algorithms combine observations to form clusters based on their distance. + +## Connectivity Methods + +Hierarchal Clustering techniques can be subdivided depending on the method of going about it. + +First there are two different methods in forming the clusters *Agglomerative* and *Divisive* + +Agglomerative is when you combine the n individuals into groups through each iteration + +Divisive is when you are separating one giant group into finer groupings with each iteration. + +Hierarchical methods are an irrevocable algorithm, once it joins or separates a grouping, it cannot be undone. As Kaufman and Rousseeuw (1990) colorfully comment: *"A hierarchical method suffers from the defect that it can never repair what was done in previous steps"*. + +It is the job of the statistician to decide when to stop the agglomerative or decisive algorithm, since having one giant cluster containing all observations or having each observation be a cluster isn't particularly useful. + +At different distances, different clusters are formed and are more readily represented using a **dendrogram**. These algorithms do not provide a unique solution but rather provide an extensive hierarchy of clusters that merge or divide at different distances. + +## Linkage Criterion + +Apart from the method of forming clusters, the user also needs to decide on a linkage criterion to use. Meaning, how do you want to optimize your clusters. + +Do you want to group based on the nearest points in each cluster? Nearest Neighbor Clustering + +Or do you want to based on the farthest observations in each cluster? Farthest neighbor clustering. + +![http://www.multid.se/genex/onlinehelp/clustering_distances.png](http://www.multid.se/genex/onlinehelp/clustering_distances.png) + +## Shortcomings + +This method is not very robust towards outliers, which will either show up as additional clusters or even cause other clusters to merge depending on the clustering method. + +As we go through this section, we will go into detail about the different linkage criterion and other parameters of this model. \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec6.md b/content/research/clusteranalysis/notes/lec6.md new file mode 100644 index 0000000..2c03e9e --- /dev/null +++ b/content/research/clusteranalysis/notes/lec6.md @@ -0,0 +1,90 @@ +# Agglomerative Methods + +## Single Linkage + +First let us consider the single linkage (nearest neighbor) approach. The clusters can be found through the following algorithm + +1. Find the smallest non-zero distance +2. Group the two objects together as a cluster +3. Recompute the distances in the matrix by taking the minimum distances + - Cluster a,b -> c = min(d(a, c), d(b, c)) + +Single linkage can operate directly on a proximity matrix, the actual data is not required. + +A wonderful visual representation can be found in Everitt Section 4.2 + +## Centroid Clustering + +This is another criterion measure that requires both the data and proximity matrix. These are the following steps of the algorithm. Requires Euclidean distance measure to preserve geometric correctness + +1. Find the smallest non-zero distance +2. Group the two objects together as a cluster +3. Recompute the distances by taking the mean of the clustered observations and computing the distances between all of the observations + - Cluster a,b -> c = d(mean(a, b), c) + +## Complete Linkage + +This is like Single Linkage, except now we're taking the farthest distance. The algorithm can be adjusted to the following + +1. Find the smallest non-zero distance +2. Group the two objects together as a cluster +3. Recompute the distances in the matrix by taking the maximum distances + - Cluster a,b -> c = max(d(a, c), d(b, c)) + +##Unweighted Pair-Group Method using the Average Approach (UPGMA) + +In this criterion, we are no longer summarizing each cluster before taking distances, but instead comparing each observation in the cluster to the outside point and taking the average + +1. Find the smallest non-zero distance +2. Group the two objects together as a cluster +3. Recompute the distances in the matrix by taking the mean + - Cluster A: a,b -> c = $mean_{i = 0}(d(A_i, c))$ + +## Median Linkage + +This approach is similar to the UPGMA approach, except now we're taking the median instead of the mean + +1. Find the smallest non-zero distance +2. Group the two objects together as a cluster +3. Recompute the distances in the matrix by taking the median + - Cluster A: a,b -> c = $median_{i = 0}{(d(A_i, c))}$ + +## Ward Linkage + +This one I didn't look too far into but here's the description: With Ward's linkage method, the distance between two clusters is the sum of squared deviations from points to centroids. The objective of Ward's linkage is to minimize the within-cluster sum of squares. + +## When to use different Linkage Types? + +According to the following two stack overflow posts: https://stats.stackexchange.com/questions/195446/choosing-the-right-linkage-method-for-hierarchical-clustering and https://stats.stackexchange.com/questions/195456/how-to-select-a-clustering-method-how-to-validate-a-cluster-solution-to-warran/195481#195481 + +These are the following ways you can justify a linkage type. + +**Cluster metaphor**. *"I preferred this method because it constitutes clusters such (or such a way) which meets with my concept of a cluster in my particular project."* + +**Data/method assumptions**. *"I preferred this method because my data nature or format predispose to it."* + +**Internal validity**. *"I preferred this method because it gave me most clear-cut, tight-and-isolated clusters."* + +**External validity**. *"I preferred this method because it gave me clusters which differ by their background or clusters which match with the true ones I know."* + +**Cross-validity**. *"I preferred this method because it is giving me very similar clusters on equivalent samples of the data or extrapolates well onto such samples."* + +**Interpretation**. *"I preferred this method because it gave me clusters which, explained, are most persuasive that there is meaning in the world."* + +### Cluster Metaphors + +Let us explore the idea of cluster metaphors now. + +**Single Linkage** or **Nearest Neighbor** is a *spectrum* or *chain*. + +Since single linkage joins clusters by the shortest link between them, the technique cannot discern poorly separated clusters. On the other hand, single linkage is one of the few clustering methods that can delineate nonelipsodial clusters. + +**Complete Linkage** or **Farthest Neighbor** is a *circle*. + + **Between-Group Average linkage** (UPGMA) is a united *class + +**Centroid method** (UPGMC) is *proximity of platforms* (commonly used in politics) + +## Dendrograms + +A **dendrogram** is a tree diagram frequently used to illustrate the arrangement of the clusters produced by hierarchical clustering. It shows how different clusters are formed at different distance groupings. \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec7.md b/content/research/clusteranalysis/notes/lec7.md new file mode 100644 index 0000000..2fe9e7a --- /dev/null +++ b/content/research/clusteranalysis/notes/lec7.md @@ -0,0 +1,74 @@ +# Divisive Methods Pt.1 + +Divisive methods work in the opposite direction of agglomerative methods. They take one large cluster and successively splits it. + +This is computationally demanding if all $2^{k - 1} - 1$ possible divisions into two sub-clusters of a cluster of $k$ objects are considered at each stage. + +While less common than Agglomerative methods, divisive methods have the advantage that most users are interested in the main structure in their data, and this is revealed from the outset of a divisive method. + +## Monothetic Divisive Methods + +For data consisting of $p$ **binary variables**, there is a computationally efficient method known as *monothetic divisive methods* available. + +Monothetic divisions divide clusters according to the presence or absence of each of the $p$ variables, so that at each stage, clusters contain members with certain attributes that are either all present or all absent. + +The term 'monothetic' refers to the use of a single variable on which to base the split on. *Polythetic* methods use all the variables at each stage. + +### Choosing the Variable to Split On + +The choice of the variable on which a split is made depends on optimizing a criterion reflecting either cluster homogeneity or association with other variables. + +This tends to minimize the number of splits that have to be made. + +An example of an homogeneity criterion is the information content $C$ + +This is defined with $p$ variables and $n$ objections where $f_k$ is the number of individuals with the $k$ attribute +$$ +C = pn\log{n}-\sum_{k = 1}^p{(f_k\log{f_k} - (n-f_k)\log{(n-f_k)})} +$$ + +### Association with other variables + +Recall that another way to split is based on the association with other variables. The attribute used at each step can be chosen according to its overall association with all attributes remaining at each step. + +This is sometimes termed *association analysis*. + +| | V1 | V2 | +| ---- | ---- | ---- | +| | 1 | 0 | +| 1 | a | b | +| 0 | c | d | + +####Common measures of association + +$$ +|ad-bc| \tag{4.6} +$$ + +$$ +(ad-bc)^2 \tag{4.7} +$$ + +$$ +\frac{(ad-bc)^2n}{(a+b)(a+c)(b+d)(c+d)} \tag{4.8} +$$ + +$$ +\sqrt{\frac{(ad-bc)^2n}{(a+b)(a+c)(b+d)(c+d)}} \tag{4.9} +$$ + +$$ +\frac{(ad-bc)^2}{(a+b)(a+c)(b+d)(c+d)} \tag{4.10} +$$ + +$(4.6)$ and $(4.7)$ have the advantage that there is no danger of computational problems if any marginal totals are near zero. + +The last three, $(4.8)$, $(4.9)$, $(4.10)$, are all related to the $\chi^2$ statistic, its square root, and the Pearson correlation coefficient respectively. + +### Advantages/Disadvantages of Monothetic Methods + +Appealing features of monothetic divisive methods are the easy classification of new members and the including of cases with missing values. + +A further advantage of monothetic divisive methods is that it is obvious which variables produce the split at any stage of the process. + +A disadvantage with these methods is that the possession of a particular attribute which is either rare or rarely found in combination with others may take an individual down a different path. \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec8.md b/content/research/clusteranalysis/notes/lec8.md new file mode 100644 index 0000000..0c47d8e --- /dev/null +++ b/content/research/clusteranalysis/notes/lec8.md @@ -0,0 +1,48 @@ +# Divisive Methods Pt 2. + +Recall in the previous section that we spoke about Monothetic and Polythetic methods. Monothetic methods only looks at a single variable at a time while Polythetic looks at multiple variables simultaneously. In this section, we will speak more about polythetic divisive methods. + +## Polythetic Divisive Methods + +Polythetic methods operate via a distance matrix. + +This procedure avoids considering all possible splits by + +1. Finding the object that is furthest away from the others within a group and using that as a seed for a splinter group. +2. Each object is then considered for entry to that separate splinter group: any that are closer to the splinter group than the main group is moved to the splinter one. +3. The step is then repeated. + +This process has been developed into a program named `DIANA` (DIvisive ANAlysis Clustering) which is implemented in `R`. + +### Similarities to Politics + +This somewhat resembles a way a political party might split due to inner conflicts. + +Firstly, the most discontented member leaves the party and starts a new one, and then some others follow him until a kind of equilibrium is attained. + +## Methods for Large Data Sets + +There are two common hierarchical methods used for large data sets `BIRCH` and `CURE`. Both of these algorithms employ a pre-clustering phase in where dense regions are summarized, the summaries being then clustered using a hierarchical method based on centroids. + +### CURE + +1. `CURE` starts with a random sample of points and represents clusters by a smaller number of points that capture the shape of the cluster +2. Which are then shrunk towards the centroid as to dampen the effect of the outliers +3. Hierarchical clustering then operates on the representative points + +`CURE` has been shown to be able to cope with arbitrary-shaped clusters and in that respect may be superior to `BIRCH`, although it does require judgment as to the number of clusters and also a parameter which favors either more or less compact clusters. + +## Revisiting Topics: Cluster Dissimilarity + +In order to decide where clusters should be combined (for agglomerative), or where a cluster should be split (for divisive), a measure of dissimilarity between sets of observations is required. + +In most methods of hierarchical clustering this is achieved by a use of an appropriate + +- Metric (a measure of distance between pairs of observations) +- Linkage Criterion (which specifies the dissimilarities of sets as functions of pairwise distances observations in the sets) + +## Advantages of Hierarchical Clustering + +- Any valid measure of distance measure can be used +- In most cases, the observations themselves are not required, just hte matrix of distances + - This can have the advantage of only having to store a distance matrix in memory as opposed to a n-dimensional matrix. \ No newline at end of file diff --git a/content/research/clusteranalysis/notes/lec9-1.md b/content/research/clusteranalysis/notes/lec9-1.md new file mode 100644 index 0000000..d8bb4da --- /dev/null +++ b/content/research/clusteranalysis/notes/lec9-1.md @@ -0,0 +1,58 @@ +# CURE and TSNE + +##Clustering Using Representatives (CURE) + +Clustering using Representatives is a Hierarchical clustering technique in which you can represent a cluster using a **set** of well-scattered representative points. + +This algorithm has a parameter $\alpha$ which defines the factor of the points in which to shrink towards the centroid. + +CURE is known to be robust to outliers and able to identify clusters that have a **non-spherical** shape and size variance. + +The clusters with the closest pair of representatives are the clusters that are merged at each step of CURE's algorithm. + +This algorithm cannot be directly applied to large datasets due to high runtime complexity. Several enhancements were added to address this requirement + +- Random sampling: This involves a trade off between accuracy and efficiency. One would hope that the random sample they obtain is representative of the population +- Partitioning: The idea is to partition the sample space into $p$ partitions + +Youtube Video: https://www.youtube.com/watch?v=JrOJspZ1CUw + +Steps + +1. Pick a random sample of points that fit in main memory +2. Cluster sample points hierarchically to create the initial clusters +3. Pick representative point**s** + 1. For each cluster, pick $k$ representative points, as dispersed as possible + 2. Move each representative points to a fixed fraction $\alpha$ toward the centroid of the cluster +4. Rescan the whole dataset and visit each point $p$ in the data set +5. Place it in the "closest cluster" + 1. Closest as in shortest distance among all the representative points. + +## TSNE + +TSNE allows us to reduce the dimensionality of a dataset to two which allows us to visualize the data. + +It is able to do this since many real-world datasets have a low intrinsic dimensionality embedded within the high-dimensional space. + +Since the technique needs to conserve the structure of the data, two corresponding mapped points must be close to each other distance wise as well. Let $|x_i - x_j|$ be the Euclidean distance between two data points, and $|y_i - y_j|$ he distance between the map points. This conditional similarity between two data points is: +$$ +p_{j|i} = \frac{exp(-|x_i-x_j|^2 / (2\sigma_i^2))}{\sum_{k \ne i}{exp(-|x_i-x_k|^2/(2\sigma_i^2))}} +$$ +Where we are considering the **Gaussian distribution** surrounding the distance between $x_j$ from $x_i$ with a given variance $\sigma_i^2$. The variance is different for every point; it is chosen such that points in dense areas are given a smaller variance than points in sparse areas. + +Now the similarity matrix for mapped points are +$$ +q_{ij} = \frac{f(|x_i - x_j|)}{\sum_{k \ne i}{f(|x_i - x_k)}} +$$ +Where $f(z) = \frac{1}{1 + z^2}$ + +This has the same idea as the conditional similarity between two data points, except this is based on the **Cauchy distribution**. + +TSNE works at minimizing the Kullback-Leiber divergence between the two distributions $p_{ij}$ and $q_{ij}$ +$$ +KL(P || Q) = \sum_{i,j}{p_{i,j} \log{\frac{p_{ij}}{q_{ij}}}} +$$ +To minimize this score, gradient descent is typically performed +$$ +\frac{\partial KL(P||Q)}{\partial y_i} = 4\sum_j{(p_{ij} - q_{ij})} +$$ diff --git a/content/research/clusteranalysis/notes/lec9-2.md b/content/research/clusteranalysis/notes/lec9-2.md new file mode 100644 index 0000000..26c3dcf --- /dev/null +++ b/content/research/clusteranalysis/notes/lec9-2.md @@ -0,0 +1,72 @@ +# Cluster Validation + +There are multiple approaches to validating your cluster models + +- Internal Evaluation: This is when you summarize the clustering into a single score. For example, minimizing the the deviations from the centroids. +- External Evaluation: Minimizing the deviations from some known "labels" +- Manual Evaluation: A human expert decides whether or not it's good +- Indirect Evaluation: Evaluating the utility of clustering in its intended application. + +## Some Problems With These Evaluations + +Internal evaluation measures suffer form the problem that they represent functions that are objectives for many clustering algorithms. So of course the result of the clustering algorithm will be such that the objective would be minimized. + +External evaluation suffers from the fact that if we had labels to begin with then we wouldn't need to cluster. Practical applications of clustering occur usually when we don't have labels. On the other hand, possible labeling can reflect one possible partitioning of the data set. There could exist different, perhaps even better clustering. + +## Internal Evaluation + +We like to see a few qualities in cluster models + +- *Robustness*: Refers to the effects of errors in data or missing observations, and changes in the data and methods. +- *Cohesiveness*: Clusters should be compact or high high intra-cluster similarity. +- Clusters should be dissimilar to separate clusters. Should have low inter-cluster similarity +- *Influence*: We should pay attention to and try to control for the influence of certain observations on the overall cluster + +Let us focus on the second and third bullet point for now. Internal evaluation measures are best suited to get some insight into situations where one algorithm performs better than another, this does not imply that one algorithm produces more valid results than another. + +### Davies-Bouldin Index + +$$ +DB = \frac{1}{n}\sum_{i=1}^n{max_{j\ne i}{(\frac{\sigma_i + \sigma_j}{d(c_i,c_j)})}} +$$ + +Where $n$ is the number of clusters, $c$ indicates a centroid, and $\sigma$ represents the deviation from the centroid. + +Better clustering algorithms are indicated by smaller DB values. + +### Dunn Index + +$$ +D= \frac{min_{1\le i < j \le n}{d(i,j)}}{max_{1\le k \le n}{d^\prime(k)}} +$$ + +The Dunn index aims to identify dense and well-separated clusters. This is defined as the ratio between the minimal inter-cluster distance to maximal intra-cluster distance. + +High Dunn Index values are more desirable. + +###Bootstrapping + +In terms of robustness we can measure uncertainty in each of the individual clusters. This can be examined using a bootstrapping approach by Suzuki and Shimodaira (2006). The probability or "p-value" is the proportion of bootstrapped samples that contain the cluster. Larger p-values in this case indicate more support for the cluster. + +This is available in R via `Pvclust` + +### Split-Sample Validation + +One approach to assess the effects of perturbations of the data is by randomly dividing the data into two subsets and performing an analysis on each subset separately. This method was proposed by McIntyre and Blashfield in 1980; their method involves the following steps + +- Divide the sample in two and perform a cluster analysis on one of the samples + - Have a fixed rule for the number of clusters +- Determine the centroids of the clusters, and compute proximities between the objects in teh second sample and the centroids, classifying the objects into their nearest cluster. +- Cluster the second sample using the same methods as before and compare these two alternate clusterings using something like the *adjusted Rand index*. + +![Adjusted Index](https://wikimedia.org/api/rest_v1/media/math/render/svg/b1850490e5209123ab6e5b905495b4d5f9a1f661) + +## Influence of Individual Points + +Using internal evaluation metrics, you can see the impact of each point by doing a "leave one out" analysis. Here you evaluate the dataset minus one point for each of the points. If a positive difference is found, the point is regarded as a *facilitator*, whereas if it is negative then it is considered an *inhibitor*. once an influential inhibitor is found, the suggestion is to normally omit it from the clustering. + +## R Package + +`clValid` contains a variety of internal validation measures. + +Paper: https://cran.r-project.org/web/packages/clValid/vignettes/clValid.pdf \ No newline at end of file diff --git a/content/research/clusteranalysis/readings.md b/content/research/clusteranalysis/readings.md new file mode 100644 index 0000000..27cc818 --- /dev/null +++ b/content/research/clusteranalysis/readings.md @@ -0,0 +1,35 @@ +# Readings for Lectures of Cluster Analysis + +## Lecture 1 +Garson Textbook Chapter 3 + +## Lecture 2 +[A Tutorial on Principal Component Analysis](https://arxiv.org/pdf/1404.1100.pdf) + +## Lecture 3 +No Readings + +## Lecture 4 +An Introduction to Applied Multivariate Analysis with R by Brian Evveritt and Torsten Horthorn. + +Sections 3.0-3.9 Everitt + +## Lecture 5 + +Section 4.1 Everitt + +## Lecture 6 +Section 4.2 Everitt + +Applied Multivariate Statistical Analysis Johnson Section 12.3 + +[Linkage Methods for Cluster Observations](https://support.minitab.com/en-us/minitab/18/help-and-how-to/modeling-statistics/multivariate/how-to/cluster-observations/methods-and-formulas/linkage-methods/#mcquitty) + +## Lecture 7 +Section 4.3 Everitt + +## Lecture 8 +[Introduction to the TSNE Algorithm](https://www.oreilly.com/learning/an-illustrated-introduction-to-the-t-sne-algorithm) + +## Lecture 9 +Section 9.5 Everitt diff --git a/content/research/clusteranalysis/syllabus.md b/content/research/clusteranalysis/syllabus.md new file mode 100644 index 0000000..002dc8a --- /dev/null +++ b/content/research/clusteranalysis/syllabus.md @@ -0,0 +1,119 @@ +# Cluster Analysis Spring 2018 + +### Distance, Dimensionality Reduction, and Tendency + +- Distance + - Euclidean Distance + - Squared Euclidean Distance + - Manhattan Distance + - Maximum Distance + - Mahalanobis Distance +- Which distance function should you use? +- PCA +- Cluster Tendency + - Hopkins Statistic +- Scaling Data + +### Validating Clustering Models + +- Clustering Validation +- Cross Validation + +### Connectivity Models + +- Agglomerative Clustering + - Single Linkage Clustering + - Complete Linkage Clustering + - Unweighted Pair Group Method with Arithmetic Mean (If time permits) +- Dendrograms +- Divisive Clustering +- CURE (Clustering using REpresentatives) algorithm (If time permits) + +### Cluster Evaluation + +- Internal Evaluation + - Dunn Index + - Silhouette Coefficient + - Davies-Bouldin Index (If time permits) +- External Evaluation + - Rand Measure + - Jaccard Index + - Dice Index + - Confusion Matrix + - F Measure (If time permits) + - Fowlkes-Mallows Index (If time permits) + +### Centroid Models + +- Jenks Natural Breaks Optimization +- Voronoi Diagram +- K means clustering +- K medoids clustering +- K Medians/Modes clustering +- When to use K means as opposed to K medoids or K Medians? +- How many clusters should you use? +- Lloyd's Algorithm for Approximating K-means (If time permits) + +### Density Models + +- DBSCAN Density Based Clustering Algorithm +- OPTICS Ordering Points To Identify the Clustering Structure +- DeLi-Clu Density Link Clustering (If time permits) +- What should be your density threshold? + +### Analysis of Model Appropriateness + +- When do we use each of the models above? + +### Distribution Models (If time permits) + +- Fuzzy Clusters +- EM (Expectation Maximization) Clustering +- Maximum Likelihood Gaussian +- Probabilistic Hierarchal Clustering + + + + +## Textbooks + +Cluster Analysis 5th Edition + +- Authors: Brian S. Everitt, Sabine Landau, Morven Leese, Daniel Stahl +- ISBN-13: 978-0470749913 +- Cost: Free on UMW Library Site +- Amazon Link: https://www.amazon.com/Cluster-Analysis-Brian-S-Everitt/dp/0470749911/ref=sr_1_1?ie=UTF8&qid=1509135983&sr=8-1 +- Table of Contents: http://www.wiley.com/WileyCDA/WileyTitle/productCd-EHEP002266.html + +Cluster Analysis: 2014 Edition (Statistical Associates Blue Book Series 24) + +- Author: David Garson +- ISBN: 978-1-62638-030-1 +- Cost: Free with Site Registration +- Website: http://www.statisticalassociates.com/clusteranalysis.htm + + + +## Schedule + +In an ideal world, the topics below I estimated being a certain time period for learning them. Of course you have more experience when it comes to how long it actually takes to learn these topics, so I'll leave this mostly to your discretion. + +**Distance, Dimensionality Reduction, and Tendency** -- 3 Weeks + +**Validating Cluster Models** -- 1 Week + +**Connectivity Models** -- 2 Weeks + +**Cluster Evaluation** -- 1 Week + +**Centroid Models** -- 3 Weeks + +**Density Models** -- 3 Weeks + +**Analysis of Model Appropriateness** -- 1 Week + +The schedule above accounts for 14 weeks, so there is a week that is free as a buffer. + +## Conclusion + +Creating this document got me really excited for this independent study. Feel free to give me feedback :) \ No newline at end of file diff --git a/content/research/deepreinforcementlearning.md b/content/research/deepreinforcementlearning.md new file mode 100644 index 0000000..da28df2 --- /dev/null +++ b/content/research/deepreinforcementlearning.md @@ -0,0 +1,22 @@ +--- +Title: Deep Reinforcement Learning +Description: Combining Reinforcement Learning with Deep Learning +--- + +In the Fall of 2019, I look at integrating demonstration data into a reinforcement learning algorithm in order to make it sample efficient. + +The results are positive and are heavily documented through the following: + +[Honors Thesis](/files/research/honorsthesis.pdf) + +[Honors Defense](/files/research/ExpeditedLearningInteractiveDemo.pptx) + +Thanks to my advisor Dr. Ron Zacharksi and my committee members for all their feedback on my work! + +In the spring of 2019, under the guidance of Dr. Ron Zacharski I practiced several of the modern techniques used in Reinforcement Learning today. + +I facilitated my learning by creating a [reinforcement learning library](https://github.com/brandon-rozek/rltorch) with implementations of several popular papers. ([Semi-Weekly Progress](weeklyprogress)) + +I also presented my research (which involved creating an algorithm) at my school's research symposium. ([Slides](/files/research/QEP.pptx)) ([Abstract](abstractspring2019)) + +In the summer of 2019, I became interested in having the interactions with the environment be in a separate process. This inspired two different implementations, [ZeroMQ](https://github.com/brandon-rozek/zerogym) and [HTTP](https://github.com/brandon-rozek/gymhttp). Given the option, you should use the ZeroMQ implementation since it contains less communication overhead. diff --git a/content/research/deepreinforcementlearning/WeeklyProgress.md b/content/research/deepreinforcementlearning/WeeklyProgress.md new file mode 100644 index 0000000..cc9d00c --- /dev/null +++ b/content/research/deepreinforcementlearning/WeeklyProgress.md @@ -0,0 +1,13 @@ +## Weekly Progress + +I didn't do the greatest job at writing a progress report every week but here on the page are the ones I did write. + +[January 29 2019](Jan29) + +[February 12 2019](Feb12) + +[February 25 2019](Feb25) + +[March 26 2019](Mar26) + +[April 2 2019](Apr2) \ No newline at end of file diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/1550549326169.png b/content/research/deepreinforcementlearning/WeeklyProgress/1550549326169.png new file mode 100644 index 0000000..b327209 Binary files /dev/null and b/content/research/deepreinforcementlearning/WeeklyProgress/1550549326169.png differ diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/1550590562084.png b/content/research/deepreinforcementlearning/WeeklyProgress/1550590562084.png new file mode 100644 index 0000000..bb4e2d9 Binary files /dev/null and b/content/research/deepreinforcementlearning/WeeklyProgress/1550590562084.png differ diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/1551158699648.png b/content/research/deepreinforcementlearning/WeeklyProgress/1551158699648.png new file mode 100644 index 0000000..b159eb4 Binary files /dev/null and b/content/research/deepreinforcementlearning/WeeklyProgress/1551158699648.png differ diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/1551158802225.png b/content/research/deepreinforcementlearning/WeeklyProgress/1551158802225.png new file mode 100644 index 0000000..6385c07 Binary files /dev/null and b/content/research/deepreinforcementlearning/WeeklyProgress/1551158802225.png differ diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/1551160033552.png b/content/research/deepreinforcementlearning/WeeklyProgress/1551160033552.png new file mode 100644 index 0000000..4ebb6b0 Binary files /dev/null and b/content/research/deepreinforcementlearning/WeeklyProgress/1551160033552.png differ diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/Apr2.md b/content/research/deepreinforcementlearning/WeeklyProgress/Apr2.md new file mode 100644 index 0000000..33f81ca --- /dev/null +++ b/content/research/deepreinforcementlearning/WeeklyProgress/Apr2.md @@ -0,0 +1,25 @@ +# Progress Report for Week of April 2nd + +## Added Video Recording Capability to MinAtar environment + +You can now use the OpenAI Monitor Wrapper to watch the actions performed by agents in the MinAtar suite. (Currently the videos are in grayscale) + +Problems I had to solve: + +- How to represent the channels into a grayscale value +- Getting the tensor into the right format (with shape and dtype) +- Adding additional meta information that OpenAI expected + +## Progress Towards \#Exploration + +After getting nowhere trying to combine the paper on Random Network Distillation and Count-based exploration and Intrinsic Motivation, I turned the paper \#Exploration: A Study of Count-Based Exploration for Deep Reinforcement Learning. + +This paper uses the idea of an autoencoder to learn a smaller latent state representation of the input. We can then use this smaller representation as a hash and count states based on these hashes. + +Playing around with the ideas of autoencoders, I wanted a way to discretized my hash more than just what floating point precision allows. Of course this turns it into a non-differential function which I then tried turning towards Evolutionary methods to solve. Sadly the rate of optimization was drastically diminished using the Evolutionary approach. Therefore, my experiments for this week failed. + +I'll probably look towards implementing what the paper did for my library and move on to a different piece. + + + +Guru Indian: 3140 Cowan Blvd, Fredericksburg, VA 22401 \ No newline at end of file diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/Feb12.md b/content/research/deepreinforcementlearning/WeeklyProgress/Feb12.md new file mode 100644 index 0000000..2f419a1 --- /dev/null +++ b/content/research/deepreinforcementlearning/WeeklyProgress/Feb12.md @@ -0,0 +1,63 @@ +# Weekly Progress Feb 12 + +## Finished writing scripts for data collection + +- Playing a game now records + - Video + - State / Next-State as pixel values + - Action taken + - Reward Received + - Whether the environment is finished every turn +- Wrote scripts to gather and preprocess the demonstration data + - Now everything is standardized on the npy format. Hopefully that stays consistent for a while. + +## Wrote code to create an actor that *imitates* the demonstrator + +Tweaked the loss function to be a form of cross-entropy loss +$$ +loss = max(Q(s, a) + l(s,a)) - Q(s, a_E) +$$ +Where $l(s, a)$ is zero for the action the demonstrator took and positive elsewhere. + +Turns out, that as with a lot of deep learning applications, you need a lot of training data. So the agent currently does poorly on mimicking the performance of the demonstrator. + +### Aside : Pretraining with the Bellman Equation + +Based off the paper: + +Todd Hester, Matej Vecerik, Olivier Pietquin, arc Lanctot, Tom Schaul, Bilal Piot, Andrew Sendonaris, Gabriel Dulac-Arnold, Ian OsbandI, John Agapiou, Joel Z. Leibo, Audrunas Gruslys. **Learning from Demonstrations for Real World Reinforcement Learning** + + + +This paper had the demonstration not include include the $(state, action)$ pairs like I did, but also the $(next_state, reward, done)$ signals. This way, they can pretrain with both supervised loss and with the general Q-learning loss. + +That way, they can use the result of the pretraining as a starting ground for the actual training. The way I implemented it, I would first train an imitator which would then be used as the actor during the simulations from which we would collect data and begin training another net. + +## Prioritized Replay + +Instead of uniform sampling of experiences, we can sample by how surprised we were about the outcome of the Q-value loss. + +I had a previous implementation of this, but it was faulty, so I took the code from OpenAI baselines and integrated it with my library. + +It helps with games like Pong, because there are many states where the result is not surprising and inconsequential. Like when the ball is around the center of the field. + +## Schedulers + +There are some people who use Linear Schedulers to change the value of various parameters throughout training. + +I implemented it as an iterator in python and called *next* for each time the function uses the hyper-parameter. + +The two parameters I use schedulers in normally are: + +- Epsilon - Gradually decreases exploration rate +- Beta - Decreases the importance of the weights of experiences that get frequently sampled + + + +## Layer Norm + +"Reduces training by normalizes the activities of the neurons." + +Jimmy Lei Ba, Jamie Ryan Kiros, Geoffrey E. Hinton. **Layer Normalization.** + +It's nicely implemented in PyTorch already so I threw that in for each layer of the network. Reduces the average loss. \ No newline at end of file diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/Feb25.md b/content/research/deepreinforcementlearning/WeeklyProgress/Feb25.md new file mode 100644 index 0000000..5d125fe --- /dev/null +++ b/content/research/deepreinforcementlearning/WeeklyProgress/Feb25.md @@ -0,0 +1,117 @@ +# Weekly Progress for February 25th + +## Evolutionary Algorithms + +### Genetic Algorithm + +I worked towards implementing the Genetic Algorithm into PyTorch. I got a working implementation which operates like the following: + +Generate $n$ perturbations of the model by taking the tensors in the model dictionary and add some random noise to them. + +- Calculate the fitness of each model +- Keep the $k$ best survivors +- Sample (with replacement) $2(n - k)$ parents based on their fitness. (Higher fitness -> More likely to be sampled) + + - Easy way to do this is: $prob = fitness / sum(fitness)$ +- Split the parents in half to $parent1$ and $parent2$ +- Perform crossover in order to make children + + - For every tensor in the model dictionary + + - Find a point in where you want the split to happen + - Create a new tensor: the left part of the split comes from $parent1$, the other side from $parent2$ + - Mutate the child with $\epsilon$ probability + - Add random noise to the tensor + +Normally if you perform this algorithm with many iterations, your results start to converge towards a particular solution. + +The main issue with this algorithm is that you need to carry with you $n$ models of the environment throughout the entire training process. You also need to have a somewhat good definition of the bounds of which your weights and biases can be otherwise the algorithm might not converge to the true value. + +Due to these reasons, I didn't end up adding this functionality to RLTorch. + +### Evolutionary Strategies + +To combat these issues, I knocked into a paper by OpenAI Called "Evolutionary Strategies" + +Tim Salimans, Jonathan Ho, Xi Chen, Szymon Sidor, Ilya Sutskever. **Evolution Strategies as a Scalable Alternative to Reinforcement Learning** + +https://arxiv.org/abs/1703.03864 + +*This paper mostly describes the efforts made to make a certain evolutionary strategy scalable to many nodes. I ended up using only the algorithm from the paper and I didn't implement any of the scalable considerations.* + +The following code below explains the process for maximizing a simple function + +```python +white_noise = np.random.randn(population_size, *current_solution.shape) +noise = sigma * white_noise +candidate_solutions = current_solution + noise + +# Calculate fitness, mean shift, and scale +fitness_values = calculate_fitness(candidate_solutions) +fitness_values = (fitness_values - np.mean(fitness_values)) / (np.std(fitness_values) + np.finfo('float').eps) + +new_solution = current_solution + learning_rate * np.mean(white_noise.T * fitness_values, axis = 1) / sigma +``` + +To explain further, suppose you have a guess as to what the solution is. To generate new guesses, let us add random noise around our guess like the image below. + +![1551158699648](/home/rozek/Documents/Research/Deep RL/WeeklyProgress/1551158699648.png) + +Now calculate the fitness of all the points, let us represent that by the intensity of blue in the background, + +![1551158802225](/home/rozek/Documents/Research/Deep RL/WeeklyProgress/1551158802225.png) + +What ends up happening is that your new solution, the black square, will move towards the areas with higher reward. + +## Q-Evolutionary Policies + +**Motivation** + +So this brings up the point, why did I bother studying these algorithms? I ran into a problem when I was looking to implement the DDPG algorithm. Primarily that it required your action space to be continuous, which is not something I'm currently on. + +Then I thought, why can I not make it work with discrete actions? First let us recall the loss of a policy function under DDPG: +$$ +loss_\pi = -Q(s, \pi(s)) +$$ +For the discrete case, your Q-function is going to be a function of the state and output the values of each action taken under that state. In mathematical terms, +$$ +loss_\pi = -Q(s)[\pi(s)] +$$ +Indexing into another array, however, is not a differentiable function. Meaning I cannot then calculate $loss_\pi$ with respect to $\pi$. + +Evolutionary Strategies are non-gradient based methods. Meaning that I can bypass this restriction with the traditional methods. + +**How it works** + +Train your Value function with the typical DQN loss. + +Every 10 Value function updates, update the policy. This gives time for the Value function to stabilize so that the policy is not chasing suboptimal value functions. Update the policy according to the $loss_\pi$ written above. + +**Results** + +![1551160033552](/home/rozek/Documents/Research/Deep RL/WeeklyProgress//1551160033552.png) + +The orange line is the QEP performance + +Blue is DQN + +## Future Direction + +I would like to look back towards demonstration data and figure out a way to pretrain a QEP model. + +It's somewhat easy to think of a way to train the policy. Make it a cross-entropy loss with respect to the actions the demonstrator took. +$$ +loss_\pi = -\sum_{c=1}^M{y_{o,c}\ln{(p_{o,c})}} +$$ +Where $M$ is the number of classes, $y$ is the binary indicator for whether the correction classification was observed, and $p$ is the predicted probability observation for class c. + +It's harder to think about how I would do it for a Value function. There was the approach we saw before where the loss function was like so, +$$ +loss_Q = max(Q(s, a) + l(s,a)) - Q(s, a_E) +$$ +Where $l(s, a)$ is a vector that is positive for all values except for what the demonstrator took which is action $a_E$. + +The main issue with this loss function for the Value is that it does not capture the actual output values of the functions, just how they are relative to each other. Perhaps adding another layer can help transform it to the values it needs to be. This will take some more thought. + + + diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/Jan29.md b/content/research/deepreinforcementlearning/WeeklyProgress/Jan29.md new file mode 100644 index 0000000..a203d4f --- /dev/null +++ b/content/research/deepreinforcementlearning/WeeklyProgress/Jan29.md @@ -0,0 +1,65 @@ +# Weekly Progress Jan 29 + +## 1. Training From Demonstrations + +Training from demonstrations is the act of using previous data to help speed up the learning process. + +I read two papers on the topic: + +[1] Gabriel V. de la Cruz Jr., Yunshu Du, Matthew E. Taylor. **Pre-training Neural Networks with Human Demonstrations for Deep Reinforcement Learning**. + +https://arxiv.org/abs/1709.04083 + +The authors showed how you can speed up the training of a DQN network, especially under problems involving computer vision, if you first train the convolution layers by using a supervised loss between the actions the network would choose and the actions from the demonstration data given a state. + +[2] Todd Hester, Matej Vecerik, Olivier Pietquin, Marc Lanctot, Tom Schaul, Bilal Piot, Dan Horgan, John Quan, Andrew Sendonaris, Gabriel Dulac-Arnold, Ian Osband, John Agapiou, Joel Z. Leibo, Audrunas Gruslys. **Deep Q-learning from Demonstrations.** + +https://arxiv.org/abs/1704.03732 + +The authors showed how from "expert" demonstrations we can speed up the training of a DQN by incorporating the supervised loss into the loss function. + +### Supervised Loss + +What is supervised loss in the context of DQNs? +$$ +Loss = max(Q(s, a)+l(s,a )) - Q(s, a_E) +$$ +Where $a_E$ is the expert action, and $l(s, a)$ is a vector of positive values with an entry of zero for the expert action. + +The intuition behind this is that for the loss to be zero, the network would've had to have chosen the same action as the expert. The $l(s, a)$ term exists to ensure that there are no ties. + +### What I decided to do + +The main environment I chose to test these algorithms is Acrobot. It is a control theory problem and it has several physics related numbers as input. (Not image based) + +I noticed when implementing [1] at least for the non-convolution case, there's no point in trying to train earlier layers. Perhaps I'll try again when I move onto the atari gameplays... + +I decided against following [2] exactly. It's not that I disagree with the approach, but I don't like the need for "expert" data. If you decide to proceed anyways with non-expert data, you need to remember that it is incorporated into the loss function. Which means that you fall risk into learning sub-optimal policies. + +In the end, what I decided to do was the following + +1. Train a neural network that maps states->actions from demonstration data +2. Use that network to play through several simulated runs of the environment, state the (state, action, reward, next_state, done) signals and insert it into the experience replay buffer and train from those (**Pretrain step**) +3. Once the pretrain step is completed, replace the network that maps from demonstration data with the one you've been training in the pre-training step and continue with the regular algorithm + + + +## 2. Noisy Networks + +Based on this paper... + +Meire Fortunato, Mohammad Gheshlaghi Azar, Bilal Piot, Jacob Menick, Ian Osband, Alex Graves, Vlad Mnih, Remi Munos, Demis Hassabis, Olivier Pietquin, Charles Blundell, Shane Legg. **Noisy Networks for Exploration.** + +This paper describes adding parametric noise to the weights and biases and how it aids in exploration. The parameters of the noise are learned with gradient descent along with the other network parameters. + + + +For the noise distribution I used the Gaussian Normal. One property that's handy to know about it is the following +$$ +N(\mu, \sigma) = \mu + \sigma*N(0, 1) +$$ +In our case, the $\mu$ would be the typical weights and biases, and the $\sigma$ is a new parameter representing how much variation or uncertainty needs to be added. + +The concept is that as the network grows more confident about it's predictions, the variation in the weights start to decrease. This way the exploration is systematic and not something randomly injected like the epsilon-greedy strategy. + +The paper describes replacing all your linear densely connected layers with this noisy linear approach. \ No newline at end of file diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/Mar26.md b/content/research/deepreinforcementlearning/WeeklyProgress/Mar26.md new file mode 100644 index 0000000..bc303eb --- /dev/null +++ b/content/research/deepreinforcementlearning/WeeklyProgress/Mar26.md @@ -0,0 +1,11 @@ +# Progress for Week of March 26 + +## Parallelized Evolutionary Strategies + +When the parallel ES class is declared, I start a pool of workers that then gets sent with a loss function and its inputs to compute whenever calculating gradients. + +## Started Exploring Count-Based Exploration + +I started looking through papers on Exploration and am interested in using the theoretical niceness of Count-based exploration in tabular settings and being able to see their affects in the non-tabular case. + +""[Unifying Count-Based Exploration and Intrinsic Motivation](https://arxiv.org/abs/1606.01868)" creates a model of a arbitrary density model that follows a couple nice properties we would expect of probabilities. Namely, $P(S) = N(S) / n$ and $P'(S) = (N(S) + 1) / (n + 1)$. Where $N(S)$ represents the number of times you've seen that state, $n$ represents the total number of states you've seen, and $P'(S)$ represents the $P(S)$ after you have seen $S$ another time. With this model, we are able to solve for $N(S)$ and derive what the authors call a *Psuedo-Count*. \ No newline at end of file diff --git a/content/research/deepreinforcementlearning/WeeklyProgress/breakout.gif b/content/research/deepreinforcementlearning/WeeklyProgress/breakout.gif new file mode 100644 index 0000000..383917f Binary files /dev/null and b/content/research/deepreinforcementlearning/WeeklyProgress/breakout.gif differ diff --git a/content/research/deepreinforcementlearning/abstractspring2019.md b/content/research/deepreinforcementlearning/abstractspring2019.md new file mode 100644 index 0000000..3a8d5f0 --- /dev/null +++ b/content/research/deepreinforcementlearning/abstractspring2019.md @@ -0,0 +1,15 @@ +--- +showthedate: false +--- + +**Name:** Brandon Rozek + +Department of Computer Science + +**Mentor:** Dr. Ron Zacharski + +QEP: The Q-Value Policy Evaluation Algorithm + + + +*Abstract.* In Reinforcement Learning, sample complexity is often one of many concerns when designing algorithms. This concern outlines the number of interactions with a given environment that an agent needs in order to effectively learn a task. The Reinforcement Learning framework consists of finding a function (the policy) that maps states/scenarios to actions while maximizing the amount of reward from the environment. For example in video games, the reward is often characterized by some score. In recent years a variety of algorithms came out falling under the categories of Value-based methods and Policy-based methods. Value-based methods create a policy by approximating how much reward an agent is expected to receive if it performs the best actions from a given state. It is then common to choose the actions that maximizes such values. Meanwhile, in Policy-based methods, the policy function produces probabilities that an agent performs each action given a state and this is then optimized for the maximum reward. As such, Value-based methods produce deterministic policies while policy-based methods produce stochastic/probabilistic policies. Empirically, Value-based methods have lower sample complexity than Policy-based methods. However, in decision making not every situation has a best action associated with it. This is mainly due to the fact that real world environments are dynamic in nature and have confounding variables affecting the result. The QEP Algorithm combines both the Policy-based methods and Value-based methods by changing the policy's optimization scheme to involve approximate value functions. We have shown that this combines the benefits of both methods so that the sample complexity is kept low while maintaining a stochastic policy. \ No newline at end of file diff --git a/content/research/dimensionalityreduction.md b/content/research/dimensionalityreduction.md new file mode 100644 index 0000000..e8b9229 --- /dev/null +++ b/content/research/dimensionalityreduction.md @@ -0,0 +1,17 @@ +--- +Title: Dimensionality Reduction +Description: Reducing High Dimensional Datasets to what we can digest. +showthedate: false +--- + +# Dimensionality Reduction + +In the Summer of 2018, I was going to embark with another study on the topics pertaining to Dimensionality Reduction. Sadly the other student became busy a few weeks into the study. I decided to upload what we got through anyways for completeness. + +[Syllabus](syllabus) + +[Intro](intro) + +[Feature Selection](featureselection) + +[Optimality Criteria](optimalitycriteria) \ No newline at end of file diff --git a/content/research/dimensionalityreduction/featureselection.md b/content/research/dimensionalityreduction/featureselection.md new file mode 100644 index 0000000..02df890 --- /dev/null +++ b/content/research/dimensionalityreduction/featureselection.md @@ -0,0 +1,34 @@ +# Feature Selection + +Feature selection is the process of selecting a subset of relevant features for use in model construction. The core idea is that data can contain many features that are redundant or irrelevant. Therefore, removing it will not result in much loss of information. We also wish to remove features that do not help in our goal. + +Feature selection techniques are usually applied in domains where there are many features and comparatively few samples. + +## Techniques + +The brute force feature selection method exists to exhaustively evaluate all possible combinations of the input features, and find the best subset. The computational cost of this approach is prohibitively high and includes a considerable risk of overfitting to the data. + +The techniques below describe greedy approaches to this problem. Greedy algorithms are ones that don't search the entire possible space but instead converges towards local maximums/minimums. + +### Wrapper Methods + +This uses a predictive model to score feature subsets. Each new subset is used to train a model, which is tested on a hold-out set. The error rate of the model results in a score for that subset. This method is computationally intensive, but usually provides the best performing feature set for that particular type of model. + +### Filter Methods + +This method uses a proxy measure instead of the error rate. The proxy measure can be specifically chosen to be faster to compute while still capturing the essence of the feature set. Common implementations include: + +- Mutual information +- Pointwise mutual information +- Pearson product-moment correlation coefficient +- Relief-based algorithms +- Inter/intra class distances +- Scores of significance tests + +Many filters provide a feature ranking rather than producing an explicit best feature subset + +### Embedded Methods + +This is a catch-all group of techniques which perform feature selection as part of the model. For example, the LASSO linear model penalizes the regression coefficients shrinking unimportant ones to zero. + +Stepwise regression is a commonly used feature selection technique that acts greedily by adding the feature that results in the best result each turn. \ No newline at end of file diff --git a/content/research/dimensionalityreduction/intro.md b/content/research/dimensionalityreduction/intro.md new file mode 100644 index 0000000..b26faf3 --- /dev/null +++ b/content/research/dimensionalityreduction/intro.md @@ -0,0 +1,30 @@ +# Introduction to Dimensionality Reduction + +## Motivations + +We all have problems to solve, but the data we might have at our disposal is too sparse or has too many features that it makes it computationally difficult or maybe even impossible to solve the problem. + +### Types of Problems + +**Prediction**: This is taking some input and trying to predict an output of it. An example includes having a bunch of labeled pictures of people and having the computer predict who is in the next picture taken. (Face or Object Recognition) + +**Structure Discovery**: Find an alternative representation of the data. Usually used to find groups or alternate visualizations + +**Density Estimation**: Finding the best model that describes the data. An example includes explaining the price of a home depending on several factors. + +## Advantages + +- Reduces the storage space of data (possibly removing noise in the process!) +- Decreases complexity making algorithms run faster +- Removes multi-collinearity which in turn likely improves the performance of a given machine learning model + - Multi-collinearity usually indicates that multiple variables are correlated with each other. Most models make use of independent features to simplify computations. Therefore, ensuring independent features is important. +- Data becomes easier to visualize as it can be projected into 2D/3D space +- Lessens the chance of models *overfitting* + - This typically happens when you have less observations compared to variables (also known as sparse data) + - Overfitting leads to a model being able to have high accuracy on the test set, but generalize poorly to reality. +- Curse of dimensionality does not apply in resulting dataset + - Curse of dimensionality is that in high dimensional spaces, all points become equidistant + +## Disadvantages + +Data is lost through this method, potentially resulting in possibly insightful information being removed. Features from dimensionality reduction are typically harder to interpret leading to more confusing models. \ No newline at end of file diff --git a/content/research/dimensionalityreduction/optimalitycriteria.md b/content/research/dimensionalityreduction/optimalitycriteria.md new file mode 100644 index 0000000..035d250 --- /dev/null +++ b/content/research/dimensionalityreduction/optimalitycriteria.md @@ -0,0 +1,99 @@ +# Optimality Criteria + +Falling under wrapper methods, optimality criterion are often used to aid in model selection. These criteria provide a measure of fit for the data to a given hypothesis. + +## Akaike Information Criterion (AIC) + +AIC is an estimator of relative quality of statistical models for a given set of data. Given a collection of models for the data, AIC estimates the quality of each model relative to each other. + +This way, AIC provides a means for model selection. AIC offers an estimate of the relative information lost when a given model is used. + +This metric does not say anything about the absolute quality of a model but only serves for comparison between models. Therefore, if all the candidate models fit poorly to the data, AIC will not provide any warnings. + +It is desired to pick the model with the lowest AIC. + +AIC is formally defined as +$$ +AIC = 2k - 2\ln{(\hat{L})} +$$ + + +## Bayesian Information Criterion (BIC) + +This metric is based on the likelihood function and is closely related to the Akaike information criterion. It is desired to pick the model with the lowest BIC. + +BIC is formally defined as +$$ +BIC = \ln{(n)}k - 2\ln{(\hat{L})} +$$ + +Where $\hat{L}$ is the maximized value of the likelihood function for the model $M$. +$$ +\hat{L} = p(x | \hat{\theta}, M) +$$ +$x$ is the observed data, $n$ is the number of observations, and $k$ is the number of parameters estimated. + + + +### Properties of BIC + +- It is independent from the prior +- It penalizes the complexity of the model in terms of the number of parameters + +### Limitations of BIC + +- Approximations are only valid for sample sizes much greater than the number of parameters (dense data) +- Cannot handle collections of models in high dimension + +### Differences from AIC + +AIC is mostly used when comparing models. BIC asks the question of whether or not the model resembles reality. Even though they have similar functions, they are separate goals. + +## Mallow's $C_p$ + +$C_p$ is used to assess the fit of a regression model that has been estimated using ordinary least squares. A small value of $C_p$ indicates that the model is relatively precise. + +The $C_p$ of a model is defined as +$$ +C_p = \frac{\sum_{i =1}^N{(Y_i - Y_{pi})^2}}{S^2}- N + 2P +$$ + +- $Y_pi$ is the predicted value of the $i$th observation of $Y$ from the $P$ regressors + +- $S^2$ is the residual mean square after regression on the complete set of regressors and can be estimated by mean square error $MSE$, + +- $N$ is the sample size. + +An alternative definition is + + +$$ +C_p = \frac{1}{n}(RSS + 2d\hat{\sigma}^2) +$$ + +- $RSS$ is the residual sum of squares +- $d$ is the number of predictors +- $\hat{\sigma}^2$ refers to an estimate of the variances associated with each response in the linear model + +## Deviance Information Criterion + +The DIC is a hierarchical modeling generalization of the AIC and BIC. it is useful in Bayesian model selection problems where posterior distributions of the model was obtained by a Markov Chain Monte Carlo simulation. + +This method is only valid if the posterior distribution is approximately multivariate normal. + +Let us define the deviance as +$$ +D(\theta) = -2\log{(p(y|\theta))} + C +$$ +Where $y$ is the data and $\theta$ are the unknown parameters of the model. + +Let us define a helper variable $p_D$ as the following +$$ +p_D = \frac{1}{2}\hat{Var}(D(\theta)) +$$ +Finally the deviance information criterion can be calculated as +$$ +DIC = D(\bar{\theta}) + 2p_D +$$ +Where $\bar{theta}$ is the expectation of $\theta$. + diff --git a/content/research/dimensionalityreduction/syllabus.md b/content/research/dimensionalityreduction/syllabus.md new file mode 100644 index 0000000..fbdd26d --- /dev/null +++ b/content/research/dimensionalityreduction/syllabus.md @@ -0,0 +1,71 @@ +# Dimensionality Reduction Study + +Dimensionality reduction is the process of reducing the number of random variables under consideration. This study will last for 10 weeks, meeting twice a week for about an hour. + +## Introduction to Dimensionality Reduction (0.5 Week) + +- Motivations for dimensionality reduction +- Advantages of dimensionality reduction +- Disadvantages of dimensionality reduction + +## Feature Selection (3 Weeks) + +This is the process of selecting a subset of relevant features. The central premise of this technique is that many features are either redundant or irrelevant and thus can be removed without incurring much loss of information. + +### Metaheuristic Methods (1.5 Weeks) + +- Filter Method +- Wrapper Method +- Embedded Method + +### Optimality Criteria (0.5 Weeks) + +- Bayesian Information Criterion +- Mallow's C +- Akaike Information Criterion + +### Other Feature Selection Techniques (1 Week) + +- Subset Selection +- Minimum-Redundancy-Maximum-Relevance (mRMR) feature selection +- Global Optimization Formulations +- Correlation Feature Selection + +### Applications of Metaheuristic Techniques (0.5 Weeks) + +- Stepwise Regression +- Branch and Bound + +## Feature Extraction (6 Weeks) + +Feature extraction transforms the data in high-dimensional space to a space of fewer dimensions. In other words, feature extraction involves reducing the amount of resources required to describe a large set of data. + +### Linear Dimensionality Reduction (3 Weeks) + +- Principal Component Analysis (PCA) +- Singular Value Decomposition (SVD) +- Non-Negative Matrix Factorization +- Linear Discriminant Analysis (LDA) +- Multidimensional Scaling (MDS) +- Canonical Correlation Analysis (CCA) [If Time Permits] +- Linear Independent Component Analysis [If Time Permits] +- Factor Analysis [If Time Permits] + +### Non-Linear Dimensionality Reduction (3 Weeks) + +One approach to the simplification is to assume that the data of interest lie on an embedded non-linear manifold within higher-dimensional space. + +- Kernel Principal Component Analysis +- Nonlinear Principal Component Analysis +- Generalized Discriminant Analysis (GDA) +- T-Distributed Stochastic Neighbor Embedding (T-SNE) +- Self-Organizing Map +- Multifactor Dimensionality Reduction (MDR) +- Isomap +- Locally-Linear Embedding +- Nonlinear Independent Component Analysis +- Sammon's Mapping [If Time Permits] +- Hessian Eigenmaps [If Time Permits] +- Diffusion Maps [If Time Permits] +- RankVisu [If Time Permits] + diff --git a/content/research/lunac.md b/content/research/lunac.md new file mode 100644 index 0000000..39af59e --- /dev/null +++ b/content/research/lunac.md @@ -0,0 +1,17 @@ +--- +Title: LUNA-C Cluster +Description: Building a Beowulf Cluster for the University +showthedate: false +--- + +# LUNA-C + +LUNA-C stands for Large Universal Network Array of Computers and it was a project started back in August 2017 to introduce a cluster computing system to the University. I started this project in response to a want for more computing power to help with the Physics research I was doing at the time. + +I started this project and wrote a grant proposal and have brought on many students to help make this dream come true. The resources below give a look into all the thoughts and ideas that went along with the project. + +[May 2018 Poster](poster.pdf) + +[August 2018 Report](report.pdf) + +[June 2019 Presentation](/files/slides/buildinglinuxcluster.pdf) \ No newline at end of file diff --git a/content/research/lunac/LUNA-C Cluster Report.pdf b/content/research/lunac/LUNA-C Cluster Report.pdf new file mode 100644 index 0000000..12ac30c Binary files /dev/null and b/content/research/lunac/LUNA-C Cluster Report.pdf differ diff --git a/content/research/lunac/LUNACposter.pdf b/content/research/lunac/LUNACposter.pdf new file mode 100644 index 0000000..675ff16 Binary files /dev/null and b/content/research/lunac/LUNACposter.pdf differ diff --git a/content/research/physics.md b/content/research/physics.md new file mode 100644 index 0000000..6c6765f --- /dev/null +++ b/content/research/physics.md @@ -0,0 +1,13 @@ +--- +Title: Physics +Description: Help with Physics Research Projects +showthedate: false +--- + +## Physics Research + +For the two projects below, I worked on Quantum Research in a physics lab with a fellow student Hannah Killian and an advisor Dr. Hai Nguyen. I mostly assisted with the software support for the project and assisted in the mathematics in whatever way I can. + +[Modeling Population Dynamics of Incoherent and Coherent Excitation](/files/research/modellingpopulationdynamics.pdf) + +[Coherent Control of Atomic Population Using the Genetic Algorithm](/files/research/coherentcontrolofatomicpopulation.pdf) \ No newline at end of file diff --git a/content/research/progcomp.md b/content/research/progcomp.md new file mode 100644 index 0000000..6c6ec10 --- /dev/null +++ b/content/research/progcomp.md @@ -0,0 +1,14 @@ +--- +Title: Programming Competition +Description: Competition on Algorithms and Data Structures +showthedate: false +--- + +# Programming Competition +Back in the Fall of 2018, Harrison Crosse, Clare Arrington, and I all formed a team to compete in a programming competition. + +I didn't make many notes for this, but below are the ones I did make for this. + +[Strings](strings) + +[Number Theory](numbertheory) \ No newline at end of file diff --git a/content/research/progcomp/numbertheory.md b/content/research/progcomp/numbertheory.md new file mode 100644 index 0000000..78ad9b1 --- /dev/null +++ b/content/research/progcomp/numbertheory.md @@ -0,0 +1,295 @@ +# Number Theory + +## Prime Numbers + +A *prime number* is an integer $p > 1$ which is only divisible by $1$ and itself. + +If $p$ is a prime number, then $p = ab$ for integers $a \le b$ implies that $a = 1$ and $b = p$. + +### Definitions + +**Fundamental Theorem of Arithmetic**: Every integer can be expressed in only one way as a product of primes. + +**Prime factorization of $n$**: The unique set of numbers multiplying to $n$. + +**Factor**: A prime number $p$ is a *factor* of $x$ if it appears in its prime factorization. + +**Composite**: A number which is not prime + +### Finding Primes + +The easiest way to test if a given number $x$ is repeated division + +- After testing two, we only need to check odd numbers afterwards +- We only need to check until $\sqrt{x}$ since two numbers are perhaps multiplied to achieve $x$. + +#### Considerations if you don't have nice things + +The terminating condition of $i > \sqrt{x}$ is somewhat problematic, because `sqrt()` is a numerical function with imperfect precision. + +To get around this, you can change the termination condition to $i^2 > x$. Though then we get into the problem of potential overflow when working on large integers. + +The best solution if you have to deal with these issues is to compute $(i + 1)^2$ based on the result from $i^2$. +$$ +\begin{align*} +(i + 1)^2 &= i^2 + 2i + 1 +\end{align*} +$$ +So just add $(2i + 1)$ to the previous result. + +## Divisibility + +A lot of number theory concerns itself with the study of integer divisibility. + +### Definition + +**Divides:** We say that $b$ *divides* $a$ (denoted $b|a$) if $a = bk$ for some integer $k$. + +**Divisor:** If the above is true, then we say that $b$ is a *divisor* of $a$ + +**Multiple:** Given the above, we say that $a$ is a multiple of $b$. + +As a consequence of this definition, the smallest natural divisor of every non-zero integer is $1$. This is also known as the *least common divisor*. + +**Greatest Common Divisor $(gcd)$:** the *largest* divisor shared by a given pair of integers. + +**Relatively Prime**: Two integers are *relatively prime* if their greatest common divisor is $1$. + +**Reduced Form:** A fraction is said to be in *reduced form* if the greatest common divisor between the numerator and denominator is $1$. + +### Properties + +The greatest common divisor an integer has with itself is itself. +$$ +gcd(b, b) = b \tag{1.1} +$$ +The ordering of arguments to $gcd$ doesn't matter. Traditionally the larger value is placed in the first argument. +$$ +gcd(a, b) = gcd(b, a) \tag{1.2} +$$ +The greatest common divisor if $b$ divides $a$ between $a$ and $b$ is $b$. +$$ +b | a \implies gcd(a, b) = b \tag{1.3} +$$ + +This in part is because of two observations + +- $b$ is the greatest common divisor of $b$ from $(1.1)$ +- $b$ divides $a$, therefore it's a common divisor + +The greatest common divisor between $a$ and $b$ where $a = bt + r$ is the same as the greatest common divisor between $b$ and $r$. +$$ +a = bt + r \implies gcd(a, b) = gcd(b, r) \tag{1.4} +$$ +Let's work this out: $gcd(a, b) = gcd(bt + r, b)$. Since $bt$ is a multiple of $b$, we can add and subtract as many $bt$'s as we want without influencing the answer. This leads to $gcd(bt + r, b) = gcd(r, b) = gcd(b, r)$. + +### Euclid's Algorithm + +Using $(1.4)$ we can rewrite greatest common divisor problems in terms of the property in order to simplify the expression. Take a look at the example below: +$$ +\begin{align*} +gcd(34398, 2131) &= gcd(34398 \text{ mod } 2132, 2132) = gcd(2132, 286) \\ +gcd(2132, 286) &= gcd(2132 \text{ mod } 286, 286,) = gcd(286, 130) \\ +gcd(286, 130) &= gcd(286 \text{ mod } 130, 130) = gcd(130, 26) \\ +gcd(130, 26) &= gcd(130 \text{ mod } 26, 26,) = gcd(26, 0) +\end{align*} +$$ +Therefore, $gcd(34398, 2132) = 26$. + +### Least Common Multiple + +#### Definition + +The *least common multiple* $(lcm)$ is the smallest integer which is divided by both of a given pair of integers. Ex: $lcm(24, 36) = 72$. + +#### Properties + +The least common multiple of $x$ and $y$ is greater (or equal) than both $x$ and $y$. +$$ +lcm(x, y) \ge max(x,y) \tag{2.1} +$$ +The least common multiple of $x$ and $y$ is less than or equal to $x$ and $y$ multiplied together. +$$ +lcm(x, y) \le xy \tag{2.2} +$$ +Coupled with Euclid's algorithm we can derive the property that the least common multiple is equal to the pair of multiplied integers divided by their greatest common divisor. +$$ +lcm(x, y) = xy / gcd(x, y) \tag{2.3} +$$ + +#### Potential Problems + +Least common multiple arises when we want to compute the simultaneous periodicity of two distinct periodic events. When is the next year (after 2000) that the presidential election will coincide with the census? + +These events coincide every twenty years, because $lcm(4, 10) = 20$. + +## Modular Arithmetic + +We are not always interested in full answers, however. Sometimes the remainder suffices for our purposes. + +Example: Suppose your birthday this year falls on a Wednesday. What day of the week will it fall on next year? + +The remainder of the number of days between now and then (365 or 366) mod the number of days in a week. $365$ mod $7 = 1$. Which means that your birthday will fall on a Thursday. + +### Operations of Modular Arithmetic + +**Addition**: $(x + y)$ mod $n$ $=$ $((x $ mod $n) + (y$ mod $n))$ mod $n$ + +Example: How much small change will I have if given \$123.45 by my mother and \$94.67 by my father? +$$ +\begin{align*} +(12345 \text{ mod } 100) + (9467 \text{ mod } 100) &= (45 + 67) \text{ mod } 100 \\ +&= 12 \text{ mod } 100 +\end{align*} +$$ +**Subtraction** (Essentially addition with negatives): + +Example: Based on the previous example, how much small change will I have after spending \$52.53? +$$ +(12 \text{ mod } 100) - (53 \text{ mod } 100) = -41 \text{ mod } 100 = 59 \text{ mod } 100 +$$ +Notice the flip in signs, this can be generalized into the following form: +$$ +x \text{ mod } y = (y - x) \text{ mod } y +$$ +**Multiplication** (Otherwise known as repeated addition): +$$ +xy \text{ mod } n = (x \text{ mod } n)(y \text{ mod } n) \text{ mod n} +$$ +Example: How much change will you have if you earn \$17.28 per hour for 2,143 hours? +$$ +\begin{align*} +(1728 * 2143) \text{ mod } 100 &= (28 \text{ mod } 100)(43 \text{ mod 100}) \\ +&= 4 \text{ mod } 100 +\end{align*} +$$ +**Exponentiation** (Otherwise known as repeated multiplication): +$$ +x^y \text{ mod } n =(x \text{ mod n})^y \text{ mod } n +$$ +Example: What is the last digit of $2^{100}$? +$$ +\begin{align*} +2^3 \text{ mod } 10 &= 8 \\ +2^6 \text{ mod } 10 &= 8(8) \text{ mod } 10 \rightarrow 4 \\ +2^{12} \text{ mod } 10 &= 4(4) \text{ mod } 10 \rightarrow 6 \\ +2^{24} \text{ mod } 10 &= 6(6) \text{ mod } 10 \rightarrow 6 \\ +2^{48} \text{ mod } 10 &= 6(6) \text{ mod } 10 \rightarrow 6 \\ +2^{96} \text{ mod } 10 &= 6(6) \text{ mod } 10 \rightarrow 6\\ +2^{100} \text{ mod } 10 &= 2^{96}(2^3)(2^1) \text{ mod } 10 \\ + &= 6(8)(2) \text{ mod } 10 \rightarrow 6 +\end{align*} +$$ + +## Linear Congruences + +**Definition:** $ a \equiv b \text{ (mod m)} \iff m |(a-b)$ + +### Properties + +If $a$ mod $m$ is $b$, then $a$ is linearly congruent to $b$ in mod $m$. +$$ +a \text{ mod } m = b \implies a \equiv b \text{ (mod m)} \tag{3.1} +$$ +Let us show that from what we know so far... +$$ +\begin{align*} +a \text{ mod m} = b &\implies a = mk+b \hspace{.2in} \text{(for some $k \in \mathbb{Z}$)} \\ +&\implies a - b = mk + b - b \\ +&\iff a-b = m k \\ +&\iff m | (a - b) \\ +&\iff a \equiv b \hspace{.2in} \text{ (mod m)} +\end{align*} +$$ +**Example:** What set of integers satisfy the following congruence? +$$ +x \equiv 3 \text{ mod } 9 +$$ +**Scratch work:** +$$ +\begin{align*} +x \equiv 3 \text{ mod } 9 &\iff 9 | (x - 3) \\ +&\iff x - 3 = 9k \hspace{.2in} \text{ (for some $k \in \mathbb{Z}$)} \\ +&\iff x = 9k - 3 +\end{align*} +$$ + +### Operations on congruences + +#### Addition/Subtraction + +$$ +a \equiv b \text{ (mod n) and } c \equiv d \text{ (mod n) } \implies a + c \equiv b + d \text{ (mod n)} \tag{3.2} +$$ + +*Proof.* +$$ +\begin{align*} +a \equiv b \text{ (mod n) } &\implies n | (a - b) \\ +&\implies a - b = nk_1 \hspace{.2in} \text{ (for some $k_1 \in \mathbb{Z}$)} \\ +&\implies a = nk_1 + b\\ +c \equiv d \text{ (mod n) } &\implies n | (c - d) \\ +&\implies c - d = nk_2 \hspace{.2in} \text{ (for some $k_2 \in \mathbb{Z}$)} \\ +&\implies c = nk_2 + d \\ +a + c &= nk_1 + b + nk_2 + d \\ +&= n(k_1 + k_2) + (b + d) \\ +&=nk + (b + d) \hspace{.2in} \text{(for some $k \in \mathbb{Z}$)} \\ +&\implies (a + c) \text{ mod } n = b + d \\ +&\implies a+c \equiv b + d \text{ (mod n)} +\end{align*} +$$ + +#### Multiplication + +$$ +a \equiv b \text{ (mod n) } \implies ad \equiv bd \text{ (mod n)} \tag{3.3} +$$ + +*Proof.* +$$ +\begin{align*} +a \equiv b \text{ (mod n) } &\implies n | (a - b) \\ +&\implies a - b = nk_1 \hspace{.2in} \text{ (for some $k_1 \in \mathbb{Z}$)} \\ +&\implies d(a - b) = d(nk_1) \\ +&\implies da-db = n(dk_1) \\ +&\implies n | (da-db) \\ +&\implies da \equiv db \text{ (mod n)} +\end{align*} +$$ +Next Theorem +$$ +a \equiv b \text{ (mod n) and } c \equiv d \text{ (mod n) } \implies ac \equiv bd \text{ (mod n) } +$$ +*Proof.* +$$ +\begin{align*} +a \equiv b \text{ (mod n) } &\implies a = nk_1 + b \hspace{.2in} \text{ (for some $k_1 \in \mathbb{Z}$)} \\ +c \equiv d \text{ (mod n)} &\implies c = nk_2 + d \hspace{.2in} \text{ (for some $k_2 \in \mathbb{Z}$)} \\ +a * c &= (nk_1 + b)(nk_2+d) \\ + &=n^2k_1k_2 + bnk_2+dnk_1 +bd \\ + &= n(nk_1k_2+bk_2+dk_2) + bd \\ + &\implies ac \text{ mod } n = bd \\ + ac &\equiv bd \text{ (mod n)} +\end{align*} +$$ + +#### Division + +Let us define division as so +$$ +bb^{-1} \equiv 1 \text{ (mod n)} \\ +$$ +Theorem. +$$ +ad \equiv bd \text{ (mod dn) } \iff a \equiv b \text{ (mod n) } +$$ +*Proof.* +$$ +\begin{align*} +ad \equiv bd \text{ (mod dn) } &\implies ad - bd = dnk \\ +&\implies d(a-b) = d(nk) \\ +&\implies a-b = nk \\ +&\implies n | (a-b) \\ +&\implies a \equiv b \text{ (mod n)} +\end{align*} +$$ diff --git a/content/research/progcomp/strings.md b/content/research/progcomp/strings.md new file mode 100644 index 0000000..4051955 --- /dev/null +++ b/content/research/progcomp/strings.md @@ -0,0 +1,15 @@ +# Strings + +## Character Codes + +Character codes are mappings between numbers and symbols which make up a particular alphabet. + +The *American Standard Code for Information Interchange* (ASCII) is a single-byte character code where $2^7 = 128$ characters are specified. + +Symbol assignments were not done at random. Several interesting properties of the design make programming tasks easier: + +- All non-printable characters have either the first three bits as zero or all seven lowest bits as one. This makes it easy to eliminate them before displaying junk. +- Both the upper and lower case letters and the numerical digits appear sequentially +- We can get the numeric order of a letter by subtracting the first letter +- We can convert a character from uppercase to lowercase by $Letter - "A" + "a"$ + diff --git a/content/research/proglang.md b/content/research/proglang.md new file mode 100644 index 0000000..75a50e4 --- /dev/null +++ b/content/research/proglang.md @@ -0,0 +1,12 @@ +--- +Title: Programming Languages +Description: Designing and Implementing Programming Languages +showthedate: false +--- + +# Programming Languages +Back in the Fall of 2018, under the guidance of Ian Finlayson, I worked towards creating a programming language similar to SLOTH (Simple Language of Tiny Heft). The language as of now is interpreted and supports array based programming. + +[Github repository](https://github.com/brandon-rozek/sloth) outlining my work. + +[Short Notes](types) on Types of Programming Languages \ No newline at end of file diff --git a/content/research/proglang/types.md b/content/research/proglang/types.md new file mode 100644 index 0000000..5917223 --- /dev/null +++ b/content/research/proglang/types.md @@ -0,0 +1,243 @@ +# Types of Programming Languages + +Mostly content from Wikipedia + +https://en.wikipedia.org/wiki/List_of_programming_languages_by_type#Hardware_description_languages + +## Array Languages + +Array programming languages generalizes operations on scalars to apply transparently to vectors, matrices, and higher-dimensional arrays. + +Example Language: R + +In R everything is by default a vector, typing in + +```R +x <- 5 +``` + +Will create a vector of length 1 with the value 5. + +This is commonly used by the scientific and engineering community. Other languages include MATLAB, Octave, Julia, and the NumPy extension to Python. + +## Constraint Programming Languages + +A declarative programming language where relationships between variables are expressed as constraints. Execution proceeds by attempting to find values for the variables that satisfy all declared constraints. + +Example: Microsoft Z3 Theorem Prover + +```z3 +(declare-const a Int) +(declare-fun f (Int Bool) Int) +(assert (> a 10)) +(assert (< (f a true) 100)) +(check-sat) +``` + +## Command Line Interface Languages + +Commonly used to control jobs or processes + +```bash +#!/bin/bash +echo "hello, $USER. I wish to list some files of yours" +echo "listing files in the current directory, $PWD" +ls # list files +``` + +## Concurrent Languages + +Languages that support language constructs for concurrency. These may involve multi-threading, distributed computing, message passing, shared resources, and/or future and promises. + +Example: Erlang + +```erlang +ping(0, Pong_PID) -> + Pong_PID ! finished, + io:format("ping finished~n", []); + +ping(N, Pong_PID) -> + Pong_PID ! {ping, self()}, + receive + pong -> + io:format("Ping received pong~n", []) + end, + ping(N - 1, Pong_PID). + +pong() -> + receive + finished -> + io:format("Pong finished~n", []); + {ping, Ping_PID} -> + io:format("Pong received ping~n", []), + Ping_PID ! pong, + pong() + end. + +start() -> + Pong_PID = spawn(tut15, pong, []), + spawn(tut15, ping, [3, Pong_PID]). +``` + + + +## Data-oriented Languages + +These languages provide powerful ways of searching and manipulating relations. + +Example: SQL + +```sql +SELECT * FROM STATION +WHERE 50 < (SELECT AVG(TEMP_F); +``` + +Give all the information from stations whose average temperature is above 50 degrees F + +## Declarative Languages + +Declarative languages express the logic of a computation without describing its control flow in detail + +Example: SQL again + +The example code above doesn't tell the computer how to perform the query, just what you want. + +## Functional Languages + +Style of computer programs that treat computation as the evaluation of mathematical functions and avoid changing-state and having mutable data. + +```haskell +primes = filterPrime [2..] + where filterPrime (p:xs) = + p : filterPrime [x | x <- xs, x `mod` p /= 0] +``` + +## Imperative Languages + +The use of statements to change a program's state + +Example: C + +```c +#define FOOSIZE 10 +struct foo fooarr[FOOSIZE]; + +for(i = 0; i < FOOSIZE; i++) +{ + do_something(fooarr[i].data); +} +``` + + + +## Iterative Languages + +Languages built around or offering generators + +Example: Python + +```python +def countfrom(n): + while True: + yield n + n += 1 + +g = countfrom(0) +next(g) # 0 +next(g) # 1 +``` + +## List-based Languages -LISPs + +Family of programming languages with a history of fully parenthesized prefix notation. + +Example: Common Lisp + +```commonlisp + ;; Sorts the list using the > and < function as the relational operator. + (sort (list 5 2 6 3 1 4) #'>) ; Returns (6 5 4 3 2 1) + (sort (list 5 2 6 3 1 4) #'<) ; Returns (1 2 3 4 5 6) +``` + +## Logic Languages + +Programming paradigm based on formal logic. Expressions are written stating the facts and rules about some problem domain. + +Example: Prolog + +```prolog +mother_child(trude, sally). + +father_child(tom, sally). +father_child(tom, erica). +father_child(mike, tom). + +sibling(X, Y) :- parent_child(Z, X), parent_child(Z, Y). + +parent_child(X, Y) :- father_child(X, Y). +parent_child(X, Y) :- mother_child(X, Y). +``` + +```prolog +?- sibling(sally, erica). + Yes +``` + +## Symbolic Programming + +A programming paradigm in which the program can manipulate its own formulas and program components as if they were plain data. + +Example: Clojure + +Clojure is written in prefix notation, but with this macro, you can write in infix notation. + +```clojure +(defmacro infix + [infixed] + (list (second infixed) + (first infixed) + (last infixed))) +``` + + + +## Probabilistic Programming Language + +Adds the ability to describe probabilistic models and then perform inference in those models. + +Example: Stan + +```stan +model { + real mu; + + # priors: + L_u ~ lkj_corr_cholesky(2.0); + L_w ~ lkj_corr_cholesky(2.0); + to_vector(z_u) ~ normal(0,1); + to_vector(z_w) ~ normal(0,1); + + for (i in 1:N){ + mu = beta[1] + u[subj[i],1] + w[item[i],1] + + (beta[2] + u[subj[i],2] + w[item[i],2])*so[i]; + rt[i] ~ lognormal(mu,sigma_e); // likelihood + } +} +``` + + + +## Quick Summary of Programming Paradigms + +Imperative + +- Object Oriented +- Procedural + +Declarative + +- Functional +- Logic + +Symbolic Programming + diff --git a/content/research/publications.md b/content/research/publications.md new file mode 100644 index 0000000..35ea97b --- /dev/null +++ b/content/research/publications.md @@ -0,0 +1,22 @@ +--- +Title: Publications +Descriptions: Papers, Presentations, and Grants obtained +ShowDatesOnPosts: false +--- + +# Publications + +Brandon Rozek. "QEP: The Quality Policy Evaluation Algorithm", Research and Creativity Day at University of Mary Washington, 2019. + +Brandon Rozek, Stefano Coronado. "Beowulf Cluster for Research and Education", Research and Creativity Day at University of Mary Washington, 2018. + +Brandon Rozek. "Coherent Control of Atomic Population Using the Genetic Algorithm", Summer Science Institute Research Symposium, 2017. + +Hannah Killian, Brandon Rozek. "Modelling Population Dynamics of Incoherent and Coherent Excitation", Virginia Academy of Science, 2017. + +Hannah Killian, Brandon Rozek. “Modeling Population Dynamics of Incoherent and Coherent Excitation", Research and Creativity Day at University of Mary Washington, 2017. + + +# Grants + +Julia Arrington, Maia Magrakvilidze, Ethan Ramirez, Brandon Rozek "Beowulf Cluster for Research and Education", University of Mary Washington, 2017-2018 School Year diff --git a/content/research/reinforcementlearning.md b/content/research/reinforcementlearning.md new file mode 100644 index 0000000..2dff393 --- /dev/null +++ b/content/research/reinforcementlearning.md @@ -0,0 +1,45 @@ +--- +Title: Reinforcement Learning +Description: The study of optimally mapping situations to actions +--- + +# Reinforcement Learning +Reinforcement learning is the art of analyzing situations and mapping them to actions in order to maximize a numerical reward signal. + +In this independent study, I as well as Dr. Stephen Davies, will explore the Reinforcement Learning problem and its subproblems. We will go over the bandit problem, markov decision processes, and discover how best to translate a problem in order to **make decisions**. + +I have provided a list of topics that I wish to explore in a [syllabus](syllabus) + +## Readings + +In order to spend more time learning, I decided to follow a textbook this time. + +Reinforcement Learning: An Introduction + +By Richard S. Sutton and Andrew G. Barto + + +[Reading Schedule](readings) + + +## Notes + +The notes for this course, is going to be an extreemly summarized version of the textbook. There will also be notes on whatever side tangents Dr. Davies and I explore. + +[Notes page](notes) + +I wrote a small little quirky/funny report describing the bandit problem. Great for learning about the common considerations for Reinforcement Learning problems. + +[The Bandit Report](/files/research/TheBanditReport.pdf) + +## Code + +Code will occasionally be written to solidify the learning material and to act as aids for more exploration. + +[Github Link](https://github.com/brandon-rozek/ReinforcementLearning) + +Specifically, if you want to see agents I've created to solve some OpenAI environments, take a look at this specific folder in the Github Repository + +[Github Link](https://github.com/Brandon-Rozek/ReinforcementLearning/tree/master/agents) + + diff --git a/content/research/reinforcementlearning/notes.md b/content/research/reinforcementlearning/notes.md new file mode 100644 index 0000000..9b84aa1 --- /dev/null +++ b/content/research/reinforcementlearning/notes.md @@ -0,0 +1,12 @@ +# Lecture Notes for Reinforcement Learning + +[Chapter 1: An Introduction](intro) + +[Chapter 2: Multi-armed Bandits](bandits) + +[Chapter 3: Markov Decision Processes](mdp) + +[Chapter 4: Dynamic Programming](dynamic) + +[Chapter 5: Monte Carlo Methods](mcmethods) + diff --git a/content/research/reinforcementlearning/notes/bandits.md b/content/research/reinforcementlearning/notes/bandits.md new file mode 100644 index 0000000..2fabed1 --- /dev/null +++ b/content/research/reinforcementlearning/notes/bandits.md @@ -0,0 +1,144 @@ +# Chapter 2: Multi-armed Bandits + +Reinforcement learning *evaluates* the actions taken rather than accepting $instructions$ of the correct actions. This creates the need for active exploration. + +This chapter of the book goes over a simplified version of the reinforcement learning problem, that does not involve learning to act in more than one situation. This is called a *nonassociative* setting. + +In summation, the type of problem we are about to study is a nonassociative, evaluative feedback problem that is a simplified version of the $k$-armed bandit problem. + +## $K$-armed bandit problem + +Consider the following learning problem. You are faced repeatedly with a choice among $k$ different options/actions. After each choice you receive a numerical reward chosen from a stationary probability distribution that depends on the action you selected. + +Your objective (if you choose to accept it) is to maximize the expected total reward over some time period. Let's say $1000$ time steps. + +### Analogy + +This is called the $k$-armed bandit problem because it's an analogy of a slot machine. Slot machines are nick-named the "one-armed bandit", and the goal here is to play the slot machine that has the greatest value return. + +### Sub-goal + +We want to figure out which slot machine produces the greatest value. Therefore, we want to be able to estimate the value of a slot machine as close to the actual value as possible. + +### Exploration vs Exploitation + +If we maintain estimates of the action values, then at any time step there is at least one action whose estimated value is the greatest. We call these *greedy* actions. When you select one of these actions we say that you are *exploiting* your current knowledge of the values of the actions. + +If you instead select a non-greedy action, then you are *exploring*, because this enables you to better improve your estimate of the non-greedy action's value. + +Uncertainty is such that at least one of the other actions probably better than the greedy action, you just don't know which one yet. + +## Action-value Methods + +In this section, we will look at simple balancing methods in how to gain the greatest reward through exploration and exploitation. + +We begin by looking more closely at some simple methods for estimating the values of actions and for using said estimates to make action selection decisions. + +### Sample-average method + +One natural way to estimate this is by averaging the rewards actually received +$$ +Q_t(a) = \frac{\sum_{i = 1}^{t - 1}R_i * \mathbb{I}_{A_i = 1}}{\sum_{i = 1}^{t - 1}\mathbb{I}_{A_i = 1}} +$$ +where $\mathbb{I}_{predicate}$ denotes the random variable that is 1 if the predicate is true and 0 if it is not. If the denominator is zero (we have not experienced the reward), then we assume some default value such as zero. + +### Greedy action selection + +This is where you choose greedily all the time. +$$ +A_t = argmax_a(Q_t(a)) +$$ + +### $\epsilon$-greedy action selection + +This is where we choose greedily most of the time, except for a small probability $\epsilon$. Where instead of selecting greedily, we select randomly from among all the actions with equal probability. + +### Comparison of greedy and $\epsilon$-greedy methods + +The advantage of $\epsilon$-greedy over greedy methods depends on the task. With noisier rewards it takes more exploration to find the optimal action, and $\epsilon$-greedy methods should fare better relative to the greedy method. However, if the reward variances were zero, then the greedy method would know the true value of each action after trying it once. + +Suppose the bandit task were non-stationary, that is, the true values of actions changed over time. In this case exploration is needed to make sure one of the non-greedy actions has not changed to become better than the greedy one. + +### Incremental Implementation + +There is a way to update averages using small constant computations rather than storing the the numerators and denominators separate. + +Note the derivation for the update formula +$$ +\begin{align} +Q_{n + 1} &= \frac{1}{n}\sum_{i = 1}^n{R_i} \\ +&= \frac{1}{n}(R_n + \sum_{i = 1}^{n - 1}{R_i}) \\ +&= \frac{1}{n}(R_n + (n - 1)\frac{1}{n-1}\sum_{i = 1}^{n - 1}{R_i}) \\ +&= \frac{1}{n}{R_n + (n - 1)Q_n} \\ +&= \frac{1}{n}(R_n + nQ_n - Q_n) \\ +&= Q_n + \frac{1}{n}(R_n - Q_n) \tag{2.3} +\end{align} +$$ +With formula 2.3, the implementation requires memory of only $Q_n$ and $n$. + +This update rule is a form that occurs frequently throughout the book. The general form is +$$ +NewEstimate = OldEstimate + StepSize(Target - OldEstimate) +$$ + +### Tracking a Nonstationary Problem + +As noted earlier, we often encounter problems that are nonstationary, in such cases it makes sense to give more weight to recent rewards than to long-past rewards. One of the most popular ways to do this is to use a constant value for the $StepSize​$ parameter. We modify formula 2.3 to be +$$ +\begin{align} +Q_{n + 1} &= Q_n + \alpha(R_n - Q_n) \\ +&= \alpha R_n + Q_n - \alpha Q_n \\ +&= \alpha R_n + (1 - \alpha)Q_n \\ +&= \alpha R_n + (1 - \alpha)(\alpha R_{n - 1} + (1-\alpha)Q_{n - 1}) \\ +&= \alpha R_n + (1 - \alpha)(\alpha R_{n - 1} + (1-\alpha)(\alpha R_{n - 2} + (1 - a)Q_{n - 2})) \\ +&= \alpha R_n + (1-\alpha)\alpha R_{n - 1} + (1-\alpha)^2\alpha R_{n - 2} + \dots + (1-\alpha)^nQ_1 \\ +&= (1-\alpha)^nQ_1 + \sum_{i = 1}^n{\alpha(1-\alpha)^{n - i}R_i} +\end{align} +$$ +This is a weighted average since the summation of all the weights equal one. Note here that the farther away a value is from the current time, the more times $(1-\alpha)$ gets multiplied by itself. Hence making it less influential. This is sometimes called an *exponential recency-weighted average*. + +### Manipulating $\alpha_n(a)$ + +Sometimes it is convenient to vary the step-size parameter from step to step. We can denote $\alpha_n(a)$ to be a function that determines the step-size parameter after the $n$th selection of action $a$. As noted before $\alpha_n(a) = \frac{1}{n}$ results in the sample average method which is guaranteed to converge to the truth action values assuming a large number of trials. + +A well known result in stochastic approximation theory gives us the following conditions to assure convergence with probability 1: +$$ +\sum_{n = 1}^\infty{\alpha_n(a) = \infty} \and \sum_{n = 1}^{\infty}{\alpha_n^2(a) \lt \infty} +$$ +The first condition is required to guarantee that the steps are large enough to overcome any initial conditions or random fluctuations. The second condition guarantees that eventually the steps become small enough to assure convergence. + +**Note:** Both convergence conditions are met for the sample-average case but not for the constant step-size parameter. The latter condition is violated in the constant parameter case. This is desirable since if the rewards are changing then we don't want it to converge to any one parameter. + +### Optimistic Initial Values + +The methods discussed so far are biased by their initial estimates. Another downside is that these values are another set of parameters that must be chosen by the user. Though these initial values can be used as a simple way to encourage exploration. + +Let's say you set an initial estimate that is wildly optimistic. Whichever actions are initially selected, the reward is less than the starting estimates. Therefore, the learner switches to other actions, being *disappointed* with the rewards it was receiving. + +The result of this is that all actions are tried several times before their values converge. It even does this if the algorithm is set to choose greedily most of the time! + +![1536284892566](/home/rozek/Pictures/1536284892566.png) + +This simple trick is quite effective for stationary problems. Not so much for nonstationary problems since the drive for exploration only happens at the beginning. If the task changes, creating a renewed need for exploration, this method would not catch it. + +### Upper-Confidence-Bound Action Selection + +Exploration is needed because there is always uncertainty about the accuracy of the action-value estimates. The greedy actions are those that look best at the present but some other options may actually be better. Let's choose options that have potential for being optimal, taking into account how close their estimates are to being maximal and the uncertainties in those estimates. +$$ +A_t = argmax_a{(Q_t(a) + c\sqrt{\frac{ln(t)}{N_t(a)}})} +$$ +where $N_t(a)$ denotes the number of times that $a$ has been selected prior to time $t$ and $c > 0$ controls the degree of exploration. + +###Associative Search (Contextual Bandits) + +So far, we've only considered nonassociative tasks, where there is no need to associate different actions with different situations. However, in a general reinforcement learning task there is more than one situation and the goal is to learn a policy: a mapping from situations to the actions that are best in those situations. + +For sake of continuing our example, let us suppose that there are several different $k$-armed bandit tasks, and that on each step you confront one of these chosen at random. To you, this would appear as a single, nonstationry $k$-armed bandit task whose true action values change randomly from step to step. You could try using one of the previous methods, but unless the true action values change slowly, these methods will not work very well. + +Now suppose, that when a bandit task is selected for you, you are given some clue about its identity. Now you can learn a policy association each task, singled by the clue, with the best action to take when facing that task. + +This is an example of an *associative search* task, so called because it involves both trial-and-error learning to *search* for the best actions, and *association* of these actions with situations in which they are best. Nowadays they're called *contextual bandits* in literature. + +If actions are allowed to affect the next situation as well as the reward, then we have the full reinforcement learning problem. This will be presented in the next chapter of the book with its ramifications appearing throughout the rest of the book. + +![1536321791927](/home/rozek/Pictures/1536321791927.png) \ No newline at end of file diff --git a/content/research/reinforcementlearning/notes/dynamic.md b/content/research/reinforcementlearning/notes/dynamic.md new file mode 100644 index 0000000..708b258 --- /dev/null +++ b/content/research/reinforcementlearning/notes/dynamic.md @@ -0,0 +1,130 @@ +# Chapter 4: Dynamic Programming + +Dynamic programming refers to a collection of algorithms that can be used to compute optimal policies given a perfect model of the environment as a Markov decision process (MDP). + +Classic DP algorithms are of limited utility due to their assumption of a perfect model and their great computational expense. + +Let's assume that the environment is a finite MDP. We assume its state, action, and reward sets, $\mathcal{S}, \mathcal{A}, \mathcal{R}$ are finite, and that its dynamics are given by a set of probabilities $p(s^\prime, r | s , a)$. + +The key idea of dynamic programming, and of reinforcement learning is the use of value functions to organize and structure the search for good policies. In this chapter, we show how dynamic programming can be used to compute the value functions defined in Chapter 3. We can easily obtain optimal policies once we have found the optimal value functions which satisfy the Bellman optimality equations. + +## Policy Evaluation + +First we consider how to compute the state-value function for an arbitrary policy. The existence and uniqueness of a state-value function for an arbitrary policy are guaranteed as long as either the discount rate is less than one or eventual termination is guaranteed from all states under the given policy. + +Consider a sequence of approximate value functions. The initial approximation, $v_0$, is chosen arbitrarily (except that the terminal state must be given a value of zero) and each successive approximation is obtained by using the Bellman equation for $v_\pi$ as an update rule: +$$ +v_{k + 1} = \sum_{a}{\pi(a |s)\sum_{s^\prime, r}{p(s^\prime,r|s,a)[r + \gamma v_k(s^\prime)]}} +$$ +This algorithm is called *iterative policy evaluation*. + +To produce each successive approximation, $v_{k + 1}$ from $v_k$, iterative policy evaluation applies the same operation to each state $s$: it replaces the old value of $s$ with a new value obtained from the old values of the successor states of $s$, and the expected immediate rewards, along all the one-step transitions possible under the policy being evaluated. + +**Iterative Policy Evaluation** + +``` +Input π, the policy to be evaluated +Initialize an array V(s) = 0, for all s ∈ S+ +Repeat + ∆ ← 0 + For each s ∈ S: + v ← V(s) + V(s) ← ∑_a π(a|s) ∑_s′,r p(s′,r|s,a)[r+γV(s′)] + ∆ ← max(∆,|v−V(s)|) +until ∆ < θ (a small positive number) +Output V ≈ v_π +``` + +### Grid World Example + +Consider a grid world where the top left and bottom right squares are the terminal state. Now consider that every other square, produces a reward of -1, and the available actions on each state is {up, down, left, right} as long as that action keeps the agent on the grid. Suppose our agent follows the equiprobable random policy. + +![1540262811089](/home/rozek/Documents/Research/Reinforcement Learning/1540262811089.png) + +## Policy Improvement + +One reason for computing the value function for a policy is to help find better policies. Suppose we have determined the value function $v_\pi$ for an arbitrary deterministic policy $\pi$. For some state $s$ we would like to know whether or not we should change the policy to determinatically chose another action. We know how good it is to follow the current policy from $s$, that is $v_\pi(s)$, but would it be better or worse to change to the new policy? + +One way to answer this question is to consider selecting $a$ in $s$ and thereafter follow the existing policy, $\pi$. The key criterion is whether the this produces a value greater than or less than $v_\pi(s)$. If it is greater, then one would expect it to be better still to select $a$ every time $s$ is encountered, and that the new policy would in fact be a better one overall. + +That this is true is a special case of a general result called the *policy improvement theorem*. Let $\pi$ and $\pi^\prime$ be any pair of deterministic policies such that for all $s \in \mathcal{S}$. +$$ +q_\pi(s, \pi^\prime(s)) \ge v_\pi(s) +$$ +So far we have seen how, given a policy and its value function, we can easily evaluate a change in the policy at a single state to a particular action. It is a natural extension to consider changes at all states and to all possible actions, selecting at each state the action that appears best according to $q_\pi(s, a)$. In other words, to consider the new *greedy* policy, $\pi^\prime$, given by: +$$ +\pi^\prime = argmax (q_\pi(s, a)) +$$ +So far in this section we have considered the case of deterministic policies. We will not go through the details, but in fact all the ideas of this section extend easily to stochastic policies. + +## Policy Iteration + +Once a policy, $\pi$, has been improved using $v_\pi$ to yield a better policy, $\pi^\prime$, we can then compute $v_{\pi^\prime}$ and improve it again to yield an even better $\pi^{\prime\prime}$. We can thus obtain a sequence of monotonically improving policies and value functions. + +Each policy is guaranteed to be a strict improvement over the previous one (unless its already optimal). Since a finite MDP has only a finite number of policies, this process must converge to an optimal policy and optimal value function in a finite number of iterations. + +This way of finding an optimal policy is called *policy iteration*. + +Algorithm + +``` +1. Initialization + V(s) ∈ R and π(s) ∈ A(s) arbitrarily for all s ∈ S +2. Policy Evaluation + Repeat + ∆ ← 0 + For each s∈S: + v ← V(s) + V(s) ← ∑_{s′,r} p(s′,r|s,π(s))[r + γV(s′)] + ∆ ← max(∆,|v − V(s)|) + until ∆ < θ (a small positive number) +3. Policy Improvement + policy-stable ← true + For each s ∈ S: + old-action ← π(s) + π(s) ← arg max_a ∑_{s′,r} p(s′,r|s,a)[r + γV(s′)] + If old-action != π(s), then policy-stable ← false + If policy-stable, then stop and return V ≈ v_∗, + and π ≈ π_∗; else go to 2 +``` + +## Value Iteration + +One drawback to policy iteration is that each of its iterations involve policy evaluation, which may itself be a protracted iterative computation requiring multiple sweeps through the state set. If policy evaluation is done iteratively, then convergence exactly to $v_\pi$ occurs only in the limit. Must we wait for exact convergence, or can we stop short of that? + +In fact, the policy evaluation step of policy iteration can be truncated in several ways without losing the convergence guarantee of policy iteration. One important special case is when policy evaluation is stopped after one sweep. This algorithm is called value iteration. + +Another way of understanding value iteration is by reference to the Bellman optimality equation. Note that value iteration is obtained simply by turning the Bellman optimality equation into an update rule. Also note how value iteration is identical to the policy evaluation update except that it requires the maximum to be taken over all actions. + +Finally, let us consider how value iteration terminates. Like policy evaluation, value iteration formally requires an infinite number of iterations to converge exactly. In practice, we stop once the value function changes by only a small amount. + +``` +Initialize array V arbitrarily (e.g., V(s) = 0 for all +s ∈ S+) + +Repeat + ∆ ← 0 + For each s ∈ S: + v ← V(s) + V(s) ← max_a∑_{s′,r} p(s′,r|s,a)[r + γV(s′)] + ∆ ← max(∆, |v − V(s)|) +until ∆ < θ (a small positive number) + +Output a deterministic policy, π ≈ π_∗, such that + π(s) = arg max_a ∑_{s′,r} p(s′,r|s,a)[r + γV(s′)] +``` + +Value iteration effectively combines, in each of its sweeps, one sweep of policy evaluation and one sweep of policy improvement. Faster convergence is often achieved by interposing multiple policy evaluation sweeps between each policy improvement sweep. + +## Asynchronous Dynamic Programming + +*Asynchronous* DP algorithms are in-place DP algorithms that are not organized in terms of systematic sweeps of the state set. These algorithms update the values of states in any order whatsoever, using whatever value of other states happen to be available. + +To converge correctly, however, an asynchronous algorithm must continue to update the value of all the states: it can't ignore any state after some point in the computation. + +## Generalized Policy Iteration + +Policy iteration consists of two simultaneous, iterating processes, one making the value function consistent with the current policy (policy evaluation) and the other making the policy greedy with respect to the current value function (policy improvement). + +We use the term *generalized policy iteration* (GPI) to competing and cooperating. They compete in the sense that they pull in opposing directions. Making the policy greedy with respect to the value function typically makes the value function incorrect for the changed policy. Making the value function consistent with the policy typically causes the policy to be greedy. In the long run, however, the two processes interact to find a single joint solution. + diff --git a/content/research/reinforcementlearning/notes/intro.md b/content/research/reinforcementlearning/notes/intro.md new file mode 100644 index 0000000..5b378ba --- /dev/null +++ b/content/research/reinforcementlearning/notes/intro.md @@ -0,0 +1,66 @@ +# Introduction to Reinforcement Learning Day 1 + +Recall that this course is based on the book -- + +Reinforcement Learning: An Introduction by Richard S. Sutton and Andrew G. Barto + + + +These notes really serve as talking points for the overall concepts described in the chapter and are not meant to stand for themselves. Check out the book for more complete thoughts :) + + + +**Reinforcement Learning** is learning what to do -- how to map situations to actions -- so as to maximize a numerical reward signal. There are two characteristics, trial-and-error search and delayed reward, that are the two most important distinguishing features of reinforcement learning. + + + +Markov decision processes are intended to include just these three aspects: sensation, action, and goal(s). + + + +Reinforcement learning is **different** than the following categories + +- Supervised learning: This is learning from a training set of labeled examples provided by a knowledgeable external supervisor. In interactive problems it is often impractical to obtain examples of desired behavior that are both correct and representative of all situations in which the agent has to act. +- Unsupervised learning: Reinforcement learning is trying to maximize a reward signal as opposed to finding some sort of hidden structure within the data. + + + +One of the challenges that arise in reinforcement learning is the **trade-off** between exploration and exploitation. The dilemma is that neither exploration nor exploitation can be pursued exclusively without failing at the task. + + + +Another key feature of reinforcement learning is that it explicitly considers the whole problem of a goal-directed agent interacting with an uncertain environment. This is different than supervised learning since they're concerned with finding the best classifier/regression without explicitly specifying how such an ability would finally be useful. + + + +A complete, interactive, goal-seeking agent can also be a component of a larger behaving system. A simple example is an agent that monitors the charge level of a robot's battery and sends commands to the robot's control architecture. This agent's environment is the rest of the robot together with the robot's environment. + + + +## Definitions + +A policy defines the learning agent's way of behaving at a given time + + + +A reward signal defines the goal in a reinforcement learning problem. The agent's sole objective is to maximize the total reward it receives over the long run + + + +A value function specifies what is good in the long run. Roughly speaking, the value of a state is the total amount of reward an agent can expect to accumulate over the future, starting from that state. Without rewards there could be no value,s and the only purpose of estimating values is to achieve more reward. We seek actions that bring about states of highest value. + + + +Unfortunately, it is much harder to determine values than it is to determine rewards. The most important component of almost all reinforcement learning algorithms we consider is a method for efficiently estimating values. + + + +**Look at Tic-Tac-Toe example** + + + +Most of the time in a reinforcement learning algorithm, we move greedily, selecting the move that leads to the state with greatest value. Occasionally, however, we select randomly from amoung the other moves instead. These are called exploratory moves because they cause us to experience states that we might otherwise never see. + + + +Summary: Reinforcement learning is learning by an agent from direct interaction wit its environment, without relying on exemplary supervision or complete models of the environment. \ No newline at end of file diff --git a/content/research/reinforcementlearning/notes/mcmethods.md b/content/research/reinforcementlearning/notes/mcmethods.md new file mode 100644 index 0000000..51543e8 --- /dev/null +++ b/content/research/reinforcementlearning/notes/mcmethods.md @@ -0,0 +1,110 @@ +# Chapter 5: Monte Carlo Methods + +Monte Carlo methods do not assume complete knowledge of the environment. They require only *experience* which is a sample sequence of states, actions, and rewards from actual or simulated interaction with an environment. + +Monte Carlo methods are ways of solving the reinforcement learning problem based on averaging sample returns. To ensure that well-defined returns are available, we define Monte Carlo methods only for episodic tasks. Only on the completion of an episode are value estimates and policies changed. + +Monte Carlo methods sample and average returns for each state-action pair is much like the bandit methods explored earlier. The main difference is that there are now multiple states, each acting like a different bandit problems and the problems are interrelated. Due to all the action selections undergoing learning, the problem becomes nonstationary from the point of view of the earlier state. + +## Monte Carlo Prediction + +Recall that the value of a state is the expected return -- expected cumulative future discounted reward - starting from that state. One way to do it is to estimate it from experience by averaging the returns observed after visits to that state. + +Each occurrence of state $s$ in an episode is called a *visit* to $s$. The *first-visit MC method* estimates $v_\pi(s)$ as the average of the returns following first visits to $s$, whereas the *every-visit MC method* averages the returns following all visits to $s$. These two Monte Carlo methods are very similar but have slightly different theoretical properties. + +First-visit MC prediction + +``` +Initialize: + π ← policy to be evaluated + V ← an arbitrary state-value function + Returns(s) ← an empty list, for all s ∈ S + +Repeat forever: + Generate an episode using π + For each state s appearing in the episode: + G ← the return that follows the first occurrence of +s + Append G to Returns(s) + V(s) ← average(Returns(s)) +``` + +## Monte Carlo Estimation of Action Values + +If a model is not available then it is particularly useful to estimate *action* values rather than state values. With a model, state values alone are sufficient to define a policy. Without a model, however, state values alone are not sufficient. One must explicitly estimate the value of each action in order for the values to be useful in suggesting a policy. + +The only complication is that many state-action pairs may never be visited. If $\pi$ is a deterministic policy, then in following $\pi$ one will observe returns only for one of the actions from each state. With no returns to average, the Monte Carlo estimates of the other actions will not improve with experience. This is a serious problem because the purpose of learning action values is to help in choosing among the actions available in each state. + +This is the general problem of *maintaining exploration*. For policy evaluation to work for action values, we must assure continual exploration. One way to do this is by specifying that the episodes *start in a state-action pair*, and that each pair has a nonzero probability of being selected as the start. We call this the assumption of *exploring starts*. + +## Monte Carlo Control + +We made two unlikely assumptions above in order to easily obtain this guarantee of convergence for the Monte Carlo method. One was that the episodes have exploring starts, and the other was that policy evaluation could be done with an infinite number of episodes. + +Monte Carlo Exploring Starts + +``` +Initialize, for all s ∈ S, a ∈ A(s): + Q(s,a) ← arbitrary + π(s) ← arbitrary + Returns(s,a) ← empty list + +Repeat forever: + Choose S_0 ∈ S and A_0 ∈ A(S_0) s.t. all pairs have probability > 0 + Generate an episode starting from S_0,A_0, following +π + For each pair s,a appearing in the episode: + G ← the return that follows the first occurrence of +s,a + Append G to Returns(s,a) + Q(s,a) ← average(Returns(s,a)) + For each s in the episode: + π(s) ← arg max_a Q(s,a) +``` + +## Monte Carlo Control without Exploring Starts + +The only general way to ensure that actions are selected infinitely often is for the agent to continue to select them. There are two approaches ensuring this, resulting in what we call *on-policy* methods and *off-policy* methods. + +On-policy methods attempt to evaluate or improve the policy that is used to make decisions, whereas off-policy methods evaluate or improve a policy different from that used to generate the data. + +In on-policy control methods the policy is generally *soft*, meaning that $\pi(a|s)$ for all $a \in \mathcal{A}(s)$. The on-policy methods in this section uses $\epsilon$-greedy policies, meaning that most of the time they choose an action that has maximal estimated action value, but with probability $\epsilon$ they instead select an action at random. + +On-policy first-visit MC control (for $\epsilon$-soft policies) + +``` + +``` + +Initialize, for all $s \in \mathcal{S}$, $a \in \mathcal{A}(s)$: + + $Q(s, a)$ ← arbitrary + + $Returns(s,a)$ ← empty list + + $\pi(a|s)$ ← an arbitrary $\epsilon$-soft policy + +Repeat forever: + + (a) Generate an episode using $\pi$ + + (b) For each pair $s,a$ appearing in the episoe + +​ $G$ ← the return that follows the first occurance of s, a + +​ Append $G$ to $Returns(s,a)$ + +​ $Q(s, a)$ ← average($Returns(s,a)$) + + (c) For each $s$ in the episode: + +​ $A^*$ ← argmax$_a Q(s,a)$ (with ties broken arbitrarily) + +​ For all $a \in \mathcal{A}(s)$: + +​ $\pi(a|s)$ ← $\begin{cases} 1 - \epsilon + \epsilon / |\mathcal{A}(s)| & a = A^* \\ \epsilon / | \mathcal{A}(s)| & a \neq A^* \end{cases}$ + +``` + +``` + diff --git a/content/research/reinforcementlearning/notes/mdp.md b/content/research/reinforcementlearning/notes/mdp.md new file mode 100644 index 0000000..cde47b2 --- /dev/null +++ b/content/research/reinforcementlearning/notes/mdp.md @@ -0,0 +1,193 @@ +# Chapter 3: Finite Markov Decision Processes + +Markov Decision processes are a classical formalization of sequential decision making, where actions influence not just immediate rewards, but also subsequent situations, or states, and through those future rewards. Thus MDPs involve delayed reward and the need to trade-off immediate and delayed reward. Whereas in bandit problems we estimated the value of $q_*(a)$ of each action $a$, in MDPs we estimate the value of $q_*(s, a)$ of each action $a$ in state $s$. + +MDPs are a mathematically idealized form of the reinforcement learning problem. As we will see in artificial intelligence, there is often a tension between breadth of applicability and mathematical tractability. This chapter will introduce this tension and discuss some of the trade-offs and challenges that it implies. + +## Agent-Environment Interface + +The learner and decision maker is called the *agent*. The thing it interacts with is called the *environment*. These interact continually, the agent selecting actions and the environment responding to these actions and presenting new situations to the agent. + +The environment also give rise to rewards, special numerical values that the agent seeks to maximize over time through its choice of actions. + +![1536511147205](/home/rozek/Documents/Research/Reinforcement Learning/1536511147205.png) + +To make the future paragraphs clearer, a Markov Decision Process is a discrete time stochastic control process. It provides a mathematical framework for modeling decision making in situations where outcomes are partly random and partly under the control of the decision maker. + +In a *finite* MDP, the set of states, actions, and rewards all have a finite number of elements. In this case, the random variables R_t and S_t have a well defined discrete probability distribution dependent only on the preceding state and action. +$$ +p(s^\prime | s,a) = \sum_{r \in \mathcal{R}}{p(s^\prime, r|s, a)} +$$ +Breaking down the above formula, it's just an instantiation of the law of total probability. If you partition the probabilistic space by the reward, if you sum up each partition you should get the overall space. This formula has a special name: the *state-transition probability*. + +From this we can compute the expected rewards for each state-action pair by multiplying each reward with the probability of getting said reward and summing it all up. +$$ +r(s, a) = \sum_{r \in \mathcal{R}}{r}\sum_{s^\prime \in \mathcal{S}}{p(s^\prime, r|s,a)} +$$ +The expected reward for a state-action-next-state triple is +$$ +r(s, a, s^\prime) = \sum_{r \in \mathcal{R}}{r\frac{p(s^\prime, r|s,a)}{p(s^\prime|s,a)}} +$$ +I wasn't able to piece together this function in my head like the others. Currently I imagine it as if we took the formula before and turned the universe of discourse from the universal set to the state where $s^\prime$ occurred. + +The MDP framework is abstract and flexible and can be applied to many different problems in many different ways. For example, the time steps need not refer to fixed intervals of real time; they can refer to arbitrary successive states of decision making and acting. + +### Agent-Environment Boundary + +In particular, the boundary between agent and environment is typically not the same as the physical boundary of a robot's or animals' body. Usually, the boundary is drawn closer to the agent than that. For example, the motors and mechanical linkages of a robot and its sensing hardware should usually be considered parts of the environment rather than parts of the agent. + +The general rule we follow is that anything that cannot be changed arbitrarily by the agent is considered to be outside of it and thus part of its environment. We do not assume that everything in the environment is unknown to the agent. For example, the agent often knows quite a bit about how its rewards are computed as a function of its actions and the states in which they are taken. But we always consider the reward computation to be external to the agent because it defines the task facing the agent and thus must be beyond its ability to change arbitrarily. The agent-environment boundary represents the limit of the agent's absolute control, not of its knowledge. + +This framework breaks down whatever the agent is trying to achieve to three signals passing back and forth between an agent and its environment: one signal to represent the choices made by the agent, one signal to represent the basis on which the choices are made (the states), and one signal to define the agent's goal (the rewards). + +### Example 3.4: Recycling Robot MDP + +Recall that the agent makes a decision at times determined by external events. At each such time the robot decides whether it should + +(1) Actively search for a can + +(2) Remain stationary and wait for someone to bring it a can + +(3) Go back to home base to recharge its battery + +Suppose the environment works as follows: the best way to find cans is to actively search for them, but this runs down the robot's battery, whereas waiting does not. Whenever the robot is searching the possibility exists that its battery will become depleted. In this case, the robot must shut down and wait to be rescued (producing a low reward.) + +The agent makes its decisions solely as a function of the energy level of the battery, It can distinguish two levels, high and low, so that the state set is $\mathcal{S} = \{high, low\}$. Let us call the possible decisions -- the agent's actions -- wait, search, and recharge. When the energy level is high, recharging would always be foolish, so we do not include it in the action set for this state. The agent's action sets are +$$ +\begin{align*} +\mathcal{A}(high) &= \{search, wait\} \\ +\mathcal{A}(low) &= \{search, wait, recharge\} +\end{align*} +$$ +If the energy level is high, then a period of active search can always be completed without a risk of depleting the battery. A period of searching that begins with a high energy level leaves the energy level high with a probability of $\alpha$ and reduces it to low with a probability of $(1 - \alpha)$. On the other hand, a period of searching undertaken when the energy level is low leaves it low with a probability of $\beta$ and depletes the battery with a probability of $(1 - \beta)$. In the latter case, the robot must be rescued, and the batter is then recharged back to high. + +Each can collected by the robot counts as a unit reward, whereas a reward of $-3$ occurs whenever the robot has to be rescued. Let $r_{search}$ and $r_{wait}$ with $r_{search } > r_{wait}$, respectively denote the expected number of cans the robot will collect while searching and waiting. Finally, to keep things simple, suppose that no cans can be collected ruing a run home for recharging and that no cans can be collected on a step in which the battery is depleted. + +| $s$ | $a$ | $s^\prime$ | $p(s^\prime | s, a)$ | $r(s| +| ---- | -------- | ---------- | ------------- | ------------ | --- | +| high | search | high | $\alpha$ | $r_{search}$ | +| high | search | low | $(1-\alpha)$ | $r_{search}$ | +| low | search | high | $(1 - \beta)$ | -3 | +| low | search | low | $\beta$ | $r_{search}$ | +| high | wait | high | 1 | $r_{wait}$ | +| high | wait | low | 0 | $r_{wait}$ | +| low | wait | high | 0 | $r_{wait}$ | +| low | wait | low | 1 | $r_{wait}$ | +| low | recharge | high | 1 | 0 | +| low | recharge | low | 0 | 0 | + +A *transition graph* is a useful way to summarize the dynamics of a finite MDP. There are two kinds of nodes: *state nodes* and *action nodes*. There is a state node for each possible state and an action node for reach state-action pair. Starting in state $s$ and taking action $a$ moves you along the line from state node $s$ to action node $(s, a)$. The the environment responds with a transition ot the next states node via one of the arrows leaving action node $(s, a)$. + +![1537031348278](/home/rozek/Documents/Research/Reinforcement Learning/1537031348278.png) + +## Goals and Rewards + +The reward hypothesis is that all of what we mean by goals and purposes can be well thought of as the maximization of the expected value of the cumulative sum of a received scalar signal called the reward. + +Although formulating goals in terms of reward signals might at first appear limiting, in practice it has proved to be flexible and widely applicable. The best way to see this is to consider the examples of how it has been, or could be used. For example: + +- To make a robot learn to walk, researchers have provided reward on each time step proportional to the robot's forward motion. +- In making a robot learn how to escape from a maze, the reward is often $-1$ for every time step that passes prior to escape; this encourages the agent to escape as quickly as possible. +- To make a robot learn to find and collect empty soda cans for recycling, one might give it a reward of zero most of the time, and then a reward of $+1$ for each can collected. One might also want to give the robot negative rewards when it bumps into things or when somebody yells at it. +- For an agent to play checkers or chess, the natural rewards are $+1$ for winning, $-1$ for losing, and $0$ for drawing and for all nonterminal positions. + +It is critical that the rewards we set up truly indicate what we want accomplished. In particular, the reward signal is not the place to impart to the agent prior knowledge about *how* to achieve what we want it to do. For example, a chess playing agent should only be rewarded for actually winning, not for achieving subgoals such as taking its opponent's pieces. If achieving these sort of subgoals were rewarded, then the agent might find a way to achieve them without achieving the real goal. The reward signal is your way of communicating what you want it to achieve, not how you want it achieved. + +## Returns and Episodes + +In general, we seek to maximize the *expected return*, where the return is defined as some specific function of the reward sequence. In the simplest case, the return is the sum of the rewards: +$$ +G_t = R_{t + 1} + R_{t + 2} + R_{t + 3} + \dots + R_{T} +$$ +where $T$ is the final time step. This approach makes sense in applications in which there is a natural notion of a final time step. That is when the agent-environment interaction breaks naturally into subsequences or *episodes*, such as plays of a game, trips through a maze, or any sort of repeated interaction. + +### Episodic Tasks + +Each episode ends in a special state called the *terminal state*, followed by a reset to the standard starting state or to a sample from a standard distribution of starting states. Even if you think of episodes as ending in different ways the next episode begins independently of how the previous one ended. Therefore, the episodes can all be considered to ending the same terminal states with different rewards for different outcomes. + +Tasks with episodes of this kind are called *episodic tasks*. In episodic tasks we sometimes need to distinguish the set of all nonterminal states, denoted $\mathcal{S}$, from the set of all states plus the terminal state, denoted $\mathcal{S}^+$. The time of termination, $T$, is a random variable that normally varies from episode to episode. + +### Continuing Tasks + +On the other hand, in many cases the agent-environment interaction goes on continually without limit. We call these *continuing tasks*. The return formulation above is problematic for continuing tasks because the final time step would be $T = \infty$, and the return which we are trying to maximize, could itself easily be infinite. The additional concept that we need is that of *discounting*. According to this approach, the agent tries to select actions so that the sum of the discounted rewards it receives over the future is maximized. In particular, it chooses $A_t$ to maximize the expected discounted return. +$$ +G_t= \sum_{k = 0}^\infty{\gamma^kR_{t+k+1}} +$$ +where $\gamma$ that is a parameter between $0$ and $1$ is called the *discount rate*. + +#### Discount Rate + +The discount rate determines the present value of future rewards: a reward received $k$ time steps in the future is worth only $\gamma^{k - 1}$ time what it would be worth if it were received immediately. If $\gamma < 1$, the infinite sum has a finite value as long as the reward sequence is bounded. + +If $\gamma = 0$, the agent is "myopic" in being concerned only with maximizing immediate rewards. But in general, acting to maximize immediate reward can reduce access to future rewards so that the return is reduced. + +As $\gamma$ approaches 1, the return objective takes future rewards into account more strongly; the agent becomes more farsighted. + +### Example 3.5 Pole-Balancing + +The objective in this task is to apply forces to a car moving along a track so as to keep a pole hinged to the cart from falling over. + +A failure is said to occur if the pole falls past a given angle from the vertical or if the cart runs off the track. + +![1537500975060](/home/rozek/Documents/Research/Reinforcement Learning/1537500975060.png) + +#### Approach 1 + +The reward can be a $+1$ for every time step on which failure did not occur. In this case, successful balancing would mean a return of infinity. + +#### Approach 2 + +The reward can be $-1$ on each failure and zero all other times. The return at each time would then be related to $-\gamma^k$ where $k$ is the number of steps before failure. + + + +Either case the return is maximized by keeping the pole balanced for as long as possible. + +## Policies and Value Functions + +Almost all reinforcement learning algorithms involve estimating *value functions* which estimate what future rewards can be expected. Of course the rewards that the agent can expect to receive is dependent on the actions it will take. Accordingly, value functions are defined with respect to particular ways of acting, called policies. + +Formally, a *policy* is a mapping from states to probabilities of selecting each possible action. The *value* of a state s under a policy \pi, denoted $v_{\pi}(s)$ is the expected return when starting in $s$ and following $\pi$ thereafter. For MDPs we can define $v_{\pi}$ as + +$$ +v_{\pi}(s) = \mathbb{E}_{\pi}[G_t | S_t = s] = \mathbb{E}_{\pi}[\sum_{k = 0}^\infty{\gamma^kR_{t+k+1} | S_t = s}] +$$ + +We call this function the *state-value function for policy $\pi$*. Similarly, we define the value of taking action $a$ in state $s$ under a policy $\pi$, denoted as $q_\pi(s,a)$ as the expected return starting from $s$, taking the action $a$, and thereafter following the policy $\pi$. Succinctly, this is called the *action-value function for policy $\pi$*. + +### Optimality and Approximation + +For some kinds of tasks we are interested in,optimal policies can be generated only with extreme computational cost. A critical aspect of the problemfacing the agent is always teh computational power available to it, in particular, the amount of computation it can perform in a single time step. + +The memory available is also an important constraint. A large amount of memory is often required to build up approximations of value functions, policies, and models. In the case of large state sets, functions must be approximated using some sort of more compact parameterized function representation. + +This presents us with unique oppurtunities for achieving useful approximations. For example, in approximating optimal behavior, there may be many states that the agent faces with such a low probability that selecting suboptimal actions for them has little impact on the amount of reward the agent receives. + +The online nature of reinforcement learning which makes it possible to approximate optimal policies in ways that put more effort into learning to make good decisions for frequently encountered states at the expense of infrequent ones is the key property that distinguishes reinforcement learning from other approaches to approximately solve MDPs. + +### Summary + +Let us summarize the elements of the reinforcement learning problem. + +Reinforcement learning is about learning from interaction how to behave in order to achieve a goal. The reinforcement learning *agent* and its *environment* interact over a sequence of discrete time steps. + +The *actions* are the choices made by the agent; the states are the basis for making the choice; and the *rewards* are the basis for evaluating the choices. + +Everything inside the agent is completely known and controllable by the agent; everything outside is incompletely controllable but may or may not be completely known. + +A *policy* is a stochastic rule by which the agent selects actions as a function of states. + +When the reinforcement learning setup described above is formulated with well defined transition probabilities it constitutes a Markov Decision Process (MDP) + +The *return* is the function of future rewards that the agent seeks to maximize. It has several different definitions depending on the nature of the task and whether one wishes to *discount* delayed reward. + +- The un-discounted formulation is appropriate for *episodic tasks*, in which the agent-environment interaction breaks naturally into *episodes* +- The discounted formulation is appropriate for *continuing tasks* in which the interaction does not naturally break into episodes but continue without limit + +A policy's *value functions* assign to each state, or state-action pair, the expected return from that state, or state-action pair, given that the agent uses the policy. The *optimal value functions* assign to each state, or state-action pair, the largest expected return achievable by any policy. A policy whose value unctions are optimal is an *optimal policy*. + +Even if the agent has a complete and accurate environment model, the agent is typically unable to perform enough computation per time step to fully use it. The memory available is also an important constraint. Memory may be required to build up accurate approximations of value functions, policies, and models. In most cases of practical interest there are far more states that could possibly be entries in a table, and approximations must be made. + + + + diff --git a/content/research/reinforcementlearning/readings.md b/content/research/reinforcementlearning/readings.md new file mode 100644 index 0000000..5243255 --- /dev/null +++ b/content/research/reinforcementlearning/readings.md @@ -0,0 +1,19 @@ +# Readings for Lectures of Cluster Analysis + +## Lecture 1 +Chapter 1: What is Reinforcement Learning? + +## Lecture 2 +Chapter 2: Multi-armed Bandits + +## Lecture 3 +Chpater 3: Finite Markov Decision Processes Part 1 + +## Lecture 4 +Chapter 3: Finite Markov Decision Processes Part 2 + +## Lecture 5 +[No Readings] Playing around with Multi-armed Bandits Code + + +**Lost track of readings around this time period :(** diff --git a/content/research/reinforcementlearning/syllabus.md b/content/research/reinforcementlearning/syllabus.md new file mode 100644 index 0000000..6cea733 --- /dev/null +++ b/content/research/reinforcementlearning/syllabus.md @@ -0,0 +1,78 @@ +# Reinforcement Learning + +The goal of this independent study is to gain an introduction to the topic of Reinforcement Learning. + +As such the majority of the semester will be following the textbook to gain an introduction to the topic, and the last part applying it to some problems. + + +## Textbook + +The majority of the content of this independent study will come from the textbook. This is meant to lessen the burden on the both us of as I already experimented with curating my own content. + +The textbook also includes examples throughout the text to immediately apply what's learned. + +Richard S. Sutton and Andrew G. Barto, "Reinforcement Learning: An Introduction" http://incompleteideas.net/book/bookdraft2017nov5.pdf + +## Discussions and Notes + +Discussions and notes will be kept track of and published on my tilda space as time and energy permits. This is for easy reference and since it's nice to write down what you learn. + +## Topics to be Discussed + +###The Reinforcement Learning Problem (3 Sessions) + +In this section we will get ourselves familiar with the topics that are commonly discussed in Reinforcement learning problems. + +In this section we will learn the different vocab terms such as: + +- Evaluative Feedback +- Non-Associative Learning +- Rewards/Returns +- Value Functions +- Optimality +- Exploration/Exploitation +- Model +- Policy +- Value Function +- Multi-armed Bandit Problem + +### Markov Decision Processes (4 Sessions) + +This is a type of reinforcement learning problem that is commonly studied and well documented. This helps form an environment for which the agent can operate within. Possible subtopics include: + +- Finite Markov Decision Processes +- Goals and Rewards +- Returns and Episodes +- Optimality and Approximation + +### Dynamic Programming (3 Sessions) + +Dynamic Programming refers to a collection of algorithms that can be used to compute optimal policies given an environment. Subtopics that we are going over is: + +- Policy Evaluation +- Policy Improvement +- Policy Iteration +- Value Iteration +- Asynchronous DP +- Generalized policy Iteration +- Bellman Expectation Equations + +### Monte Carlo Methods (3 Sessions) + +Now we move onto not having complete knowledge of the environment. This will go into estimating value functions and discovering optimal policies. Possible subtopics include: + +- Monte Carlo Prediction +- Monte Carlo Control +- Importance Sampling +- Incremental Implementation +- Off-Policy Monte Carlo Control + +### Temporal-Difference Learning (4-5 Sessions) + +Temporal-Difference learning is a combination of Monte Carlo ideas and Dynamic Programming. This can lead to methods learning directly from raw experience without knowledge of an environment. Subtopics will include: + +- TD Prediction +- Sarsa: On-Policy TD Control +- Q-Learning: Off-Policy TD Control +- Function Approximation +- Eligibility Traces diff --git a/content/ta.md b/content/ta.md new file mode 100644 index 0000000..9c539de --- /dev/null +++ b/content/ta.md @@ -0,0 +1,28 @@ +--- +title: Teaching Assistant +description: My work as a teaching assistent +--- + + +## Dr. Jessica Zeitz-Self +I was the lab aide for Dr. Zeitz' Computer Programming and Problem Solving (CPSC 220). + +My role in this class was to help students during lab time and to create lecture notes based on the lectures given in class. + +[Spring 2018/CPSC 220 Notes](spring2018/cpsc220) + +## Dr. Jennifer Polack + +I've been the lab aide for two of Polack's classes so far: Introduction to Computer Science (CPSC 110) and Computer Programming and Problem Solving (CPSC 220). + +My role involves helping students debug during the lab time. I also create lecture notes for students to look over while working on projects. + +[Summer 2017/CPSC 110 Notes](summer2017/cpsc110) + +[Fall 2017/CPSC 220 Lecture Notes](fall2017/cpsc220) + +## Dr. Ron Zacharski + +I was the lab aide for Zacharski's DATA 101 class. My role in his class mostly involved helping students debug during lab time and grading student's demonstrations of what they've done in a lab. + +He also asked me to TA for the NVIDIA Computer Vision workshop that he was running at the University. diff --git a/content/ta/_index.md b/content/ta/_index.md new file mode 100644 index 0000000..e69de29 diff --git a/content/ta/fall2017/cpsc220.md b/content/ta/fall2017/cpsc220.md new file mode 100644 index 0000000..53b1b81 --- /dev/null +++ b/content/ta/fall2017/cpsc220.md @@ -0,0 +1,39 @@ +# CPSC 220 Computer Programming and Problem Solving Fall 2017 + +[Lecture 3 -- September 6](sept6) + +[Lecture 4 -- September 11](sept11) + +[Lecture 7 -- September 20](sept20) + +[Lecture 9 -- September 25](sept25) + +[Lecture 10 -- October 2](oct2) + +[Lecture 11 -- October 4](oct4) + +[Lecture 12 -- October 9](oct9) + +[Lecture 13 -- October 11](oct11) + +[Lecture 15 -- October 18](oct18) + +[Lecture 16 -- October 23](oct23) + +[Lecture 17 -- October 25](oct25) + +[Lecture 18 -- October 30](oct30) + +[Exam 2 Review -- October 30](exam2review) + +[Lecture 19 -- November 6](nov6) + +[Lecture 20 -- November 13](nov13) + +[Lecture 21 -- November 15](nov15) + +[Lecture 22 -- November 20](nov20) + +[Lecture 23 -- November 27](nov27) + +[Lecture 25 -- December 6](dec6) diff --git a/content/ta/fall2017/cpsc220/dec6.md b/content/ta/fall2017/cpsc220/dec6.md new file mode 100644 index 0000000..b1de303 --- /dev/null +++ b/content/ta/fall2017/cpsc220/dec6.md @@ -0,0 +1,125 @@ +# Final Review December 6 + +## Classes + +Here is how you can create a class called "Employee" with a non-default constructor (a constructor that takes parameters) and a getter and setter + +```java +public class Employee { + // Our private variables + private String name; + private double salary; + // Non-default constructor + public Employee(String name, double salary) { + this.name = name; + this.salarly = salary; + } + // This is a getter + public string getName() { + return name; + } + public double setSalarly(double salary) { + this.salary = salary; + } +} +``` + +## For Loops + Arrays + +For loops are constructed in the following way + +`for (initialization; condition to stop; increment to get closer to condition to stop)` + +```java +//Assume an array with variable name array is declared before +for (int i = 0; i < array.length; i++) { + // This code will loop through every entry in the array +} +``` + +Note that you don't always have to start from zero, you can start anywhere from the array. + +## For Loops + Arrays + Methods + +This is an example of how you can take in an array in a method + +```java +public static boolean isEven(int[] array) { // <-- Note the int[] array + for (int i = 0; i < array.length; i++) { // Iterate through the entire array + // If you find an odd number, return false + if (array[i] % 2 == 1) { + return false; + } + } + // If you didn't find any odd numbers, return true + return true; +} +``` + +## File I/O + +Let's say that you have the following file + +``` +4 +chicken +3 +salad +``` + +And you want to make it so that you take the number, and print the word after it a certain number of times. For this example we would want to see the following + +```java +chicken chicken chicken chicken +salad salad salad +``` + +Here is the code to write it + +```java +public static void printStrings() { + FileInputStream file = new FileInputStream("stuff.txt"); // File contents are in stuff.txt + Scanner scnr = new Scanner(file); // Scanner takes in a file to read + while (scnr.hasNext()) { // While there are still stuff in the file to read + int number = scnr.nextInt(); // Grab the number + String word = scnr.next(); // Grab the word after the number + // Print the word number times + for (int i = 0; i < number; i++) { + System.out.print(word); + } + // Put a new line here + System.out.println(); + } + +} +``` + +## Recursion + +Look at handout and carefully trace recursion problems + +## 2D Arrays + +Declare a 2D int array with 4 rows and 7 columns + +```java +int[][] dataVals = new int[4][7]; +``` + +A 2D array with 4 rows and 7 columns has 7 * 4 = 28 entries. + + + +If you want to sum up all the numbers in a 2 dimensional array, do the following + +``` java +// Assume numbers is declared beforehand +int sum = 0; +for (int i = 0; i < numbers.length; i++) { // Loop through every row in the 2D array + for (int j = 0; j < numbers[i].length; j++) { // Loop through every column in a row + // This code now looks at one entry in a 2D array + sum += numbers[i][j]; + } +} +``` + diff --git a/content/ta/fall2017/cpsc220/exam2review.md b/content/ta/fall2017/cpsc220/exam2review.md new file mode 100644 index 0000000..e6acf9d --- /dev/null +++ b/content/ta/fall2017/cpsc220/exam2review.md @@ -0,0 +1,62 @@ +# Exam Review Partial Answer Sheet + +Write a Java method to sum values of an array + +```java +// Assume variable numbers is an array of 10 integers +int sum = 0; +for (int i = 0; i < numbers.length; i++) { + sum += numbers[i]; +} +``` + +Write a Java method to test if an array contains a specific value + +```java +// Assume variable numbers is an array of 10 integers +int numWanted = 4; +boolean found = false; +for (int i = 0; i < numbers.length; i++) { + if (numbers[i] == numWanted) { + System.out.println("The number " + numWanted + " was found!"); + found = true; + } +} +if (!found) { + System.out.println("The number " + numWanted + " was not found!"); +} +``` + +Write a Java method to find the index of an array element + +```java +// Assume variable numbers is an array of 10 integers +int numWanted = 4; +boolean found = false; +for (int i = 0; i < numbers.length; i++) { + if (numbers[i] == numWanted) { + System.out.println("The index of number " + numWanted + " is " + i); + } +} +``` + +How many lines will the following loop print when it is run? + +```java +int i = 0; +while (i <= 6) { + System.out.println("i is now " + (i)); + i++; +} +``` + +``` +i is now 0 +i is now 1 +i is now 2 +i is now 3 +i is now 4 +i is now 5 +i is now 6 +``` + diff --git a/content/ta/fall2017/cpsc220/nov13.md b/content/ta/fall2017/cpsc220/nov13.md new file mode 100644 index 0000000..028152e --- /dev/null +++ b/content/ta/fall2017/cpsc220/nov13.md @@ -0,0 +1,221 @@ +# Lecture for November 13 + +## File IO (Cont.) + +Last class we talked about reading from files, we can also write to files. + +### Import necessary libraries + +First you must import all of the necessary libraries + +```java +// To read +import java.util.Scanner; +import java.io.FileOutputStream; +// To Write +import java.io.FileReader; +import java.io.PrintWriter; +// For Exception Handling +import java.io.IOException; +``` + +Then in your main, declare a `FileOutputStream` and `PrintWriter` + +```java +FileOutputStream file; +PrintWriter print; +``` + +### Try-Catch-Finally + +Create a try block to open a file for writing + +```java +try { + // If the file doesn't exist, it'll create it + file = new FileOutputStream("output.txt"); + print = new PrintWriter(file); +} catch (IOException except) { + // Prints out the error message + System.out.println("File error " + except.getMessage()); +} +``` + +Adding a finally block allows the program to clean up before it closes + +```java + try { + file = new FileOutputStream("output.txt"); + print = new PrintWriter(file); + } catch (IOException except) { + System.out.println("File error " + except.getMessage()); + } finally { // It starts here! + delete file; + delete print; + file.close(); + return; + } +``` + +### Write to the file :) + +Then you can write the to file! + +```java +// Do you notice the following methods? + print.println("Your number is"); + print.print("My name is..\n"); + print.printf("%s %d", "Hello ", 5); + print.flush(); //Clears the output stream + file.close(); //Closes the file + +``` + +Extra Note: Disk fragmentation is a way of cleaning up memory that isn't being used by any of the code on your computer. + +## Swing Graphics + +### Importing Necessary Libraries + + + +You need to import all the necessary libraries first + +```java +import javax.swing.*; +import java.awt.FlowLayout; +import java.awt.event.ActionListener; +``` + +### Changing the class header + +Your class file needs to extend `JFrame` that way it can use a bunch of the already existent code written for Swing applications + +```java +public class firstGUi extends JFrame { + //.... +``` + +### Swing Components + +Java Swing makes use of what is called Swing Components. These are basic building blocks of GUI items you can add to the screen. For example, a checkbox, a radio button, text field. These are all swing components. + +I wrote a blog post back in the summer which is an overview of them. You can check it out here: https://brandonrozek.com/2017/06/java-swing-components/ + +Inside your `firstGUI` class, declare some Swing components you would like to use in the program + +```java +public class firstGUI extends JFrame { + JButton button1; + JTextArea area; + JTextField text; + // .... + +``` + +### Constructor + +You need to create a constructor for this class that way you can initiate all of the swing component values. + +```java +// ... +JButton button1; +JTextArea area; +JTextField text; + +// Begin Constructor +firstGUI() { + // Define the components + JLabel name = new JLabel("Enter in your name:"); + text = new JTextField("Jennifer", 20); // 20 characters long, default value: Jennifer + area = new JTextArea(10, 10); //Width and Height is 10 characters big + JScrollPane sp = new JScrollPane(area); //Adds a scroll bar for the text area + button1 = new JButton("Press Me"); + + // Set the Layout + // FlowLayout organizes each of the components top to bottom, left to right + setLayout(new FlowLayout()); + + // Add the components to the screen + add(name); + add(text); + add(sp); // never add the textarea when surrounded by a ScrollPane + add(button1); +} +``` + +### New Main Method + +Finally, you need to create the Main method which will initiate it all + +```java +public static void main(String[] args) { + firstGUI myFrame = new firstGUI(); + + // End the program when the 'x' button (not keyboard) is pressed + myFrame.setDefaultCloseOperation(JFrame.EXIT_ON_CLOSE); + + myFrame.setTitle("My title"); // Titles the window + myFrame.pack(); // Packs it all into the frame + myFrame.setVisible(true); // Makes the frame appear on the screen +} +``` + +### Making it interactive + +You need to change your class header to the following + +```java +public class firstGUI extends JFrame implements ActionListener { + // ... +``` + +Then in your class, add the following method + +```java +@Override public void actionPerformed(ActionEvent event) { + // Do stuff as a result of an event here + area.append("You Pressed the Button"); +} +``` + +To make it actually activate as a result of an event. You need to attach it to a swing component. + +For example, I want the code in `actionPerformed` to activate in result of a button press. + +Add the following line to your code in the constructor. + +```java +//... +button1 = new JButton("Press Me"); +button1.addActionListener(this); // New Code +//.... +``` + + + +### Identifying Button Pressed + +How do you know which button was pressed in the `actionPerformed` method? + +You can use `event.getSource()` to find out. + +Example: + +```java +@Override public void actionPerformed(ActionEvent event) { + if (event.getSource() == button1) { // Replace button1 with appropriate variable name + // Do things as a result of a specific button being pressed + } +} +``` + +### Summary + +To use Swing, do the following steps + +1. Import Libraries +2. Declare J___ variables +3. New the J___ variables +4. Add the J___ variables to the frame +5. Add the `ActionListener` to the components you wish to monitor \ No newline at end of file diff --git a/content/ta/fall2017/cpsc220/nov15.md b/content/ta/fall2017/cpsc220/nov15.md new file mode 100644 index 0000000..2aa309f --- /dev/null +++ b/content/ta/fall2017/cpsc220/nov15.md @@ -0,0 +1,109 @@ +# Lecture Notes for November 15th + +Import the necessary libraries + +```java +import java.awt.*; +import java.awt.event.*; +import javax.swing.*; +``` + +This time we'll be using the null layout. This will require you to set the x, and y positions of each of the elements on the screen + +First we'll make a class called `GUILayout` which will extend `JPanel` and contain our layout and components + +```java +import java.awt.*; +import java.awt.event.*; +import javax.swing.*; + +public class GUILayout extends JPanel { + private JButton one, two; + private JTextField text; + private JTextArea area; + private int count; // Used to keep track of button pushes + private int number = 0; + + GUILayout() { + // Set the layout to the null layout + setLayout(null); + // Tells the computer that you wish to have the size of your program to be 500x500 + setPreferredSize(new Dimension(500, 500)); + + // Create the buttons + one = new JButton("Change color"); + two = new JButton("Count Pushes"); + + // Set the x, y, width, height inside parenthesis + // This places the buttons on the specified locations on the screen + one.setBounds(10, 10, 100, 24); + two.setBounds(120, 10, 100, 24); + + // Sets the color of the text of button 1 to blue + one.setForeground(Color.BLUE); + + // Add the components to the screen + add(one); + add(two); + + + text = new JTextField("Today is Wednesday, a photographer is here."); + text.setBounds(10, 40 ,480, 24); + add(text); + + area = new JTextArea(20, 20); + // Wrap the text area into the scroll pane + // This adds the scroll bars (vertical/horizontal) + JScrollPane sp = new JScrollPane(area); + sp.setBounds(10, 75, 490, 400); + add(sp); + + // Bind the Listener class to the button one + one.addActionListener(new Listener()); + + // Bind it to two and text + two.addActionListener(new Listener()); + text.addActionListener(new Listener()); + + } + + // Create the class for the listener + private class Listener implements ActionListener { + // Define what you want to occur after an event + public void actionPerformed(ActionEvent event) { + if (event.getSource() == one) { + + } else if (event.getSource() == two) { + count++; + // \n is needed to prevent scrolling + area.append("You pressed the button " + count + " times!"); + } else if (event.getSource() == text) { + // Grab the number inside the text area and set it to the variable number + number = Integer.paseInt(text.getText()); + number += 10; + // add "" to number so that it converts number to a String + text.setText(number + ""); + // Convert the number to a String + String temp = Integer.toString(number); + area.setText(temp); + } + + + } + } +} +``` + +The main code is really short, you just need to extend `JFrame` and some short code seen last class to set it up. + +```java +public class mainTester extends JFrame { + public static void main(String[] args) { + JFrame frame = new JFrame("Sample GUI"); // Sets the title to "Sample GUI" + frame.setDefaultCloseOperation(JFrame.EXIT_ON_CLOSE); + // Instantiate the GUILayout file you made before + frame.getContentPane().add(new GUILayout()); + } +} +``` + diff --git a/content/ta/fall2017/cpsc220/nov20.md b/content/ta/fall2017/cpsc220/nov20.md new file mode 100644 index 0000000..77f2ce6 --- /dev/null +++ b/content/ta/fall2017/cpsc220/nov20.md @@ -0,0 +1,116 @@ +# Lecture for November 20 + +## Adding a drawing panel to the GUI + +You can't put swing and graphics together, therefore you need to make a seperate JPanels for swing and graphics. + +Add necessary libraries + +```java +import java.awt.*; +import java.awt.Graphics; +import java.awt.event.*; +import javax.swing.*; +``` + + + +```java +public class drawingWindow extends JPanel { + JTextField field; + JButton draw; + DrawingPanel drawingPanel; + + public drawingWindow() { + // Each new component would be vertically stacked upon each other + setLayout(new BoxLayout(this, BoxLayout.Y_AXIS)); + + JPanel swingSTuff = new JPanel(); + + // Add things to the screen + draw = new JButton("Draw"); + field = new JTextField(); + swingStuff.add(field); + swingStuff.add(draw) + + // Add the drawing panel onto the screen + drawingPanel = new DrawingPanel(200, 400); + add(drawingPanel); + + // Activate the listener if the button was pressed + draw.addActionListener(new Listener()); + } + + // Add the listener to respond to events + private class listener implements ActionListener { + public void actionPerformed(ActionEvent event) { + if (event.getSource() == draw) { + drawingPanel.setFlag(1); + // Repaints the screen so the oval can appear + drawingPanel.repaint(); + } + } + } + + // Create the draw panel so we can add it to the screen + private class DrawingPanel extends JPanel { + private int width, height; + DrawingPanel(int width, int height) { + this.width = width; + this.height = height; + setPreferredSize(new Dimension(width, height)); + } + public void setFlag(int flag) { + this.flag = flag; + } + public void paintComponent(Graphics g) { + super.paintComponent(g); + + // Every time the flag is set, draw an oval at a random location and color + if (flag == 1) { + Random rand = new Random(); + int x = rand.nextInt(width); + int y = rand.nextInt(height); + g.setColor(Color.RED); + g.fillOval(x, y, 20, 30); + } + } + } +} +``` + +There are a myriad of different methods you can use. + +```java +// Assume width, height, y, x, etc are defined above +public void paintComponent(Graphics g) { + //.... + g.dispose(); // Flushes the graphics buffer +} +``` + +You have the traditional fill and draw methods. Fill creates the shape shaded in with a color. Draw creates an outline of the shape. + +```java + +// ... +g.fillRect(x ,y, width, height); + g.drawRect(x, y, width, height); + g.fillOval(x, y, width, height); + g.drawOval(x, y, width, height); + //g.drawPoly(parematers...); + //g.fillPoly(parameters...); + g.drawArc(x, y, width, height, startingAngle, sweepingAngle); + g.fillArc(x, y, width, height, startingAngle, sweepingAngle); +``` + +You can also create complex shapes like a polygon. When adding points, you need to make sure you add them Clockwise or Counterclockwise (but NOT both) + +```java + Polygon tri = new Polygon(); + tri.addPoint(150, 10); + tri.addPoint(175, 100); + tri.addPoint(125, 100); + // Add points clockwise or counterclockwise (NOT BOTH) +``` + diff --git a/content/ta/fall2017/cpsc220/nov27.md b/content/ta/fall2017/cpsc220/nov27.md new file mode 100644 index 0000000..fc94189 --- /dev/null +++ b/content/ta/fall2017/cpsc220/nov27.md @@ -0,0 +1,267 @@ +# Lecture for November 27 + +## Recursion + +When doing recursion, make sure not to use loops. + +Recursion is when a function makes a function call to itself. + +It consists of two parts: + +- Base Case: This tell it when to stop +- Smaller Caller Case: Helps you get closer to the base case + +You can have one or more base cases or caller cases. + +To teach recursion, we'll start with a problem that should be written iteratively (with loops) but we'll show how to do it with recursion. + +### Example: Counting Down + +```java +void CountDown(int number) { + while (number > 0) { + System.out.println(number + " "); + number = number - 1; + } + System.out.println("Blast Off") +} +``` + +1. How does this loop stop? -- Base Case +2. How does this loop change each time through? -- Smaller caller case + +Base Case: It stops when the number equals 0 + +```java +// Base Case +if (number == 0) { + System.out.println("Blast Off"); + return; +} +``` + +Smaller Caller Case: It decreases number by 1 + +```java +// Smaller Caller Case +System.out.print(number + " "); +countDownRecursive(number - 1); +``` + +Put it together... + +```java +void countDownRecursive(int number) { + if (number == 0) { + System.out.println("Blast Off"); + } else { + System.out.print(number + " "); + countDownRecursive(number - 1); + } +} +``` + +Prints `10 9 8 7 6 5 4 3 2 1 Blast Off` + +### Stack Snapshots + +Every time you make a recursive call, it keeps track of all the local variables at the current function call and pushes it onto the stack. + +That means if you make 10 recursive calls, you'll have 10 slots added onto the stack. If you want to return back to the beginning, you would need to return 10 times. + +### Order Matters + +Whether you do the recursive step first or some other action, it completely changes the output. Look at the following example that's similar to `countDownRecursive`. + +```java +void countUpRecursive(int number) { + if (number == 0) { + System.out.println("Blast Off"); + } else { + // Notice the swapping of the next two lines + countUpRecursive(number - 1); + System.out.print(number + " "); + } +} +``` + +This would print out `Blast Off 1 2 3 4 5 6 7 8 9 10` + +### Example: Summing up to a number + +This would be our iterative solution + +```java +int sum(int number) { + int sum = 0; + while (number > 0) { + sum += number; + number--; + } + return sum; +} +``` + +How does this loop stop? + +​ Same as before. Think about it, if the number you pass in is zero, what should be the result of sum? Zero. Since adding up from 0 to 0 is just 0. + +```java +if (number == 0) { + return 0; +} +``` + +How does this loop change each time through? + +​ You want to update your sum, so return the sum of the next call to the current sum. + +```java +return (number + sum(number - 1)); +``` + +Putting it all together + +```java +int sumRecursive(int number) { + if (number == 0) { + return 0; + } else { + return number + sumRecursive(number - 1); + } +} +``` + +### Example: Linear Search + +How to do it iteratively. + +```java +void linearSearch(int[] array, int number) { + int i = 0; + while (i < array.length && number != array[i]) { + i++; + } + if (i == array.length) { + System.out.println("Not Found"); + } else { + System.out.println("Found"); + } +} +``` + +Base Case: There are two base cases, when it reaches the end of the array and when it finds the number + +```java +if (array.length == i) { + System.out.println("Not Found"); +} else (array[i] == number) { + System.out.println(number + " found at index " + i); +} +``` + +Smaller Caller Case: Check the next element + +```java +linearSearchRecursion(number, array, i + 1); +``` + +Putting it all together... + +```java +void linearSearchRecursion(int[] array, int number) { + if (array.length == i) { + System.out.println("Not Found"); + } else if (array[i] == number) { + System.out.println(number + " found at index " + index); + } else { + linearSearchRecursion(number, array, i + 1); + } +} +``` + +## Binary Search + +This is a much more efficient search than the linear search we have been doing. The only condition is that your array must be sorted beforehand. + +A regular linear search `O(n)` -- Check at most all of the elements of the array. + +Binary Search `O(log(n))` -- Checks at most `ceil(log(n))` elements of an array. + +To demonstrate this with real numbers, let's take an array of 100 elements + +- With linear search this will take at most 100 iterations +- With binary search this will take at most **7**. + +Crazy right? + + + +### Implementation + +**Iterative approach** + +```java +void binarySearch(int number, int[] array) { + int lower = 0; + int upper = array.length - 1; + int mid = (lower + upper) / 2 + while (lower <= upper && array[mid] != number) { + mid = (lower + upper) / 2; + if (array[mid] < number) { + lower = mid + 1; + } else if () { + upper = mid -1; + } + } + if (lower > upper) { + System.out.println("Not Found"); + } else { + System.out.println(number + " found at index " + mid); + } +} +``` + +**Recursive Approach** + +Base Case: There are two cases, you either found it, or you made it to the end of the array without finding it + +```java +if (lower > upper) { + System.out.println("Not Found"); +} else if (array[mid] == number) { + System.out.println(number + " found at index " + mid); +} +``` + +Smaller Caller Case: Change the lower or upper bounds to cut the search in half + +```java +if (array[mid] < number) { + lower = mid + 1; + binarySearchRecursive(number, array, lower, upper); +} else if (array[mid] > number) { + upper = mid - 1; + binarySearchRecursive(number, array, lower, upper); +} +``` + +Putting it together.... + +```java +binarySearch(int number, int[] array, int lower, int upper) { + if (lower > upper) { + System.out.println("Not Found"); + } else if (array[mid] == number) { + System.out.println(number + " found at index " + mid); + } + else if (array[mid] < number) { + lower = mid + 1; + binarySearchRecursive(number, array, lower, upper); + } else if (array[mid] > number) { + upper = mid - 1; + binarySearchRecursive(number, array, lower, upper); + } +} +``` + diff --git a/content/ta/fall2017/cpsc220/nov6.md b/content/ta/fall2017/cpsc220/nov6.md new file mode 100644 index 0000000..9c6c08a --- /dev/null +++ b/content/ta/fall2017/cpsc220/nov6.md @@ -0,0 +1,137 @@ +# November 6th Lecture + +## Compare cont. + +Continuing from last week's topic, writing a function called `compare` in your custom class. + +For example, for your project: + +```java +public bool compare(ResearchProject right, int type) { + if (type == 0) { // Is last lastname greater than right lastname alphabeticallly + if (lastname.compareTo(right.lastname) > 0) { + return true; + } else { + return false; + } + } else if (type == 1) { // Implement a different type of comparison + + } +} +``` + +You can then use the sorting algorithms discussed previously to sort the ResearchProjects using the `compare` method. + +## File IO + +First start by importing the required libraries. + +```java +import java.io.FileInputStream; +import java.io.IOException; // For error handling +import java.io.FileNotFoundException; // For error handling +import java.util.Scanner; +``` + +Then inside your main method which throws an IOException (see example "Reading the filename from the keyboard") + +```java +FileStream file; +Scanner in; +try { // Try something + file = new FileInputStream("test.txt"); + in = new Scanner(file); +} catch (FileNotFoundException e) { // Catch IF it fails + System.out.println("File not found."); + in = new Scanner(System.in); // Read from the keyboard instead +} +// Read the file now.... +String name = in.nextLine(); +``` + +Before we had linked the Scanner to the keyboard, now we're doing it to a file. + +### Try-Catch + +In the code above you see what's called a try-catch block. That means that if something was to happen in the execution of the code. Instead of just crashing as we have been seeing normally. We can deal with the error. In the example above you saw that the program reads from the keyboard instead of the file + +### Reading the filename from the keyboard + +```java +public static void main(String[] args) throws IOException { + FileInputStream file; + Scanner in, scnr; + // Connect one scanner to the keyboard to get the filename + scnr = new Scanner(System.in); + + System.out.print("Enter file name: "); + String filename = in.nextLine(); + + // Repeat code from previous example + FileStream file; + Scanner in; + try { + file = new FileInputStream(filename); // Only this line changed + in = new Scanner(file); + } catch (FileNotFoundException e) { + System.out.println("File not found."); + in = new Scanner(System.in); + } + String name = in.nextLine(); + // .... +} +``` + +The main throws the IOException since we don't deal with it in any of the catch blocks. + + + +### Reading names of people from a file into an array + +Let's say we have a file with the following in it + +``` +3 +Paul +Peter +Mary +``` + +3 is to indicate the number of names in th file. + +Let's write code in order to read these names into an array! + +```java +import java.io.FileInputStream; +import java.io.IOException; +import java.io.FileNotFoundException; +import java.util.Scanner; +public static void main(String[] args) throws IOException { + FileInputStream file; + Scanner in, scnr; + scnr = new Scanner(System.in); + + System.out.print("Enter file name: "); + String filename = in.nextLine(); + + FileStream file; + Scanner in; + try { + file = new FileInputStream(filename); // Only this line changed + in = new Scanner(file); + } catch (FileNotFoundException e) { + System.out.println("File not found."); + in = new Scanner(System.in); + } + + // For the size of the array, get the first number in the file + int size = in.nextInt(); + String[] nameArray = new String[size]; + for (int i = 0; i < size; i++) { + namesArray[i] = in.nextLine(); + } + + // Now all the names in the file is in the namesArray +} +``` + diff --git a/content/ta/fall2017/cpsc220/oct11.md b/content/ta/fall2017/cpsc220/oct11.md new file mode 100644 index 0000000..a306568 --- /dev/null +++ b/content/ta/fall2017/cpsc220/oct11.md @@ -0,0 +1,133 @@ +# Lecture Notes October 11 + +## Global Variables + +Global variables is where you don't declare a variable inside a method. This is generally not a recommended practice. It is recommended to declare variables inside methods so that it is easier to reuse code. + +```java +public class mainDriver { + public static int globalVariable = 5; // I am a global variable + public static void main(String[] args) { + int localVariable = 4; // I am a local variable + } +} +``` + +## String Formatting + +You can format strings in java by using the `printf` method in System.out. + +Format strings work by using placeholders starting with `%` to specify where to place the value of a variable. + +General format of command + +```java +//System.out.printf(FormatString, variable1, variable2, ....) +String s = "The number is"; +int x = 5; +System.out.printf("%s %d", s, x); // Prints "The number is 5" +``` + +If you want to print out money, you can do it through the following + +```java +float tax = 0.45698; +System.out.printf("The tax is %.2f"); //prints "The tax is 0.46" +``` + +## Floating point precision + +Due to how computers store non-integers, math can be non-precise after some mathematical operations. It is therefore advantageous to do operations on integers to the level of precision you want. + +For example, instead of working in dollars, work in pennies since it's the smallest division we care about. + + + +### ArrayList + +Standard arrays are static, meaning they have no ability to grow. Instead of doing the operations we described last class, in order to add something to an array. We can use something called an `ArrayList` instead. + +The methods in the `ArrayList` library are useful abstractions to make the life of a programmer easier. + +ArrayLists can also hold only one type. The type cannot be a primitive like a standard array. Instead it must be a class representing the desired type. + +int -> Integer + +double -> Double + +char -> Character + +float -> String + +To declare and initialize an `ArrayList` + +```java +import java.util.ArrayList; +public class ArrayListTest { + public static void main(String[] args) { + ArrayList numbers = new ArrayList(); + ArrayList names = new ArrayList(); + } +} +``` + +`ArrayList`s has a variety of different methods that can be used to access/manipulate it + +- get +- set +- add +- clone +- clear +- size + +If you want to add the numbers 1 through 10 into the `ArrayList` of numbers + +```java +for (int i = 1; i < 11; i++) { + numbers.add(i); +} +``` + +To print out the entire contents of the `ArrayList` + +```java +for (int i = 0; i < numbers.size(); i++) { + System.out.println(numbers.get(i)); +} +``` + +How can you replace a value? + +```java +int n = 5; // Make this the number you wish to replace +int i = 0; +while (i < numbers.size() && numbers.get(i) != n) { + i++; +} +if (i == numbers.size()) { + System.out.println(n + " not found."); +} else { + int r = 10; // Make this the value you want to replace n with + numbers.set(i, r); +} +``` + +The `remove` method removes an item given an index. This shifts all the elements above the removed index down. + +```java +numbers.remove(3); // Removes the element in the third index +``` + +The `add` method can also take an index. It pushes all the elements at the index specified up. + +```java +numbers.add(3, 5); // Adds the number 5 to the third index +``` + +You can clone an array using the `clone` method + +```java +ArrayList numbers2 = new ArrayList(); +numbers2.clone(numbers); // Clones numbers into numbers2 +``` + diff --git a/content/ta/fall2017/cpsc220/oct18.md b/content/ta/fall2017/cpsc220/oct18.md new file mode 100644 index 0000000..0eaf04b --- /dev/null +++ b/content/ta/fall2017/cpsc220/oct18.md @@ -0,0 +1,75 @@ +# October 18th + +## ArrayLists in classes + +```java +public class Numbers { + private ArrayList used; + private ArrayList unused; + numbers () { + // Debug: System.out.println("1. Constructor Entry Point"); + used = new ArrayList(); + unused = new ArrayList(); + // Debug: System.out.println("2, Constructor Size of ArrayLists" + used.size() + " " + unused.size()) + } + // Adds the numbers 1-5 into the used ArrayList + public void fillUsedArrayList() { + for (int i = 0; i < 5; i++) { + used.add(i + 1); + } + } + // Move an item from the unused ArrayList to the used ArrayList + public int moveIt(int index) { + int temp = used.get(index); + unused.add(temp); + // Debug: System.out.println("Adding to used array:" + (i + 1)); + used.remove(index); + return temp; + } + // The method below is created for debugging purposes + public void printBothArrayLists() { + // Print the used arraylist + System.out.println("Used ArrayList"); + for (int i = 0; i < used.size(); i++) { + System.out.println(used.get(i)); + } + + // Print the unused arraylist + System.out.println("Unused ArrayList"); + for (int i = 0; i < unused.size(); i ++) { + System.out.println(unused.get(i)); + } + } +} +``` + +Recall that you can compile the code above but you cannot run it. To run code, you must have a main method. + +## NumberTester + +```java +public class NumberTester { + public static void main(String[] args) { + Numbers list; + list = new Numbers(); + list.fillUsedArrayList(); + list.printBothArrayLists(); + } +} +``` + + + + + +## Difference between Array and ArrayList + +An Array is a **static** structure of contiguous memory of a single type. + +An ArrayList is a **dynamic** structure of contiguous memory of a single type + + + +To get the size of an array you use `.length` + +To get the size of an ArrayList you use `.size()` \ No newline at end of file diff --git a/content/ta/fall2017/cpsc220/oct2.md b/content/ta/fall2017/cpsc220/oct2.md new file mode 100644 index 0000000..73581c8 --- /dev/null +++ b/content/ta/fall2017/cpsc220/oct2.md @@ -0,0 +1,160 @@ +# Lecture Notes Oct 2nd + +## Array + +`array` is not a reserved word, it's a concept. Arrays are able to hold multiple values under one name of the same type. + +For instance, you can have an array of integers. + +Properties of an array + +- Size (n) +- index [0, n - 1] + +You can declare arrays by saying the type '[]' and the name of the array + +```java +int[] numbers; +double[] gpas; +float[] grades; +``` + +Before you can use the array, you must `new` it + +```java +numbers = new int[10]; +``` + +Where 10 is the size of the array. + +You can combine both the declaration and initialization + +```java +double[] points = new double[7]; +``` + +You can access individual elements of the array by using its index. Indexes start from zero + +```java +points[0] = 5.4; // The first element in the point array is 5.4 +``` + +The `.length` property of an array gives the size of the array + +## For-Loops + Arrays + +You can print out each element in the array using a for loop + +```java +for (int i = 0; i < numbers.length; i++) { + System.out.println(numbers[i]); +} +``` + +You can ask a user to input a value to each element in the array + +```java +for (int i = 0; i < points.length; i++) { + System.out.print("Enter a number: "); + points[i] = scnr.nextInt(); +} +``` + +## While-Loops + Arrays + +You can use a while loop to search the array + +```java +int i = 0; +int number = 5; +// While the index is within the array size and the number isn't found +while (i != number.length && number != numbers[i]) { + i++ +} +if (i == numbers.length) { + System.out.println(number + " was not found.") +} else { + System.out.println(number + " was found at index " + i) +} +``` + +If you don't include the `i != number.length` you will obtain an `IndexOutOfBounds` error. + +The example above is called a *Linear Search*. + +Linear searches work on an unsorted and sorted arrays. + + + +## Methods + Arrays + +You can pass an array into a method + +```java +public static void exampleMethod(int[] sample) { + // Do something +} +public static void main(String[] args) { + int[] s = new int[30]; + exampleMethod(s); +} +``` + + + +## Do-While Loops + +For-loops can run 0 or more times. If you want something to execute at least once. Use a do-while loop. + +```java +do { + // Code +} while (condition); +``` + +For example, to search at least once and asking whether the user wants to search again + +```java +// Assume linearSearch and array are defined +char answer; +Scanner input = new Scanner(System.in); +do { + linearSearch(array, input); + System.out.print("Do you want to search again? (Y/N) "); + input.nextLine(); + answer = input.next().charAt(0); +} while( answer != 'N'); +``` + +You can create any type of loop just by using a while loop. + + + +## Example: Finding the Max + +You can find the max of an array using the following method + +```java +double max = arrayName[0]; +for (int i = 1; i < arrayName.length; i++) { + if (max < arrayName[i]) { + max = arrayName[i]; + } +} +System.out.println("The max is " + max); +``` + + + +## Example: Summing up an array + +You can sum the array using the following method + +```java +double sum = 0; +for (int i = 0; i < arrayName.length; i++) { + sum += arrayName[i]; +} +System.out.println("The sum is " + sum); +``` + diff --git a/content/ta/fall2017/cpsc220/oct23.md b/content/ta/fall2017/cpsc220/oct23.md new file mode 100644 index 0000000..682dc5c --- /dev/null +++ b/content/ta/fall2017/cpsc220/oct23.md @@ -0,0 +1,78 @@ +# Lecture for October 23 + +## Two-Dimensional Arrays + +You can think of a two dimensional array as a grid that is organized by rows then columns. + +To declare a two dimensional array do the following + +```java +int[][] grid = new int[5][5]; // Declares a 2D array of 5 rows and 5 columns +``` + +You can have as many dimensions as you want. For graphics a 3-dimensional array would render 3D points. + +It doesn't have to be inherently visual though, you can have the n-dimensional array look at the interaction between n different variables. For example, the relationships to different questions in a survey. + +Strings are essentially a char array with extra methods attached. We can imitate an array of strings with a 2D char array. + +```java +char[][] helloWorld = new char[5][5]; +hello[0][0] = 'h'; +hello[0][1] = 'e'; +hello[0][2] = 'l'; +hello[0][3] = 'l'; +hello[0][4] = 'o'; +hello[1][0] = 'w'; +hello[1][1] = 'o'; +hello[1][2] = 'r'; +hello[1][3] = 'l'; +hello[1][4] = 'd'; + +``` + +## Nested-For Loops + +To access the elements in a 2D array, you need to use a nested for-loop. + +Here is how you print out the hello world example above + +```java +for (int row = 0; row < helloWorld.length; row++) { + for (int col = 0; col < helloWorld[row].length; col++) { + System.out.print(helloWorld[row][col]); + } + System.out.print(" ") +} +``` + +The code above prints out "hello world" + + + +## 2D Arrays in methods + +You can write a get like method in the following way + +```java +public static void get(int[][] array, int row, int col) { + return array[row][col]; +} +``` + +Arrays in Java are pass by reference not pass by value. Meaning that if you change the array within the method then it will change outside the method. + +```java +public static void insert(int[][] array, int row, int col, int numToInsert) { + array[row][col] = numToInsert; +} +``` + +To make it not be able to change the array inside the method, use the keyword `const` inside the method header. To code below will throw a compiler error. + +```java +public static void insert(const int[][] array, int row, int col, int numToInsert) { + array[row][col] = numToInsert; // This line will throw an errror +} +``` + diff --git a/content/ta/fall2017/cpsc220/oct25.md b/content/ta/fall2017/cpsc220/oct25.md new file mode 100644 index 0000000..fcfc7e7 --- /dev/null +++ b/content/ta/fall2017/cpsc220/oct25.md @@ -0,0 +1,21 @@ +# Lecture on Oct 25 + +## 2 Dimension Array of Objects + +You can not only do a two dimensional array of primitive types, but you can also do two dimensional arrays of objects/classes. + +```java +animalLocation[][] map; +map = new animalLocation[5][4]; +``` + +Since we are dealing with classes, you cannot use this array right away. The code above creates the space in memory to store the objects. To have the animalLocation objects in the array, you must `new` each instance of the object. + +```java +for (int i = 0; i < map.length; i++) { + for (int j = 0; j < map[i].length; j++) { + map[i][j] = new animalLocation(); + } +} +``` + diff --git a/content/ta/fall2017/cpsc220/oct30.md b/content/ta/fall2017/cpsc220/oct30.md new file mode 100644 index 0000000..39e4f00 --- /dev/null +++ b/content/ta/fall2017/cpsc220/oct30.md @@ -0,0 +1,101 @@ +# Oct 30 Lecture + +## Sorting + +### Bubble Sort + +These instructions are to sort in descending order, to sort in ascending order just negate the condition. + +This sort is a series of iterations, for each iteration you go to the bottom of the array. Then compare if the value is greater than the element before it. If it is, then you + +1. Go to the bottom of the array +2. Compare the value to the one before it + 1. If it's greater than the element before it -> swap +3. Move on to the value before it and repeat step 2. + +Once you go through an iteration, the last thing being compared is the greatest value of the entire array. That means you don't have to check it every time anymore. + +Keep going through all the iterations until n, where n is the size of the array, iterations have been completed. + +### Swapping Values + +If you try to swap variables by saying + +```java +y = x; +x = y; +``` + +then you'll end up overwriting y's value with x and both variable would have x's value. + +If you want to actually swap variables, you must create a temporary variable that saves y's value so that it can be properly assigned to x. + +```java +int temp; +temp = y; +y = x; +x = temp; +``` + +### Implementation (Not Complete) + +```java +// Each iteration +for (int j = 0; j < array.length - 1; j++) { + // Each element in the list + for (int i = 0; i < array.length - 1; i++) { + // Is the element greater than the one after it? + if (array[i] > array[i + 1]) { + // Swap + int temp = array[i + 1]; + array[i + 1] = array[i]; + array[i] = temp; + } + } +} +``` + +This here compares each of the values each time. If you remember before, I said that you don't have to compare the topmost each time. + +### Implementation + +To change this, just change the second loop condition + +```java +// Each iteration +for (int j = 0; j < array.length - 1; j++) { + // Each element in the list + for (int i = 0; i < array.length - 1 - i; i++) { // Note this line + // Is the element greater than the one after it? + if (array[i] > array[i + 1]) { + // Swap + int temp = array[i + 1]; + array[i + 1] = array[i]; + array[i] = temp; + } + } +} +``` + +## Compare + +In Java, you can compare numbers, strings, and even your own customized objects. To compare your own customize object, you must write a method called `compare` in your class. + +### To use your compare method in the sorting algorithm + +```java +// Each iteration +for (int j = 0; j < array.length - 1; j++) { + // Each element in the list + for (int i = 0; i < array.length - 1 - i; i++) { + // Is the element greater than the one after it? + if (array[i].compare(array[i + 1])) { // Note this line + // Swap + int temp = array[i + 1]; + array[i + 1] = array[i]; + array[i] = temp; + } + } +} +``` + diff --git a/content/ta/fall2017/cpsc220/oct4.md b/content/ta/fall2017/cpsc220/oct4.md new file mode 100644 index 0000000..5329411 --- /dev/null +++ b/content/ta/fall2017/cpsc220/oct4.md @@ -0,0 +1,30 @@ +# Lecture on October 4th + +## Pass by Copy vs Pass by Reference + +### Pass by Copy + +When you pass a primitive type into a method (int, char, double, float, etc), it makes a copy of the value of the variable and brings it into the method + +### Pass by Reference + +When you pass an array into a method (int[], char[], double[], etc[]), it passes in the reference of the variable into the method. In other words, you give the actual array into the method and allows the method to change it. + +### What's the Implication? + +If you change the primitive in a method, it doesn't actually change the value of the variable. + +If you pass in an array and change it in the method, it has been permanently changed outside the method as well. + +### How do I make it so I can't change my array by accident? + +Use the `final`keyword in the method header + +```java +public static void printAll(final int[] array) { + for (int i = 0; i < array.length; i++) { + System.out.println("Number " + (i + 1) + " is " + array[i]) + } +} +``` + diff --git a/content/ta/fall2017/cpsc220/oct9.md b/content/ta/fall2017/cpsc220/oct9.md new file mode 100644 index 0000000..14bee39 --- /dev/null +++ b/content/ta/fall2017/cpsc220/oct9.md @@ -0,0 +1,37 @@ +# Lecture Notes October 9th + +## Arrays (Cont.) + +### Another way of Array Initialization + +```java +String[] names = {"Jennifer", "Noodle", "Fluffy", "Rosie", "Cinnamon", "Brianne", "Oliver"} +``` + +Everything between the `{}` is the initial values in the names array in the order that it is written. + +Recall that arrays are of a fixed size. The `names` array above has 7 elements. + +### What can I do if I want to add something to the names array? + +Do the following steps: + +1. Create an empty array with the same size as the array +2. Take all the contents in the array and store it in a temporary array +3. Set names equal to another array of a bigger size +4. Take all the contents in temp and store it back to the array of choice +5. Add an element to the array by index + +```java +// (1) +String[] temp = new String[7]; +// (2) +temp.clone(names); +// (3) +names = new String[20]; // Now it can hold up to 20 names +// (4) +names.clone(temp); +// (5) +names[7] = "New name!"; +``` + diff --git a/content/ta/fall2017/cpsc220/sept11.md b/content/ta/fall2017/cpsc220/sept11.md new file mode 100644 index 0000000..b1b6b49 --- /dev/null +++ b/content/ta/fall2017/cpsc220/sept11.md @@ -0,0 +1,220 @@ +# CPSC 220 Lecture 4 + +## Practice Problem + +1. Create a class called Car +2. - Create a private variable of int type called year + - Create a private variable of String type called make +3. Create accessor methods for all data members. +4. Create mutator methods for all data methods. + + + +```java +public class car { // begin car + private int year; + private String make; + public int getYear(void) { + return year; + } + public String getMake() { + return make; + } + public void setYear(int y) { + if (y > 1890) { + year = y; + } else { + System.out.println(y + " is not a valid year."); + } + } + public void setMake(String m) { + make = m; + } +} +``` + +Local variables are only existent within the curly braces that it is defined in. + +## If Statements and Boolean Expressions + +Boolean expressions return a boolean + +```java +1 < 4; // 1 is less than 4: TRUE +3 > 5; // 3 is greater than 5: FALSE +5 == 5; // 5 is equal to 5: TRUE +5 != 5; // 5 is not equal to 5: FALSE +1 >= 1; // 1 is greater than or equal to 1: TRUE +5 <= 1; // 5 is less than or equal to 1: FALSE +``` + + If statements only occur if the boolean expression is true, otherwise the `else` block is executed. + +```java +if (true) { + System.out.println("I am always printed"); +} else { + System.out.println("I am never printed"); +} +``` + +You can only have one `else` per `if`. If you have an `if` you don't necessarily need an `else` + +## Local vs Class Variables + +If you have a local variable and the class variable sharing the same name, then the local variable is always used first. + +```java +public class car { // begin car + private int year; + public void setYear(int year) { + year = year; + } +} +``` + +This is a redundant statement, it makes the argument that is passed in equal to itself. + +To avoid this situation, use the keyword `this` to access the class variable + +```java +public class car { + private int year;   + public void setYear(int year) {     + this.year = year; + } +} +``` + +The code above runs as expected. + +Rewriting our class with `this` + +```java +public class car { // begin car + private int year; + private String make; + public int getYear(void) { + return year; + } + public String getMake() { + return make; + } + public void setYear(int year) { + if (y > 1890) { + this.year = year; + } else { + System.out.println(y + " is not a valid year."); + } + } + public void setMake(String make) { + this.make = make; + } +} +``` + +## Unreachable Code + +When the code hits a `return` statement, it stops executing the rest of the code in the method. Also throws an Unreachable Code Error. + +```java +public int add(int x, int y) { + return x + y; + System.out.println("x + y = " + x + y); +} +add(); +System.out.println("Hello"); +``` + +Here the code above will not compile, though assuming the error doesn't exist then it would only print out "Hello" + +## Constructors + +You cannot have a private or protected constructors. + +Constructors are used to initialize your objects. + +You want to have the class variables to the left of the assignment statement. + +```java +public class car { + private int year; + private String make; + car() { + year = 1890; + make = "Ford"; + } + car(int year, String make) { + this.year = year; + this.make = make; + } +} +``` + + + +## Testers + +Testers are useful to check that the class is implemented correctly. Both the tester and the class have to be in the same folder/directory. + +```java +public class carTester { + public static void main(String[] args) { + Car myCar; // Declaration + myCar = new Car(); // Initilization + Car yourCar = new Car(2009, "Hyundai"); // Declaration + Initialization + } +} +``` + + + +## More about classes + +```java +public class Car { + private String name; + private int odometer; + public void setOdometer(int od) { + odometer = od; + } + public void setName(String n) { + this.name = n; + } + public void changeOilRequest(String name, int od) { + if (name == this.name) { + int difference = od - this.odometer; + if (difference > = 3000) { + // You can call other methods in the class + setOdo(od); // Equivalent to "this.setOdo(od);" + this.odometer = od; + System.out.println("Ready for oil change."); + } else { + System.out.println(name + " not ready for oil change.") + } + } // end if + } // end changeOil request +} // end class +``` + +To call public methods outside the class use the variable name to do so. + +```java +public class CarTester { + public static void main(String[] args) { + Car myCar = new Car(); + myCar.setName("Honda") + myCar.changeOilRequest("Honda", 3400); + } +} +``` + +## Math library + +The `ceil` method rounds up while the `floor` method runs down. + +```java +Math.ceil(3.2); // 4 +Math.ceil(4.1); // 4 +``` + diff --git a/content/ta/fall2017/cpsc220/sept20.md b/content/ta/fall2017/cpsc220/sept20.md new file mode 100644 index 0000000..4fea2f2 --- /dev/null +++ b/content/ta/fall2017/cpsc220/sept20.md @@ -0,0 +1,177 @@ +## Counting Loop + +Looking at the following example code + +```java +int i; +for (i = 0; i < 3; i++) { //begin for + System.out.println("i = " + i); //body +} //end for +System.out.println("After loop, i = " + i); +``` + +`i = 0` is the initializing statement + +`i < 3` is the conditional, that is when the loop ends + +`i++` is the increment/decrement + +`i++` is synonymous with `i = i + 1` + +The initialization statement only occurs once at the beginning of the loop. + +### Execution Example + +Let us go through this for loop example + +- Let us set `i = 0` +- Is `i < 3`? Yes execute the body + - The body executes an output of `"i = 0"` +- Now we increment `i ++`, i is now 1 +- Is `i < 3`? Yes, 1 is less than 3. Execute body + - The computer prints out `"i = 1"` +- Increment `i++` i is now 2 +- Is `i < 3`? Yes 2 is less than 3. Execute body + - The computer prints out `"i = 2"` +- Increment `i++`, i is now 3 +- Is `i < 3`? No 3 is not less than 3 + - Don't execute body of loop + +Exit loop. Print `"After loop, i = 3"` + + + +### Condensing Syntax + +You can also do the declaration in the initialization statement + +```java +for (int i = 0; i < 3; i++) { + System.out.println("i = " + i); +} +``` + +This now runs like above without the `"After loop, i = 3"` print. You cannot access the variable `i` outside the for loop since in this example, it belongs to the for loop's scope. + + + +## Logic Expressions + +### And Statements + +With the AND operator `&&` both the left and right side needs to be true for the expression to be true. + +```java +true && true // true +true && false // false +false && true // false +false && false // false +``` + +### Or Statements + +With the OR operator `||` either the left or right side needs to be true for the expression to be true. + +```java +true || true // true +true || false // true +false || true // true +false || false // false +``` + +### Examples + +**Example**: Print out the number `n` if it is between 10 and 20 (inclusive) + +```java +if (n >= 10 && n <= 20) { + System.out.println(n); +} +``` + +**Example**: Print out the `age` if it is not of young adult age. Young adult range is from 18 to 39 (inclusive) + +```java +if (!(age >= 18 && age <= 39)) { + System.out.println(age); +} +``` + +Or you can use De Morgan's Law (for the curious) + +```java +if (age < 18 || age > 39) { + System.out.println(age); +} +``` + + + +## For Loops (Cont.) + +### Backwards counting + +You can use the loop to count backwards + +```java +for (int i = 10; i > -1; i--) { + System.out.println(i); +} +``` + +This prints the following + +```java +10 +9 +8 +7 +6 +5 +4 +3 +2 +0 +``` + +### Rows-Columns + +You can make rows and columns of asterisks + +```java +for (int j = 0; j < someNumber; j++) { // Corresponds to rows + for (int i = 0; i < someNumber2; i++) { // Corresponds to columns + System.out.print("*"); + } + System.out.println(""); // Goes to the next row +} +``` + +If `someNumber` equals `someNumber2`, then we have the same amount of rows as columns. + +Let `someNumber` equal to 2 and `someNumber2` equal to 2 + +Output: + +``` +** +** +``` + +### Right Triangles + +You can make a right triangle of Tilda with the following code + +```java +for (int i = 1; i <= num; i++) { // Corresponds to the row + for (int j = 0; j < i; j++) { // Corresponds to the column and stops at the current row number + System.out.print("~"); + } + System.out.println(""); // Moves to next row +} +``` + + + +##### What are for-loops used for? *Reusing code* + diff --git a/content/ta/fall2017/cpsc220/sept25.md b/content/ta/fall2017/cpsc220/sept25.md new file mode 100644 index 0000000..bd7ffd5 --- /dev/null +++ b/content/ta/fall2017/cpsc220/sept25.md @@ -0,0 +1,97 @@ +# Lecture in CPSC 220 Sept 25 2017 + +## Constants + +Adding the keyword `final` in front of a variable declaration makes the variable constant. Meaning you cannot later change it in the code. + +```java +final int MAX = 10; +``` + +By industry norm, the style of the variable is to have it in all caps. + +You CANNOT do the following + +```java +final int MAX = 10; +MAX = 15; +``` + + + +## Using Libraries + +1. Import the library +2. Find the method that is appropriate +3. Use it + +Example: + +```java +import java.util.Math; +public class MathTest { + public static void main(String[] args) { + double answer = Math.ceil(5.4); + System.out.println(Math.ceil(4.5)); + } +} +``` + +## Typecasting / Type Conversions + +You can only cast a variable if you are casting it to a type that is larger than the one it was previously. The expression Polack used is that you cannot fit into super skinny jeans, but you can fit into bigger pants. + +```java +double dnum; +float fnum; +int inum; +dnum = (double)fnum * (double)inum; +``` + +## Char vs String + +`String`s are initialized in Java with double quotes while `char`s are initialized with single quotes + +```java +char initial = 'j'; +String name = "Jennifer"; +``` + +Characters can be read in as an integer. + + + +## Random Numbers + +1. Import `java.util.Random;` +2. Declare the random number generator +3. Initialize with `new` +4. Use it + + + +```java +import java.util.Random; +public class RandTest { + public static void main(String[] args) { + Random rand; + rand = new Random(); + int number = rand.nextInt(100); // Random generates number between 0-99 + } +} +``` + +How do you generate numbers in a different range? [50, 150] + +```java +rand.nextInt(100); // 0-99 +rand.nextInt(101) // 0 - 100 +rand.nextInt(101) + 50 //50-150 +``` + +In more general terms + +```java +rand.nextInt(end - start + 1) + start +``` + diff --git a/content/ta/fall2017/cpsc220/sept6.md b/content/ta/fall2017/cpsc220/sept6.md new file mode 100644 index 0000000..e59128d --- /dev/null +++ b/content/ta/fall2017/cpsc220/sept6.md @@ -0,0 +1,298 @@ +# CPSC 220 Lecture 3 + +## Variables + +Variable -- Storage of information + +The type cannot change in a variable. + +Examples of types include + +- int +- float +- double +- String +- char +- boolean + +Declaration: `int num;` + +Initialization: `num = 5;` + +Declaration + Initialization: `int num = 5;` + +### Possible Errors + +**You cannot declare a variable multiple times.** + +Undefined variables are when you do not declare a variable before attempting to use it. + +### Casting + +You need to cast if you are attempting to lose data or store a larger memory type into a smaller one. + +double -> float -> int **(casting required)** + +```java +double gpa = 3.2; +int num1 = 10 * (int)gpa // 30 +``` + + + + + +# Operations + +The basic number operations are + +- + +- - +- * +- / +- % *(the remainder)* + +Examples + +```java +0 % 2 // 0 +1 % 2 // 1 +2 % 2 // 0 + +3 % 2 // 1 +4 % 2 // 0 +5 % 2 // 1 + +3 % 5 // 3 +7 % 5 // 2 +``` + +You can test if something is even using modulus % + +```java +// Assuming i was initiliazed to a value earlier +if (i % 2 == 0) { + System.out.println("i is even"); +} else { + System.out.println("i is odd"); +} +``` + + # System input + +Here is sample code using a Scanner as input + +```java +import java.util.Scanner; +public class ScannerExample { + public static void main(String[] args) { + Scanner in; + in = new Scanner(System.in); + + // Grab numerical values + int num = in.nextInt(); + float gpa = in.nextFloat(); + double weight = in.nextDouble(); + + // Grab a single character + in.nextLine() + char initial = in.next().charAt(0); + + // To get the entire line of a string + in.nextLine(); + String name = in.nextLine(); + } +} +``` + +You need to use `in.nextLine()` to grab the carriage return that is left after grabbing a numeric value. + + + +# Classes and Objects + +Classes are a new type that you can have multiple things of. + +These classes are blueprints that are made up of primitives or more basic types. + +First create a Pet.java file (Name of the class must match the name of the file) + +```java +public class Pet { + private String name; + private int years; +} +``` + +You can then use the Pet class in your main program. The terminology here is that you can create instances or objects of the class. + +In PetTester.java + +```java +public class PetTester { + public static void main(String[] args) { + Pet myPet; + myPet = new Pet(); + } +} +``` + +**Both Pet.java and PetTester.java must be in the same directory/folder** + +### Mutators/Accessors + +Since the variables are private we cannot access them in the main program. To work around this, we can write what is called a mutator method. + +```java +public class Pet { + private String name; + private int years; + + // Mutators + public void setName(String n) { + name = n; + } + public void setYears(int y) { + if (y >= 0) { + years = y; + } else { + System.out.println("No one is less than 0 years old.") + } + } +} +``` + +Now let's use these new methods + +```java +public class PetTester { + public static void main(String[] args) { + Pet mypet; + myPet = new Pet(); + myPet.setName("Fred"); + myPet.setAge(20); + } +} +``` + +We need a method that will allow us to access the data type. Let's add accessors to our pet class. + +```java +public class Pet { + private String name; + private int years; + + // Mutators + public void setName(String n) { + name = n; + } + public void setYears(int y) { + if (y >= 0) { + years = y; + } else { + System.out.println("No one is less than 0 years old.") + } + } + + // Accessors + public String getName() { + return name; + } + public int getYears() { + return years; + } +} +``` + +Now let's get some information from the pet object, such as the age. + +```java +public class PetTester { + public static void main(String[] args) { + Pet mypet; + myPet = new Pet(); + myPet.setName("Fred"); + myPet.setYears(20); + + int year = myPet.getYears(); + } +} +``` + + + +### Constructors + +Constructors lets us initialize variables in the class without having to use mutator methods. + +```java +public class Pet { + private String name; + private int years; + + // Default Constructor + public Pet() { + name = ""; + years = 0; + } + // Non-Default Constructor + public Pet(int y, String n) { + name = n; + years = y; + } + + // Mutator Methods + public void setName(String n) { + name = n; + } + public void setYears(int y) { + if (y >= 0) { + years = y; + } else { + System.out.println("No one is less than 0 years old.") + } + } + + // Accessor Methods + public String getName() { + return name; + } + public int getYears() { + return years; + } +} +``` + +Now let us see this in action. + +```java +public class PetTester { + public static void main(String[] args) { + Pet yourPet = new Pet(10, "Fluffy"); + } +} +``` + +You can have as many constructors as you want, but they must be different. + +Example: + +```java +public class Pet { + ... + pet() { + name = ""; + years = 0; + } + pet(int y, String n) { + name = n; + years = y; + } + pet(String n) { + years = 1; + name = n; + } + ... +} +``` + diff --git a/content/ta/spring2018.md b/content/ta/spring2018.md new file mode 100644 index 0000000..e69de29 diff --git a/content/ta/spring2018/cpsc220.md b/content/ta/spring2018/cpsc220.md new file mode 100644 index 0000000..4d7cfc1 --- /dev/null +++ b/content/ta/spring2018/cpsc220.md @@ -0,0 +1,40 @@ + +# CPSC 220 Computer Programming and Problem Solving Spring 2018 + +[Lecture 1 -- January 16](jan16) + +[Lecture 2 -- January 18](jan18) + +[Lecture 3 -- January 23](jan23) + +[Lecture 4 -- January 25](jan25) + +[Lecture 5 -- January 30](jan30) + +[Lecture 6 -- February 1](feb1) + +[Lecture 7 -- February 6](feb6) + +[Lecture 8 -- February 8](feb8) + +[Lecture 9 -- February 13](feb13) + +[Lecture 10 -- February 20](feb20) + +[Lecture 11 -- February 27](feb27) + +[Midterm Review](midtermreview) + +[Lecture 12 -- March 13](mar13) + +[Lecture 13 -- March 20](mar20) + +[Lecture 14 -- March 22](mar22) + +[Lecture 15 -- March 27](mar27) + +[Lecture 16 -- March 29](mar29) + +[Lecture 17 -- April 3](apr3) + + diff --git a/content/ta/spring2018/cpsc220/apr3.md b/content/ta/spring2018/cpsc220/apr3.md new file mode 100644 index 0000000..45ff8c4 --- /dev/null +++ b/content/ta/spring2018/cpsc220/apr3.md @@ -0,0 +1,39 @@ +# Lecture for April 3rd + +## Inheritance + +The *base class*, *super class*, or *parent class* is the initial class that we are working with. Let's say that you want to *extend* the class, or add additional functionality. The class that inherits from the parent class is called the *child class*, *subclass* or *derived class*. + +## Child Class Syntax + +```java +public class Truck extends Car { + // Truck Appropriate Fields + // Necessary methods for truck +} +``` + +This code adds all the methods from Car into the Truck class. You can then add methods that is specific to a Truck into the Truck class. + +A child class has all parent fields and access to all parent methods! + +## Visibility Modifiers + +Recall the words `public` and `private` + +The `public` modifier makes the field/method accessible by any class + +The `private` modifier makes the field/method only accessible within the method itself + +The protected modifier makes the field/method accessible within the same class or any subclasses. + +## Overriding a Method + +You can override a parent class method by declaring a method in the child class with the same... + +- name +- number of paramters +- parameter types + +but this method would have different behavior! + diff --git a/content/ta/spring2018/cpsc220/feb1.md b/content/ta/spring2018/cpsc220/feb1.md new file mode 100644 index 0000000..91da26c --- /dev/null +++ b/content/ta/spring2018/cpsc220/feb1.md @@ -0,0 +1,66 @@ +# Lecture for February 1st + +## Control Structures + +In this class we will talk about three types of control structures + +- Sequential +- Selection +- Repetition + +Sequential is what is most familiar to us. Write the lines from top to bottom and it executes it in that order + +### Selection + +Selection depends on the question of `if`. + +If it is raining, wear boots + +```java +if (raining) { + wearingBoots = true; +} +``` + +If you want something to happen also when it is not true, consider an `if-else` statement + +If the light is off, turn it on. + +Otherwise, turn it on + +```java +if (lightIsOn) { + lightIsOn = false; +} else { + lightIsOn = true; +} +``` + +Sometimes you can have multiple branches depending on a condition. Let us take a stop light as an example + +```java +if (light == "red") { + car.stop() +} else if (light == "yellow") { + car.slow() +} else { + car.go() +} +``` + +## String comparison + +There is a specific method in the `String` class when it comes to checking for string equality + +```java +boolean equals(String s) +``` + +Let us look at an example + +```java +String word = "hello"; +boolean ans = word.equals("hello"); // Returns true +boolean ans2 = word.equals("Hello"); // Returns false +``` + diff --git a/content/ta/spring2018/cpsc220/feb13.md b/content/ta/spring2018/cpsc220/feb13.md new file mode 100644 index 0000000..82c7de0 --- /dev/null +++ b/content/ta/spring2018/cpsc220/feb13.md @@ -0,0 +1,74 @@ +# Lecture for February 13 + +## Loops + +###Why Loops? + +While some check is true, repeat the work. + +While the cookies aren't baked, keep baking + +### Loop Building Process + +1. Identify one test that must be true when the loop is finished +2. Use the **opposite** form of the test +3. Within loop, make *progress* towards completion of the goal. + +### While syntax + +```java +while (expression) { + // Loop body executes if expression is true +} +// Statements execute after expression is false +``` + +### Getting Input (Songs in a Playlist Psuedocode) + +```java +// Ask user about first song +while (user says play next song) { + // play next song + // ask user about next song +} +``` + +### Nested Loops + +You can have loops inside loops + +```java +int outer = 1; +while (outer < 4) { + int inner = 1; + while (inner < 4) { + System.out.println(outer + ":" + inner); + inner++; + } + outer++; +} +``` + +This code does the following + +```reStructuredText +1:1 +1:2 +1:3 +2:1 +2:2 +2:3 +3:1 +3:2 +3:3 +``` + +### Break Down the Problem + +Never write the entire program at once! This makes it incredibly hard to debug. Instead break it into small parts. + +Write one part -> debug until it works + +Write second part -> debug until it works + +This way you know which part of your code failed, instead of having everything fail. \ No newline at end of file diff --git a/content/ta/spring2018/cpsc220/feb20.md b/content/ta/spring2018/cpsc220/feb20.md new file mode 100644 index 0000000..89d3bd3 --- /dev/null +++ b/content/ta/spring2018/cpsc220/feb20.md @@ -0,0 +1,94 @@ +# Lecture for February 20th + +## Reading a File + +You can get input from a file instead of from the terminal + +```java +FileInputStream fileIn = new FileInputStream("myFile.txt"); +// Our familiar Scanner +Scanner scnr = new Scanner(fileIn); +// We can use our usual Scanner methods +String line = scnr.nextLine(); +fileIn.close(); // Remember to close the file when you're finished with it! +``` + +### Reviewing Scanner Methods + +To understand some of the Scanner methods we need to be aware of the "newline" character. This character is equivalent to the `Enter` button on the keyboard. + +`scnr.nextLine()` This get's all the characters in the buffer up to the newline character. + +`scnr.next()` Grabs the characters in the next "token". Tokens are usually separated by any whitespace type character (spaces, enters, tabs, etc.) + +## Writing to a File + +Prints information to a file instead of to the screen + +```java +FileOutputStream fileOut = new FileOutputStream("myOutfile.txt"); +PrintWriter out = new PrintWriter(fileOut); +out.println("Print this as the first line."); +out.flush(); // Pushes the file changes to the file +fileOut.close(); // If you forget this then it won't remember your changes +``` + +## Arrays + +Arrays are containers of fixed size. It contains a fixed number of values of the **same type**. (Ex: 10 integers, 2 strings, 5 booleans) + +Declaration + +```java +int[] array; // This declares an integer array +``` + +Initialization + +```java +array = new int[7]; // This states that this array can hold up to 7 integers +``` + +Storing a value in an array + +- Square bracket notation is used + +```java +int[] array = new int[7]; +array[0] = 5; // Stores 5 into the first slot +``` + +Now let us attempt to retrieve the value + +```java +int temp = array[0]; +System.out.println(temp); // Prints "5" +``` + +### Traversing an Array + +Let's say we have the following array + +```java +int[] numbers = {3, 5, 2, 7, 9}; +``` + +Let's print out each of the values in the array + +```java +for (int i = 0; i < numbers.length; i++) { + System.out.print("value in " + i " is " + numbers[i]); +} +``` + +### Finding the maximum value in an Array + +```java +int highest = numbers[0]; +for (int i = 0; i < numbers.length; i++) { + if (numbers[i] > highest) { + highest = numbers[x]; + } +} +``` + diff --git a/content/ta/spring2018/cpsc220/feb27.md b/content/ta/spring2018/cpsc220/feb27.md new file mode 100644 index 0000000..017f97c --- /dev/null +++ b/content/ta/spring2018/cpsc220/feb27.md @@ -0,0 +1,91 @@ +# Lecture for February 27th + +## Review for midterm + +Chapter 1 -- Code Style, API + +Chapter 2 -- Variables & Assignments, strings + +Chapter 3 -- input & output + +Chapter 4 -- branches (if, if/else, switch) + +Chapter 5 -- loops (while, for), scope + +Chapter 6 -- File Reading and Writing + +## Separated vs Connected Branches + +What is the output of this code? + +```java +String preferredLanguage = "Spanish"; +if (preferredLanguage.equals("Chinese")) { + System.out.println("Ni hao!"); +} +if (preferredLanguage.equals("Spanish")) { + System.out.println("Hola!"); +} +if (preferredLanguage.equals("French")) { + System.out.println("Bonjour!"); +} +if (preferredLanguage.equals("German")) { + System.out.println("Gutentag!") +} else { + System.out.println("Hello!") +} +``` + +The output is + +```reStructuredText +Hola! +Hello! +``` + +This is because each of the if statements are independent from each other. Whether or not the if statement gets check is not affected by the if statements around it. + +Since the preferred language equals Spanish it outputs `Hola!` But since the language is also *not German* it prints out `Hello!` as well. + + + +## Using an Array + +Square brackets notation is used to access elements, array slots can be used as variables + +```java +int[] array = new int[7]; // Creates an integer array of size 7 +array[0] = 5; +``` + + + +## Swapping Elements + +You can swap `x` and `y` in the following way with a *temporary* variable + +```java +int x = 6; +int y = 1; + +int temp = x; + +x = y; +y = temp; +``` + + + +## Two-Dimensional Arrays + +```java +// Creates a 2D array of two rows and three columns +int[][] a = new int[2][3] +``` + +You can access an element of this 2D array using the conventional square bracket notation + +```java +a[0][0] = 5; +``` + diff --git a/content/ta/spring2018/cpsc220/feb6.md b/content/ta/spring2018/cpsc220/feb6.md new file mode 100644 index 0000000..91d2451 --- /dev/null +++ b/content/ta/spring2018/cpsc220/feb6.md @@ -0,0 +1,139 @@ +# Lecture for February 6th + +## If Statements -- Cont. + +Inside the parenthesis of the `if` statement must be a boolean expression. This is an expression that evaluates to either `true` or `false`. We can do more complex boolean expressions through logical operators. + +## Logical Operators + +NOT `!a` this is true when `a` is false + +AND `a && b ` this is true when both operands are true + +OR `a || b` this is true when either a is true OR b is true + +## Truth Tables + +- Show all possible outcomes +- It breaks the expression down into parts + +### Not + +Let's look at the most simplest case. Not. + +| a | !a | +| ----- | ----- | +| true | false | +| false | true | + +### AND + +| a | b | a && b | +| ----- | ----- | ------ | +| true | true | true | +| true | false | false | +| false | true | false | +| false | false | false | + +Notice here that `a && b` is only true when both `a` and `b` are true. + +### OR + +| a | b | a \|\| b | +| ----- | ----- | -------- | +| true | true | true | +| true | false | true | +| false | true | true | +| false | false | false | + +Notice here that `a || b` is only false when both `a` and `b` are false. + +## Precedence (Order of Operations) + +| | | +| --------------------------------- | ------------------- | +| Parenthesis | `()` | +| Logical Not | `!` | +| Arithmetic Operators | `*` `/` `%` `+` `-` | +| Relational Operators | `<` `<=` `>` `>=` | +| Equality and Inequality operators | `==` `!=` | +| Logical AND | `&&` | +| Logical OR | `||` | + + + +## Playing with Truth Tables Example + +### a && !b + +| a | b | !b | a && !b | +| ----- | ----- | ----- | ------- | +| true | true | false | false | +| true | false | true | true | +| false | true | false | false | +| false | false | true | false | + +### !a || b + +| a | b | !a | !a \|\| b | +| ----- | ----- | ----- | --------- | +| true | true | false | true | +| true | false | false | false | +| false | true | true | true | +| false | false | true | true | + +### !(a || b && c) + +| a | b | c | b && c | a \|\| (b && c) | !(a \|\| b && c) | +| ----- | ----- | ----- | ------ | --------------- | ---------------- | +| true | true | true | true | true | false | +| true | true | false | false | true | false | +| true | false | true | false | true | false | +| false | true | true | true | true | false | +| true | true | false | false | true | false | +| true | false | true | false | true | false | +| false | true | true | true | true | false | +| false | false | false | false | false | true | + +### !a || b && c + +| a | b | c | !a | b && c | !a \|\| b && c | +| ----- | ----- | ----- | ----- | ------ | -------------- | +| true | true | true | false | true | true | +| true | true | false | false | false | false | +| true | false | true | false | false | false | +| false | true | true | true | true | true | +| true | false | false | false | false | false | +| false | true | false | true | false | true | +| false | false | true | true | false | true | +| false | false | false | true | false | true | + +## Distributive Property of Logical Operators + +The following statements are equivalent + +`!(a && b)` is equivalent to `!a || !b` + +Notice how when you distribute the `!` you have to flip the operand as well. `&&` becomes `||` + +Same is true for the following example + +`!(a || b)` is equivalent to `!a && !b` + +`!(a || b && c)` is equivalent to `!a && (!b || !c)` + +## Short Circuit Evaluation + +In an `&&` (AND) statement, if the left side is `false`, there is no need to evaluate the right side. Since it's going to be false anyways!! + +```java +false && true; // FALSE no matter what the right side is +``` + +In an `||` (OR) statement, if the left side is `true, there is no need to evaluate the right side. Since it's going to be true by default!! + +```java +true || false; // TRUE no matter what the right side is +``` + +Java takes this shortcut by default for efficiency reasons \ No newline at end of file diff --git a/content/ta/spring2018/cpsc220/feb8.md b/content/ta/spring2018/cpsc220/feb8.md new file mode 100644 index 0000000..e17dda2 --- /dev/null +++ b/content/ta/spring2018/cpsc220/feb8.md @@ -0,0 +1,112 @@ +# Lecture for February 8th + +##Switch Statements + +Another way to perform multiway branching. Comparing a variable and constant values (`String`, `int`, `char`) + +Switch statements cannot be used with `boolean`, `double`, or `float`s + +### Syntax + +```java +switch (variable) { + case value1: + // Do something + break; + case value2: + // Do something else + break; + //... + default: + // If all else fails do this + break; +} +``` + +`case` is a reserved word that means "when our variable in consideration is equal to..." + +If you forget the `break` keyword, then the program will keep doing the work of all the statements until it hits a `break` keyword. + +### Example Switch Syntax + +```java +switch (birthday) { + case 1: + birthstone = "garnet"; + break; + case 2: + birthstone = "amethyst"; + break; + // .... + default: + System.out.println("Not valid"); + break; +} +``` + +## Comparing Strings Relationally + +Comparing strings are based on the ASCII value of characters + +Sorting strings will result in strings being in alphabetical or reverse alphabetical order. The values of the strings are compared character by character from the left with each ASCII value. + +To compare strings use the `compareTo()` method. Here is the format of the call + +```java +str1.compareTo(str2) +``` + +This returns a *negative number* when `str1` is less than `str2` + +This returns `0` when `str1` is equal to `str1` + +This returns a *positive number* when `str1` is greater than `str2` + +### Example + +```java +String a = "apple"; +String b = "banana"; + +int x = a.compareTo(b); // x = -1 + +int y = b.compareTo(a); // y = 1 +``` + +## Ternary Operator + +With a ternary operator, you can shorten statements where a value is determined by an if statement + +```java +String output = ""; +if (movieRating > 4) { + output = "Fan favorite"; +} else { + output = "Alright"; +} +``` + +Is equivalent to + +```java +String output = ""; +output = (movieRating > 4)? "Fan favorite": "Alright"; +``` + +### Another Example + +```java +double shipping; +if (isPrimeMember) { + shipping = 0; +} else { + shipping = 3.99; +} +``` + +Is equivalent to + +```java +double shipping = (isPrimeMember)? 0: 3.99; +``` + diff --git a/content/ta/spring2018/cpsc220/jan16.md b/content/ta/spring2018/cpsc220/jan16.md new file mode 100644 index 0000000..363cf71 --- /dev/null +++ b/content/ta/spring2018/cpsc220/jan16.md @@ -0,0 +1,47 @@ +# Lecture for January 16 2018 + +## Comments + +You can use multi-line comments or single line comments to note about a piece of code. This helps you so that you don't forget what was happening in the code + +```java +/* Multi Line Comment +I am multiple lines woo! +*/ + +System.out.println("Hello"); // I am an inline comment +``` + +### Javadocs + +This is a standardized method in Java to describe your functions and classes + +```java +/** + * This is a Javadoc comment. A description of your class should appear here + * @author Brandon + * @version 2018 + */ +public class Example{ + /** Another Javadoc comment. + * A description of your program should go here + */ + public static void main(String[] args) { + + } +} +``` + +## Variables + +Convention in Java is for all of your functions/method names to be lowercase. + +Class names should be title cased, each word is capitalized ex: `IntroExample` + + + +## Java API + +The Java API is publicly accessible and is extremely useful for finding methods in existing classes. + +The API documentation for the `String` class is located here: https://docs.oracle.com/javase/8/docs/api/index.html?java/lang/String.html \ No newline at end of file diff --git a/content/ta/spring2018/cpsc220/jan18.md b/content/ta/spring2018/cpsc220/jan18.md new file mode 100644 index 0000000..3cf89cb --- /dev/null +++ b/content/ta/spring2018/cpsc220/jan18.md @@ -0,0 +1,188 @@ +# Lecture for January 18 + +## Variables and Assignment + +Think about variables as buckets that hold information. Once the bucket is created, only one type of item can go in the bucket. + +```java +sand bucket1; +``` + +We can say that bucket1 is of type `sand`, that means the only thing that can go in the bucket is sand. + +```java +int bucket1; +double bucket2; +``` + +From the two lines above, we have *declared* the variable. + +Variables store state, they are a name for a location in memory. + +Always remember to initialize your variables. Otherwise there's nothing in the bucket! + +```java +bucket1 = 5; +``` + + You can combine both the declaration and initialization + +```java +int count = 15; +``` + +Remember when dealing with variables to stay true with the type, don't mix a bucket of water with a bucket of sand. + +We can update `count` to contain a true value + +```java +count = 55; +``` + +`count` no longer has the value of `15` in it. There's no record of it! It has been overwritten with the value `55` + +### Primitive Types + +There are 8 primitive types in Java + +- boolean +- char +- byte +- short +- int +- long +- float +- double + +byte through double are all *numeric* types + +#### Boolean + +`boolean` can only be equal to `true` or `false` + +```java +boolean student = true; +``` + +#### Char + +Stores a single character from the Unicode set + +There are 16 bits per character which adds up to 65,536 characters + +ASCII is the US subset of the characters. You can look this up online when needing to deal with ASCII values + +```java +char firstLetter = 'A'; +``` + +### Numeric types + +The different numeric types determine the precision of your number. Since numbers are not represented the same in the computer as they are in real life, there are some approximations. + +The default type you can use your code is `int` for integers and `double` for numbers with a decimal point + +There are certain types of operations you can perform on numeric type + +| Symbol | Meaning | Example | Value | +| ------ | --------------- | ---------- | ----- | +| + | addition | 43 + 8 | 51 | +| - | subtraction | 43.0-8.0 | 35.0 | +| * | multiplication | 43 * 8 | 344 | +| / | division | 43.0 / 8.0 | 5.375 | +| % | remainder / mod | 43 % 8 | 3 | +| - | unary minus | -43 | -43 | + +#### Increment/ Decrement + +There are two types of in/decrementers postfix and prefix + +Postfix: + +```java +int x = 0; +int y = 7; +x++; // Shortcut for x = x + 1 +y--; // Shortcut for y = y - 1 +``` + +Prefix + +```java +int x = 0, y = 7, z; +z = y * x++; // Equivalent to (y * x) + 1 = 7 * 0 +z = y * ++x; // Equivalent to y * (x + 1) = 7 * 1 +``` + +### Data Conversion + +There are two types of data conversion, implicit and explicit + +The compiler can perform implicit data conversion automatically. + +Performing an explicit data conversion requires additional work on the programmer's part + +A conversion is implicit if you do **not** lose any information in it + +```java +double price = 6.99; +int sale = 3; +double total = price - sale; +``` + +A *cast* is an explicit data conversion. This is requested by a programmer, this can lead to loss of information + +```java +int nextChar = 'b'; +Character.isAlphabetic( (char) nextChar); // Let's you print the actual letter 'b' instead of the number corresponding to it + +float price = 6.99; +int cost = (int) price; // cost is now 6 +``` + +### Printing variables + +You can print the values of variables using `System.out.println` and `System.out.print` + +The difference is that `System.out.println` adds a new line at the end. Meaning the next print out will be on the next line. + +```java +int cost = 5; +double sale = .30; +System.out.print(cost); +System.out.print(sale); +// Prints out '5.30` +System.out.println(cost); +System.out.println(sale); +// Prints out '5' +// Prints out '0.30' +``` + +To add a space between two variables in a print, add `" "` to the expression in between the two variables + +```java +System.out.println("The total cost is " + 5 " dollars and" + " " + 93 + " cents"); +// The total cost is 5 dollars and 94 cents +``` + +### Input from User + +You can get import from the user, we can do this using the `Scanner` class. + +First import it at the top of your file + +```java +import java.util.Scanner; +``` + +All you can do with `Scanner` is outlined in the Java API at this link https://docs.oracle.com/javase/8/docs/api/index.html?java/util/Scanner.html + +Create a Scanner object + +```java +Scanner input = new Scanner(System.in); +System.out.print("Please enter an integer: "); +price = input.nextInt(); // The integer that the user inputs is now stored in price +System.out.println("Your input: " + price); +``` + diff --git a/content/ta/spring2018/cpsc220/jan23.md b/content/ta/spring2018/cpsc220/jan23.md new file mode 100644 index 0000000..d18f20d --- /dev/null +++ b/content/ta/spring2018/cpsc220/jan23.md @@ -0,0 +1,92 @@ +# Lecture for January 23 + +## Java Class + +In Java, your code must live in a class. + +```java +public class NameOfClass { + public static void main(String[] args) { + // All program code + } +} +``` + +It is important that `NameOfClass` is named meaningfully for the code. It is convention to use CamelCase when using classes. (Capitalize your class names!) + +All methods have a method signature, it is unique to it. For main it is the words `public static void` and the argument `String[] args`. + +`public` means that any other piece of code can reference it. + +`void` means that the method returns nothing + +`main` is the name of the method. It is important to have `main` since that tells the Java Interpreter where to start in your program. + +`String[] args` is the command line arguments inputted into the program. For this part of the class, we don't need to worry about it. + +If you noticed `String` is a class, it is not a primitive type. This is denoted in Java by having it capitalized. + +## Arithmetic Expressions + +There is an order of operations in programming as well. It goes like this: + +1. Parenthesis +2. Unary Operations +3. *, /, % +4. +, - + +And from there you read from left to right. + +## Constant Variables + +These are variables that can never be changed + +```java +final int MINUTES_PER_HOUR = 60 +``` + +The keyword `final` indicates to the Java compiler that it is a constant variable. + +By convention, constants are in all caps with underscores being separated between the words + + + +## Java Math Library + +There are some arithmetic expressions that we want to be able to do and we cannot achieve that simply with the standard operations + +| Method | Description | +| -------------- | ----------------------------- | +| Math.sqrt(x) | square root | +| Math.abs(x) | absolute value | +| Math.pow(a, b) | exponentiation $a^b$ | +| Math.max(a, b) | returns the maximum of a or b | +| Math.min(a, b) | returns the minimum of a or b | +| Math.round(x) | rounds to the nearest integer | + +## Example: Finding Areas + +```java +public class MoreVariables + public static void main(String[] args) { + // Decrate a variable + int x; + + // Initialize ia variable + x = 5; + + // Area of a square + int squareArea = x * x; + System.out.println("Area of a square: " + squareArea); + double newSquare = Math.pow(x, 2); + System.out.println("Area of square: " + newSquare); + + // Area of Circle + final double PI = 3.14159; + double radius = 3; + double circleArea = radius * radius * PI; + System.out.println("Area of circle: " + circleArea); + +} +``` + diff --git a/content/ta/spring2018/cpsc220/jan25.md b/content/ta/spring2018/cpsc220/jan25.md new file mode 100644 index 0000000..949c5c4 --- /dev/null +++ b/content/ta/spring2018/cpsc220/jan25.md @@ -0,0 +1,137 @@ +# Lecture for January 25 + +## Strings + +These are concatenated chars + +```java +'d' + 'o' + 'g' // equivalent to "dog" +``` + +```java +"straw" + "berry" // strawberry +``` + +Strings are denoted by double quotes `""` rather than a string which is denoted by single quotes `''` + +String is not a primitive type, it is a class. Hence, why it is capitalized in Java. + +The `java.lang.String` is automatically imported in Java. + +To declare and initialize a String + +```java +String name = "Henry"; +``` + +In memory it appears as + +| H | 'e' | 'n' | 'r' | 'y' | +| ---- | ---- | ---- | ---- | ---- | +| | | | | | + +### String Methods + +```java +int length() +``` + +```java +boolean equals(String another) +``` + +```java +boolean startsWith(String prefix) +``` + +```java +boolean endsWith(String suffix) +``` + +```java +String substring(int start, int end) +``` + +```java +int indexOf(int ch) +``` + +```java +String toLowerCase() +``` + +### Using String Methods + +```java +char first = name.charAt(0); +``` + +Remember in Java, that it starts counting from zero! If you try to access a letter that doesn't exist, it will produce an `IndexOutOfBounds` error. + +## Errors + +There are two types of errors, compile-type errors and run-time errors. Later we will talk about debugging skills such as making "breakpoints" in your code so you can analyze the different variable values. + +### Compile Time Errors + +Compile time errors are generated due to syntax errors. Forgot a semicolon? Missing a brace? + +### Run-time Errors + +These are logic errors. Not derived from syntax errors. An example of one that was discussed earlier is the `IndexOutOfBounds` error. + + + +## Tricky Thing About Input + +Let's talk about input right now. Let's say you have the following scenario + +```java +Scanner input = new Scanner(System.in); +System.out.println("Enter pet's age: "); +int age = input.nextInt(); +System.out.println("Enter pet's name: "); +String name = input.nextLine(); +System.out.println("Enter pet's breed: "); +String breed = input.next(); +``` + +Then when we start to run the program... + +```reStructuredText +Enter pet's age: +14 +Enter pet's name: +Enter pet's breed: +Labradoodle +``` + +Why did it skip pet's name? Let's run through the process again + +```reStructuredText +Enter pet's age: +14 [ENTER] +Enter pet's name: +Enter pet's breed: +Labradoodle +``` + +Here the [ENTER] key gets saved into name. + +To resolve this, just use an `input.nextLine()` to throw away that [ENTER] + +```java +Scanner input = new Scanner(System.in); +System.out.println("Enter pet's age: "); +int age = input.nextInt(); +System.out.println("Enter pet's name: "); +input.nextLine(); +String name = input.nextLine(); +System.out.println("Enter pet's breed: "); +String breed = input.next(); +``` + + + + + diff --git a/content/ta/spring2018/cpsc220/jan30.md b/content/ta/spring2018/cpsc220/jan30.md new file mode 100644 index 0000000..e5e8095 --- /dev/null +++ b/content/ta/spring2018/cpsc220/jan30.md @@ -0,0 +1,91 @@ +# Lecture for January 30 + +## Random Number Generator + +One of the ways you can do a random number generator is through this method: + +Import a class called random + +```java +import java.util.Random; +``` + +Then you need to create a `Random` object + +```java +Random rand = new Random(); +``` + +After this you can call the `nextInt()` method to get a random number between 0 and $2^{32}$ + +```java +int randInt = rand.nextInt(); +``` + +If you don't want a random number between 0 and $2^{32}$ but instead to another maximum value, then you can call the `nextInt` method inserting the max integer as a parameter. + +Random Integer from 0-10 (not including 10) + +```java +int randInt2 = rand.nextInt(10); +``` + +## Output + +We have already encountered `System.out.println` and `System.out.print` but let us go over the differences again. + +`System.out.println()` prints the contents inside the parenthesis and appends a newline character afterwards so that the next output is on a new line + +`System.out.print()` prints the contents inside the parenthesis and does not output a newline character + + + +### Formatting Output + +If you want more control on how your output is displayed, it is recommended that you use `System.out.printf` to format your output + +First, you need to specify your type using the % instruction + +- d for integer +- f for decimal + +Example: + +```java +int sum = 50; +System.out.printf("Total = %d", sum); +``` + +This outputs + +```reS +Total = 50 +``` + +Notice here that there is no concatenation required like the previous two methods, instead you insert the variables as parameters + +Let us deconstruct the % instruction + +% __ __ . __ __ + +The first underline is the + - 0 space (sometimes we want to pad the money with zeros) + +The second underline is the width of the text + +The third underline is the number of decimal places + +The the final underline is the specifier `f` for decimal and `d` for integer + +Example + +```java +double amount = 0.5; +System.out.printf("Total Due: %0.2f") +``` + +This outputs + +```reStructuredText +Total Due: 0.50 +``` + diff --git a/content/ta/spring2018/cpsc220/mar13.md b/content/ta/spring2018/cpsc220/mar13.md new file mode 100644 index 0000000..5bac319 --- /dev/null +++ b/content/ta/spring2018/cpsc220/mar13.md @@ -0,0 +1,78 @@ +# Lecture for March 13th + +## Methods + +Methods are small blocks of statements that make it easier to solve a problem. It usually focuses on solving a small part of the overall problem. + +Usually in methods you provide some sort of input and get some output out of it. + +### Advantages + +- Code readability +- Modular program development (break up the problem in chunks) +- Incremental development +- No redundant code! + +### Method definition + +Consists of a method name, input and output and the block of statements. + +Usually this is succinctly written using JavaDocs which is what you see in the JavaAPI + +### Method Call + +A method call is the execution of the method. The statements defined in the method is what will execute. + +### Method Stubs + +Recall from method definition the parts of the method definition. Now look at the following method + +```java +String[] split(String s) +``` + +The output here is `String[]` + +The method name is `split` + +The input is `String s` + +## Modular Programming + +Let us look at the following example: + +The program should have a list of grocery prices. It should be able to calculate the total cost of groceries. The store gives a student discount of 5%. The program should calculate this discount and update the total, it should calculate and add the 2.5% tax. + +- First you should add it all up +- Then compute the discount +- Then add the tax + +## Parts of a method definition + +```java +public static int timesTwo(int num) { + int two = num * 2; + return two; +} +``` + +It first starts off by declaring the visibility `public` + +The return type if `int` + +The method name is `timesTwo` + +The input parameter is `int num` + +Between the curly braces is the *body* of the method + +## Calling a Method + +```java +int a = 5; +int b = 3; + +int ans = multiply(a, b) +``` + +The method call is `multiply(a, b)` and the result is stored in the variable `ans` \ No newline at end of file diff --git a/content/ta/spring2018/cpsc220/mar20.md b/content/ta/spring2018/cpsc220/mar20.md new file mode 100644 index 0000000..2210478 --- /dev/null +++ b/content/ta/spring2018/cpsc220/mar20.md @@ -0,0 +1,32 @@ +# Lecture for March 20th + +## Unit Testing + +With unit testing you are able to test small parts as you go. With unit testing, you can test many examples and border cases (extreme inputs) to see how your code reacts to different input. + +## Variable Scope + +A variable declared inside a method is only accessible inside that method. + +A good rule of thumb is that if a variable is declared within curly braces {} then it does not exist outside that curly brace. + +## Method Overloading + +Sometimes we need to have methods with the same name but different input parameters. + +```java +public static int multiply(int a, int b) { + return a * b; +} +``` + +This method only works with integers, what if we want to multiply two doubles? + +We can overload the method by declaring another method with the same name. + +```java +public static double multiply(double a, double b) { + return a * b; +} +``` + diff --git a/content/ta/spring2018/cpsc220/mar22.md b/content/ta/spring2018/cpsc220/mar22.md new file mode 100644 index 0000000..c560df9 --- /dev/null +++ b/content/ta/spring2018/cpsc220/mar22.md @@ -0,0 +1,72 @@ +# Lecture on March 22nd + +## Method Documentation + +Java has a special way that you can document your methods such that it will create documentation for you if you follow the convention. + +The Java API actually uses this technique to produce its own documentation. + +To create this, indicate a method with special comments that begin with `/**` and ends with `*/` + +It contains *block tags* that describe input and output parameters + +`@param` and `@return` + +### Example + +```java +/** + * @param y an integer to sum + * @param x an integer to sum + * @return the sum of x and y + */ +public int multiply(int x, int y) { + return x + y; +} +``` + +## Passing a Scanner + +We only want to create one **user input scanner** per program, we also only want one **file input scanner** per program. + +If a method needs a scanner, you can pass the one you already created in as an input parameter. + +## Array as Input Parameter + +Primitive types (`int`, `char`, `double`, etc.) are passed by value. Modifications made inside a method cannot be seen outside the method. + +Arrays on the other hand, is pass by reference. Changes made to an array inside the method can be seen outside the method. + +```java +public static void main(String[] args) { + int[] nums = {1, 3, 5, 7, 9}; + + timesTwo(nums); +} +public static void timesTwo(int[] arr) { + for (int i = 0; i < arr.length; i++) { + arr[i] *= 2; + } +} +``` + +At the end of the `timesTwo` method call, the variable `nums` would have `{2, 6, 10, 14, 18}` + +## Sizes of Arrays + +### Perfect Size Arrays + +When we declare an array, Java automatically fills every slot of the array with the type in memory. So if you know that you need exactly 8 slots, then you only ask for 8. + +### Oversize Arrays + +This is when we don't know how many slots we need. Therefore, we ask for more than we think we'll need. That way we don't go out of bounds. + +If we do this, then we don't know how many elements we have already inserted into the array. Since the length is the number of slots. + +So we can create another variable, which will keep track of the index in where we can add the next element. + +We use oversized arrays when the size of the array is unknown or may change. + + + diff --git a/content/ta/spring2018/cpsc220/mar27.md b/content/ta/spring2018/cpsc220/mar27.md new file mode 100644 index 0000000..50eac71 --- /dev/null +++ b/content/ta/spring2018/cpsc220/mar27.md @@ -0,0 +1,140 @@ +# Lecture for March 27 + +## In the Real World... + +Objects are known for having characteristics. A car has on average 4 wheels, 2-4 doors, a steering wheel. + +Objects can perform actions. A car can drive, hold cargo, and honk. + +## In the Programming World... + +Object-Oriented Programming + +- Focuses on objects +- Are not linear +- Adds organization to a program +- Fits with human cognition (making abstractions) + +## Class Structure + +```java +public class Classname { + // Fields + // Constructors + // Methods +} +``` + +## Fields + +Fields are instance variables, they store values, help define state, and exist in memory for the lifetime of the object. + +```java +public class Car { + private double price; + private double gas; +} +``` + +## Constructor + +We can build an object through a constructor. It is a special kind of method, this method requires that you not have a return type and that you name it the same as the class itself. + +Constructors help set default field values for the different properties of our class. + +```java +public class Car { + // Begin Constructor + public Car(double cost) { + this.price = cost; + this.gas = 0; + } + // End Constructor + private double price; + private double gas; +} +``` + +**Note:** The `this` keyword refers to the object's fields. This helps keep it separate from other variables you can create in the method and the input parameters you receive. + +## Accessor Method - "Getter" + +We like to classify methods into two types, accessors and mutators. + +Getter methods return a copy of an instance field. It does not change the state of the object. + +```java +public double getPrice() { + return this.price; +} +``` + +## Mutator Method - "Setter" + +This type of method modifies an instance field. It does not return anything and changes the state of the object. + +```java +public void setPrice(double cost) { + this.price = cost; +} +``` + +## Example of Car Class In All Its Glory + +```java +public class Car { + // Instance Variables + private int mpg; + private double price; + + // Constructors + public Car() { + this.price = 0; + this.mpg = 0; + } + public Car(double cost, int mpg) { + this.price = cost; + this.mpg = mpg; + } + + // Accessors + public double getPrice() { + return this.price'' + } + public int getMpg() { + return this.mpg; + } + + // Mutators + public void setPrice(double cost) { + this.price = cost; + } + public void setMpg(int mpg) { + this.mpg = mpg; + } +} +``` + +## Using Classes + +Just like how we used the `Scanner` class, we can also use our new `Car` class. + +```java +public class TestCar { + public static void main(String[] args) { + // Declare an object reference + Car c; + + // Initialize the object + c = new Car(); + + // Update the fields of the object + c.setPrice(3000); + c.setMpg(22); + + // Print object information + System.out.println("Price is " + c.getPrice() ) + } +} +``` + diff --git a/content/ta/spring2018/cpsc220/mar29.md b/content/ta/spring2018/cpsc220/mar29.md new file mode 100644 index 0000000..c5a51e4 --- /dev/null +++ b/content/ta/spring2018/cpsc220/mar29.md @@ -0,0 +1,67 @@ +# Lecture for March 29th + +## Enumerated Types + +These represent a fixed set of constants and include all possible values within them. + +Let's look at coins. On a daily basis in the US, we use the following coins: + +- Penny +- Nickel +- Dime +- Quarter + +Other examples include the days of the week, clothes sizes, etc. + +## Enum Syntax + +Let's define an `enum` type + +```java +public enum Coin { PENNY, NICKEL, DIME, QUARTER} +``` + +Now declare and initialize a variable + +```java +Coin myCoin = Coin.PENNY +``` + +## Arrays vs ArrayList + +Arrays require you to say upfront, how many slots you need. ArrayLists are more flexible since you can change the length of the array during Runtime. + +Arrays can store objects and primitives such as `int`, `char`, `boolean`, etc. + +ArrayLists can only store objects. + +### How to declare an ArrayList + +```java +ArrayList list = new ArrayList(); +``` + +### Differences between getting the length of the array + +**Array** + +```java +int length = array.length; +``` + +**ArrayList** + +```java +int length = array.size(); +``` + +## For Each Loop + +This is a special loop in where you tell it to go through all the elements of the array, without specifying an index. + +```java +for (String b : buildings) { + System.out.print(b); +} +``` + diff --git a/content/ta/spring2018/cpsc220/midtermreview.md b/content/ta/spring2018/cpsc220/midtermreview.md new file mode 100644 index 0000000..1258854 --- /dev/null +++ b/content/ta/spring2018/cpsc220/midtermreview.md @@ -0,0 +1,45 @@ +# More Midterm Review + +Let us suppose that we have the following array + +```java +int[] b = {11, 12, 15, 16, 21} +``` + +## Increase all elements by 2 + +```java +for (int i = 0; i < b.length; i++) { + b[i] += 2; +} +``` + +## Print all elements of array + +```java +for (int i = 0; i < b.length; i++) { + System.out.println(b[i]); +} +``` + +## Sum all the elements of an array + +```java +int sum = 0; +for (int i = 0; i < b.length; i++) { + sum += b[i]; +} +``` + +## Access Last Element of Array + +```java +System.out.println(b[b.length - 1]); +``` + +## Access the middle element + +```java +System.out.println(b[b.length / 2]); +``` + diff --git a/content/ta/summer2017.md b/content/ta/summer2017.md new file mode 100644 index 0000000..e69de29 diff --git a/content/ta/summer2017/cpsc110.md b/content/ta/summer2017/cpsc110.md new file mode 100644 index 0000000..6912fc9 --- /dev/null +++ b/content/ta/summer2017/cpsc110.md @@ -0,0 +1,13 @@ +# CPSC 110 Introduction to Computer Science Summer 2017 + +For the summer session, I didn't write in depth lecture notes. Instead I wrote short complementary blog posts help out with the labs. + +[Viewing Java Applets](/blog/2017-05-24-viewing-java-applets/) + +[Using System Themes in Java Swing](/blog/2017-06-05-using-system-themes-java-swing/) + +[Java Swing Components](/blog/2017-06-05-java-swing-components/) + +[Escape Sequences in Java](/blog/2017-08-28-escape-sequences-java/) + +[Obtaining Command Line Input in Java](/blog/2017-08-28-obtaining-command-line-input-java/) diff --git a/content/transcript.md b/content/transcript.md new file mode 100644 index 0000000..d14ede8 --- /dev/null +++ b/content/transcript.md @@ -0,0 +1,136 @@ +--- +Title: Transcript +Description: Page listing the courses I've taken +--- + +# Transcript + +Below is a list of courses I've taken in the past for credit. + +## Spring 2019 + +Deep Reinforcement Learning (CPSC 491) + +Real Analysis I (MATH 471) + +Abstract Algebra I (MATH 431) + +Operating Systems (CPSC 405) + +Digital Storytelling (CPSC 106) + +## Fall 2018 + +Reinforcement Learning (CPSC 491) + +Programming Languages (CPSC 491) + +Competitive Programming (CPSC 491) + +Multivariate Statistics (STAT 461) + +Foundations of Advance Mathematics (MATH 330) + +Applications of Databases (CPSC 350) + +## Spring 2018 + +Foundations for Data Science (Data 219) + +Theory of Computation (CPSC 326) + +Data Structures and Algorithms (CPSC 340) + +Differential Equations (MATH 312) + +Cluster Analysis (STAT 491) + +## Fall 2017 + +Computer Systems and Architecture (CPSC 305) + +Introduction to Data Science (DATA 101) + +Linear Algebra (MATH 300) + +Methods in Mathematical Physics (PHYS 317) + +Probability & Statistical Inference I (STAT 381) + +Undergraduate Research in Physics (URES 197J) + +## Fall 2017 + +Computer Systems and Architecture (CPSC 305) + +Introduction to Data Science (DATA 101) + +Linear Algebra (MATH 300) + +Methods in Mathematical Physics (PHYS 317) + +Probability & Statistical Inference I (STAT 381) + +Undergraduate Research in Physics (URES 197J) + +## Fall 2017 + +Computer Systems and Architecture (CPSC 305) + +Introduction to Data Science (DATA 101) + +Linear Algebra (MATH 300) + +Methods in Mathematical Physics (PHYS 317) + +Probability & Statistical Inference I (STAT 381) + +Undergraduate Research in Physics (URES 197J) + +## Spring 2017 + +Intro to Discrete Mathematics (CPSC 125A) + +Object-Oriented Analysis & Design (CPSC 240) + +Statistical Methods (MATH 280) + +University Physics II, with Lab (PHYS 106) + +Undergraduate Research in Physics (URES 197J) + +## Fall 2016 + +Software Development Tools (CPSC 225) + +Numbers Rule Your World (FSEM 100M1) + +Intro to Statistics (MATH 200) + +American Music (MUHL 156) + +University Physics I, with Lab (PHYS 105) + +## Advance Placement + +Computer Programming and Problem Solving (CPSC 220) + +Intro to Human Geography (GEOG 102) + +American History to 1865 (HIST 131) + +American History since 1865 (HIST 132) + +Calculus I (MATH 121) + +Calculus II (MATH 122) + +Calculus III (MATH 223) + +General Psychology (PSYCH 100) + + + + + + diff --git a/static/files/courses/BayesianStatistics/Challenger.png b/static/files/courses/BayesianStatistics/Challenger.png new file mode 100644 index 0000000..82d53b2 Binary files /dev/null and b/static/files/courses/BayesianStatistics/Challenger.png differ diff --git a/static/files/courses/BayesianStatistics/challengerfitted.png b/static/files/courses/BayesianStatistics/challengerfitted.png new file mode 100644 index 0000000..38e32c7 Binary files /dev/null and b/static/files/courses/BayesianStatistics/challengerfitted.png differ diff --git a/static/files/courses/BayesianStatistics/heightpairs.png b/static/files/courses/BayesianStatistics/heightpairs.png new file mode 100644 index 0000000..41de2e2 Binary files /dev/null and b/static/files/courses/BayesianStatistics/heightpairs.png differ diff --git a/static/files/groupssimplified.pdf b/static/files/groupssimplified.pdf new file mode 100644 index 0000000..0830c19 Binary files /dev/null and b/static/files/groupssimplified.pdf differ diff --git a/static/files/images/0932485094325.png b/static/files/images/0932485094325.png new file mode 100644 index 0000000..e411cfe Binary files /dev/null and b/static/files/images/0932485094325.png differ diff --git a/static/files/images/1573183066061.png b/static/files/images/1573183066061.png new file mode 100644 index 0000000..46361d1 Binary files /dev/null and b/static/files/images/1573183066061.png differ diff --git a/static/files/images/1578623897330.png b/static/files/images/1578623897330.png new file mode 100644 index 0000000..75937ea Binary files /dev/null and b/static/files/images/1578623897330.png differ diff --git a/static/files/images/1578887790276.png b/static/files/images/1578887790276.png new file mode 100644 index 0000000..8805817 Binary files /dev/null and b/static/files/images/1578887790276.png differ diff --git a/static/files/research/ClusterAnalysisSpring2018.html b/static/files/research/ClusterAnalysisSpring2018.html new file mode 100644 index 0000000..c6b6226 --- /dev/null +++ b/static/files/research/ClusterAnalysisSpring2018.html @@ -0,0 +1,222 @@ + + + + +ClusterAnalysisSpring2018.md + + +

Cluster Analysis Spring 2018

Distance, Dimensionality Reduction, and Tendency

  • Distance

    • Euclidean Distance
    • Squared Euclidean Distance
    • Manhattan Distance
    • Maximum Distance
    • Mahalanobis Distance
  • Which distance function should you use?

  • PCA

  • Cluster Tendency

    • Hopkins Statistic
  • Scaling Data

Validating Clustering Models

  • Clustering Validation
  • Cross Validation

Connectivity Models

  • Agglomerative Clustering

    • Single Linkage Clustering
    • Complete Linkage Clustering
    • Unweighted Pair Group Method with Arithmetic Mean (If time permits)
  • Dendrograms

  • Divisive Clustering

  • CURE (Clustering using REpresentatives) algorithm (If time permits)

Cluster Evaluation

  • Internal Evaluation

    • Dunn Index
    • Silhouette Coefficient
    • Davies-Bouldin Index (If time permits)
  • External Evaluation

    • Rand Measure
    • Jaccard Index
    • Dice Index
    • Confusion Matrix
    • F Measure (If time permits)
    • Fowlkes-Mallows Index (If time permits)

Centroid Models

  • Jenks Natural Breaks Optimization
  • Voronoi Diagram
  • K means clustering
  • K medoids clustering
  • K Medians/Modes clustering
  • When to use K means as opposed to K medoids or K Medians?
  • How many clusters should you use?
  • Lloyd's Algorithm for Approximating K-means (If time permits)

Density Models

  • DBSCAN Density Based Clustering Algorithm
  • OPTICS Ordering Points To Identify the Clustering Structure
  • DeLi-Clu Density Link Clustering (If time permits)
  • What should be your density threshold?

Analysis of Model Appropriateness

  • When do we use each of the models above?

Distribution Models (If time permits)

  • Fuzzy Clusters
  • EM (Expectation Maximization) Clustering
  • Maximum Likelihood Gaussian
  • Probabilistic Hierarchal Clustering

Textbooks

Cluster Analysis 5th Edition

Cluster Analysis: 2014 Edition (Statistical Associates Blue Book Series 24)

Schedule

In an ideal world, the topics below I estimated being a certain time period for learning them. Of course you have more experience when it comes to how long it actually takes to learn these topics, so I'll leave this mostly to your discretion.

Distance, Dimensionality Reduction, and Tendency -- 3 Weeks

Validating Cluster Models -- 1 Week

Connectivity Models -- 2 Weeks

Cluster Evaluation -- 1 Week

Centroid Models -- 3 Weeks

Density Models -- 3 Weeks

Analysis of Model Appropriateness -- 1 Week

The schedule above accounts for 14 weeks, so there is a week that is free as a buffer.

Conclusion

Creating this document got me really excited for this independent study. Feel free to give me feedback :)

+ + \ No newline at end of file diff --git a/static/files/research/ClusterAnalysisSpring2018.md b/static/files/research/ClusterAnalysisSpring2018.md new file mode 100644 index 0000000..002dc8a --- /dev/null +++ b/static/files/research/ClusterAnalysisSpring2018.md @@ -0,0 +1,119 @@ +# Cluster Analysis Spring 2018 + +### Distance, Dimensionality Reduction, and Tendency + +- Distance + - Euclidean Distance + - Squared Euclidean Distance + - Manhattan Distance + - Maximum Distance + - Mahalanobis Distance +- Which distance function should you use? +- PCA +- Cluster Tendency + - Hopkins Statistic +- Scaling Data + +### Validating Clustering Models + +- Clustering Validation +- Cross Validation + +### Connectivity Models + +- Agglomerative Clustering + - Single Linkage Clustering + - Complete Linkage Clustering + - Unweighted Pair Group Method with Arithmetic Mean (If time permits) +- Dendrograms +- Divisive Clustering +- CURE (Clustering using REpresentatives) algorithm (If time permits) + +### Cluster Evaluation + +- Internal Evaluation + - Dunn Index + - Silhouette Coefficient + - Davies-Bouldin Index (If time permits) +- External Evaluation + - Rand Measure + - Jaccard Index + - Dice Index + - Confusion Matrix + - F Measure (If time permits) + - Fowlkes-Mallows Index (If time permits) + +### Centroid Models + +- Jenks Natural Breaks Optimization +- Voronoi Diagram +- K means clustering +- K medoids clustering +- K Medians/Modes clustering +- When to use K means as opposed to K medoids or K Medians? +- How many clusters should you use? +- Lloyd's Algorithm for Approximating K-means (If time permits) + +### Density Models + +- DBSCAN Density Based Clustering Algorithm +- OPTICS Ordering Points To Identify the Clustering Structure +- DeLi-Clu Density Link Clustering (If time permits) +- What should be your density threshold? + +### Analysis of Model Appropriateness + +- When do we use each of the models above? + +### Distribution Models (If time permits) + +- Fuzzy Clusters +- EM (Expectation Maximization) Clustering +- Maximum Likelihood Gaussian +- Probabilistic Hierarchal Clustering + + + + +## Textbooks + +Cluster Analysis 5th Edition + +- Authors: Brian S. Everitt, Sabine Landau, Morven Leese, Daniel Stahl +- ISBN-13: 978-0470749913 +- Cost: Free on UMW Library Site +- Amazon Link: https://www.amazon.com/Cluster-Analysis-Brian-S-Everitt/dp/0470749911/ref=sr_1_1?ie=UTF8&qid=1509135983&sr=8-1 +- Table of Contents: http://www.wiley.com/WileyCDA/WileyTitle/productCd-EHEP002266.html + +Cluster Analysis: 2014 Edition (Statistical Associates Blue Book Series 24) + +- Author: David Garson +- ISBN: 978-1-62638-030-1 +- Cost: Free with Site Registration +- Website: http://www.statisticalassociates.com/clusteranalysis.htm + + + +## Schedule + +In an ideal world, the topics below I estimated being a certain time period for learning them. Of course you have more experience when it comes to how long it actually takes to learn these topics, so I'll leave this mostly to your discretion. + +**Distance, Dimensionality Reduction, and Tendency** -- 3 Weeks + +**Validating Cluster Models** -- 1 Week + +**Connectivity Models** -- 2 Weeks + +**Cluster Evaluation** -- 1 Week + +**Centroid Models** -- 3 Weeks + +**Density Models** -- 3 Weeks + +**Analysis of Model Appropriateness** -- 1 Week + +The schedule above accounts for 14 weeks, so there is a week that is free as a buffer. + +## Conclusion + +Creating this document got me really excited for this independent study. Feel free to give me feedback :) \ No newline at end of file diff --git a/static/files/research/ExpeditedLearningInteractiveDemo.pptx b/static/files/research/ExpeditedLearningInteractiveDemo.pptx new file mode 100644 index 0000000..739ea7a Binary files /dev/null and b/static/files/research/ExpeditedLearningInteractiveDemo.pptx differ diff --git a/static/files/research/LUNAC.pdf b/static/files/research/LUNAC.pdf new file mode 100644 index 0000000..12ac30c Binary files /dev/null and b/static/files/research/LUNAC.pdf differ diff --git a/static/files/research/LUNACposter.pdf b/static/files/research/LUNACposter.pdf new file mode 100644 index 0000000..675ff16 Binary files /dev/null and b/static/files/research/LUNACposter.pdf differ diff --git a/static/files/research/Measuresofsimilarity.pdf b/static/files/research/Measuresofsimilarity.pdf new file mode 100644 index 0000000..9c30b26 Binary files /dev/null and b/static/files/research/Measuresofsimilarity.pdf differ diff --git a/static/files/research/QEP.pptx b/static/files/research/QEP.pptx new file mode 100644 index 0000000..88a55ea Binary files /dev/null and b/static/files/research/QEP.pptx differ diff --git a/static/files/research/TheBanditReport.pdf b/static/files/research/TheBanditReport.pdf new file mode 100644 index 0000000..c9eac4b Binary files /dev/null and b/static/files/research/TheBanditReport.pdf differ diff --git a/static/files/research/coherentcontrolofatomicpopulation.pdf b/static/files/research/coherentcontrolofatomicpopulation.pdf new file mode 100644 index 0000000..7b7547d Binary files /dev/null and b/static/files/research/coherentcontrolofatomicpopulation.pdf differ diff --git a/static/files/research/honorsthesis.pdf b/static/files/research/honorsthesis.pdf new file mode 100644 index 0000000..7a1a64c Binary files /dev/null and b/static/files/research/honorsthesis.pdf differ diff --git a/static/files/research/modellingpopulationdynamics.pdf b/static/files/research/modellingpopulationdynamics.pdf new file mode 100644 index 0000000..b8ad0f8 Binary files /dev/null and b/static/files/research/modellingpopulationdynamics.pdf differ diff --git a/static/files/slides/embezzlement.pdf b/static/files/slides/embezzlement.pdf new file mode 100644 index 0000000..2445365 Binary files /dev/null and b/static/files/slides/embezzlement.pdf differ diff --git a/static/files/slides/similyrics.pdf b/static/files/slides/similyrics.pdf new file mode 100644 index 0000000..be5768f Binary files /dev/null and b/static/files/slides/similyrics.pdf differ diff --git a/static/files/umwlug/audio.pdf b/static/files/umwlug/audio.pdf new file mode 100644 index 0000000..4acd857 Binary files /dev/null and b/static/files/umwlug/audio.pdf differ diff --git a/static/files/umwlug/darklogo.pdf b/static/files/umwlug/darklogo.pdf new file mode 100644 index 0000000..12e1a78 Binary files /dev/null and b/static/files/umwlug/darklogo.pdf differ diff --git a/static/files/umwlug/interestfall2018.pdf b/static/files/umwlug/interestfall2018.pdf new file mode 100644 index 0000000..597b93f Binary files /dev/null and b/static/files/umwlug/interestfall2018.pdf differ diff --git a/static/files/umwlug/interestfall2019.pdf b/static/files/umwlug/interestfall2019.pdf new file mode 100644 index 0000000..fe00b3b Binary files /dev/null and b/static/files/umwlug/interestfall2019.pdf differ diff --git a/static/files/umwlug/interestspring2018.pdf b/static/files/umwlug/interestspring2018.pdf new file mode 100644 index 0000000..1029429 Binary files /dev/null and b/static/files/umwlug/interestspring2018.pdf differ diff --git a/static/files/umwlug/interestspring2019.pdf b/static/files/umwlug/interestspring2019.pdf new file mode 100644 index 0000000..585fda7 Binary files /dev/null and b/static/files/umwlug/interestspring2019.pdf differ diff --git a/static/files/umwlug/linuxvunix.pdf b/static/files/umwlug/linuxvunix.pdf new file mode 100644 index 0000000..7ad9393 Binary files /dev/null and b/static/files/umwlug/linuxvunix.pdf differ diff --git a/static/files/umwlug/logo.pdf b/static/files/umwlug/logo.pdf new file mode 100644 index 0000000..0af54a3 Binary files /dev/null and b/static/files/umwlug/logo.pdf differ diff --git a/static/files/umwlug/petertalk.pdf b/static/files/umwlug/petertalk.pdf new file mode 100644 index 0000000..4252daf Binary files /dev/null and b/static/files/umwlug/petertalk.pdf differ diff --git a/static/files/umwlug/tedtalk.pdf b/static/files/umwlug/tedtalk.pdf new file mode 100644 index 0000000..98bb926 Binary files /dev/null and b/static/files/umwlug/tedtalk.pdf differ diff --git a/static/img/avatar.jpg b/static/img/avatar.jpg new file mode 100644 index 0000000..d2211a1 Binary files /dev/null and b/static/img/avatar.jpg differ diff --git a/static/img/favicon.ico b/static/img/favicon.ico new file mode 100644 index 0000000..45008d3 Binary files /dev/null and b/static/img/favicon.ico differ diff --git a/static/keybase.txt b/static/keybase.txt new file mode 100644 index 0000000..a3fbedb --- /dev/null +++ b/static/keybase.txt @@ -0,0 +1,52 @@ +I hereby claim: + + * I am an admin of https://brandonrozek.com + * I am brozek (https://keybase.io/brozek) on keybase. + * I have a public key ASC0uPV8wQGhrA_JFkaY6D5SL6CRDzAttViMipmFf1EOKwo + +To do so, I am signing this object: + +{ + "body": { + "key": { + "eldest_kid": "0120b4b8f57cc101a1ac0fc9164698e83e522fa0910f302db5588c8a99857f510e2b0a", + "host": "keybase.io", + "kid": "0120b4b8f57cc101a1ac0fc9164698e83e522fa0910f302db5588c8a99857f510e2b0a", + "uid": "b0a95fe14c44e3d6e1ef5ea1db76ab19", + "username": "brozek" + }, + "merkle_root": { + "ctime": 1562016085, + "hash": "9d7341ba1f1f7ead60bbe053b2225a0da4e176a1f01ad03028b44e2de63fbf336b13020603665a2fb03925b9bca198fbcd1afbcfdc48890174ed853cc29180f2", + "hash_meta": "35592527e7fa28f64e609af892ddb7037dda26e0878fde7962ce0a0ed60323b8", + "seqno": 5675461 + }, + "service": { + "entropy": "QwM0YfSruvMgRiQV2182C6pZ", + "hostname": "brandonrozek.com", + "protocol": "https:" + }, + "type": "web_service_binding", + "version": 2 + }, + "client": { + "name": "keybase.io go client", + "version": "4.1.0" + }, + "ctime": 1562016093, + "expire_in": 504576000, + "prev": "1ea3c48ec49efb4b553666f56bd00cb0e72ae392d7e23ec08b0bc328e969c7e8", + "seqno": 10, + "tag": "signature" +} + +which yields the signature: + +hKRib2R5hqhkZXRhY2hlZMOpaGFzaF90eXBlCqNrZXnEIwEgtLj1fMEBoawPyRZGmOg+Ui+gkQ8wLbVYjIqZhX9RDisKp3BheWxvYWTESpcCCsQgHqPEjsSe+0tVNmb1a9AMsOcq45LX4j7AiwvDKOlpx+jEIFxHhuW7Qvb5oaOYfQoajEH+4c6mibK2jItcswgs3dCHAgHCo3NpZ8RAJ2Zyb+G2p6WYAlp9hZ5kH1/A1hI6CEBpMezqTvrBSolFBanObkYFSemGHh3vCUDgRJRT96HyA/J4fIGqf6MxDKhzaWdfdHlwZSCkaGFzaIKkdHlwZQildmFsdWXEIC7Cc/7oKz5F/YYU7PGRgxD4HPxOqUnhqT+PYC7zlp5Vo3RhZ80CAqd2ZXJzaW9uAQ== + +And finally, I am proving ownership of this host by posting or +appending to this document. + +View my publicly-auditable identity here: https://keybase.io/brozek + +