From 6f83c52930aa6c36bdcb8352be6c59bc41ab2940 Mon Sep 17 00:00:00 2001 From: <> Date: Thu, 12 Oct 2023 23:44:44 +0000 Subject: [PATCH] Deployed ab31ef7 with MkDocs version: 1.5.3 --- .nojekyll | 0 404.html | 478 + .../index.html | 1165 ++ assets/images/favicon.png | Bin 0 -> 1870 bytes assets/javascripts/bundle.59e7e423.min.js | 3 + assets/javascripts/lunr/min/lunr.ar.min.js | 1 + assets/javascripts/lunr/min/lunr.da.min.js | 18 + assets/javascripts/lunr/min/lunr.de.min.js | 18 + assets/javascripts/lunr/min/lunr.du.min.js | 18 + assets/javascripts/lunr/min/lunr.es.min.js | 18 + assets/javascripts/lunr/min/lunr.fi.min.js | 18 + assets/javascripts/lunr/min/lunr.fr.min.js | 18 + assets/javascripts/lunr/min/lunr.he.min.js | 1 + assets/javascripts/lunr/min/lunr.hi.min.js | 1 + assets/javascripts/lunr/min/lunr.hu.min.js | 18 + assets/javascripts/lunr/min/lunr.hy.min.js | 1 + assets/javascripts/lunr/min/lunr.it.min.js | 18 + assets/javascripts/lunr/min/lunr.ja.min.js | 1 + assets/javascripts/lunr/min/lunr.jp.min.js | 1 + assets/javascripts/lunr/min/lunr.kn.min.js | 1 + assets/javascripts/lunr/min/lunr.ko.min.js | 1 + assets/javascripts/lunr/min/lunr.multi.min.js | 1 + assets/javascripts/lunr/min/lunr.nl.min.js | 18 + assets/javascripts/lunr/min/lunr.no.min.js | 18 + assets/javascripts/lunr/min/lunr.pt.min.js | 18 + assets/javascripts/lunr/min/lunr.ro.min.js | 18 + assets/javascripts/lunr/min/lunr.ru.min.js | 18 + assets/javascripts/lunr/min/lunr.sa.min.js | 1 + .../lunr/min/lunr.stemmer.support.min.js | 1 + assets/javascripts/lunr/min/lunr.sv.min.js | 18 + assets/javascripts/lunr/min/lunr.ta.min.js | 1 + assets/javascripts/lunr/min/lunr.te.min.js | 1 + assets/javascripts/lunr/min/lunr.th.min.js | 1 + assets/javascripts/lunr/min/lunr.tr.min.js | 18 + assets/javascripts/lunr/min/lunr.vi.min.js | 1 + assets/javascripts/lunr/min/lunr.zh.min.js | 1 + assets/javascripts/lunr/tinyseg.js | 206 + assets/javascripts/lunr/wordcut.js | 6708 +++++++ .../workers/search.1e90e0fb.min.js | 2 + assets/stylesheets/main.13544b29.min.css | 1 + assets/stylesheets/palette.ab4e12ef.min.css | 1 + ...ommunicating-breaking-the-project-down.png | Bin 0 -> 85069 bytes images/communicating-fan-not-fan.png | Bin 0 -> 174685 bytes images/communicating-removing-roadblocks.jpeg | Bin 0 -> 139807 bytes ...-whos-it-for-what-do-they-need-to-know.png | Bin 0 -> 224977 bytes images/dog-photo-1.jpeg | Bin 0 -> 495206 bytes images/dog-photo-2.jpeg | Bin 0 -> 245858 bytes images/dog-photo-3.jpeg | Bin 0 -> 232067 bytes images/heart-disease-analysis.png | Bin 0 -> 95219 bytes ...l-framework-tools-matplotlib-highlight.png | Bin 0 -> 483423 bytes ...matplotlib-anatomy-of-a-plot-with-code.png | Bin 0 -> 670481 bytes images/matplotlib-anatomy-of-a-plot.png | Bin 0 -> 378254 bytes images/matplotlib-heart-disease-analysis.png | Bin 0 -> 75081 bytes ...eart-disease-chol-age-plot-cmap-change.png | Bin 0 -> 34780 bytes ...tlib-heart-disease-chol-age-plot-saved.png | Bin 0 -> 35042 bytes ...isease-chol-age-plot-seaborn-whitegrid.png | Bin 0 -> 27262 bytes ...matplotlib-heart-disease-chol-age-plot.png | Bin 0 -> 35453 bytes images/matplotlib-simple-plot.png | Bin 0 -> 22339 bytes images/ml101-6-step-ml-framework-tools.png | Bin 0 -> 510997 bytes images/ml101-6-step-ml-framework.png | Bin 0 -> 332025 bytes images/ml101-different-data-types.png | Bin 0 -> 490111 bytes images/ml101-ml-inputs-and-outputs.png | Bin 0 -> 77943 bytes ...-to-take-in-a-machine-learning-project.png | Bin 0 -> 364776 bytes images/ml101-two-data-tables.png | Bin 0 -> 543759 bytes ...tep-ml-framework-tools-numpy-highlight.png | Bin 0 -> 483209 bytes images/numpy-anatomy-of-a-numpy-array.png | Bin 0 -> 423357 bytes images/numpy-anatomy-of-an-array-updated.png | Bin 0 -> 292322 bytes images/numpy-car-photo.png | Bin 0 -> 563421 bytes images/numpy-dog-photo.png | Bin 0 -> 495206 bytes images/numpy-panda.jpeg | Bin 0 -> 246537 bytes ...as-6-step-ml-framework-tools-highlight.png | Bin 0 -> 479391 bytes images/pandas-anatomy-of-a-dataframe.png | Bin 0 -> 341236 bytes images/pandas-car-sales-csv.png | Bin 0 -> 517643 bytes images/pandas-car-sales-dataframe.png | Bin 0 -> 48384 bytes images/pandas-dataframe-anatomy.png | Bin 0 -> 103319 bytes images/pandas-dataframe-zero-indexed.png | Bin 0 -> 81538 bytes images/pandas-docs-img.png | Bin 0 -> 178819 bytes images/pandas-exported-car-sales-csv.png | Bin 0 -> 449231 bytes images/pandas-exported-patient-data-csv.png | Bin 0 -> 457146 bytes images/pandas-google-search-problem.png | Bin 0 -> 178402 bytes images/pandas-jupyter-notebook.png | Bin 0 -> 524346 bytes images/pandas-stack-overflow-question.png | Bin 0 -> 184145 bytes images/pandas-stackoverflow-answers.png | Bin 0 -> 293334 bytes ...pandas-steps-in-stack-overflow-process.png | Bin 0 -> 412375 bytes images/simple-plot.png | Bin 0 -> 32451 bytes ...framework-tools-scikit-learn-highlight.png | Bin 0 -> 479381 bytes images/sklearn-classification-report.png | Bin 0 -> 79807 bytes images/sklearn-confusion-matrix-anatomy.png | Bin 0 -> 215950 bytes images/sklearn-cross-validation.png | Bin 0 -> 141053 bytes images/sklearn-docstring.png | Bin 0 -> 624652 bytes images/sklearn-hyperparameter-tuning-oven.png | Bin 0 -> 314733 bytes .../sklearn-intro-jupyter-notebook-header.png | Bin 0 -> 693272 bytes ...map-cheatsheet-boston-housing-ensemble.png | Bin 0 -> 725063 bytes ...ml-map-cheatsheet-boston-housing-ridge.png | Bin 0 -> 716760 bytes ...cheatsheet-california-housing-ensemble.png | Bin 0 -> 455560 bytes ...ap-cheatsheet-california-housing-ridge.png | Bin 0 -> 451207 bytes ...-map-cheatsheet-heart-disease-ensemble.png | Bin 0 -> 753590 bytes ...ap-cheatsheet-heart-disease-linear-svc.png | Bin 0 -> 740557 bytes images/sklearn-ml-map.png | Bin 0 -> 761071 bytes images/sklearn-train-valid-test-annotated.png | Bin 0 -> 385353 bytes images/sklearn-train-valid-test-sets.png | Bin 0 -> 145406 bytes images/sklearn-user-guide.png | Bin 0 -> 789201 bytes .../sklearn-whats-happening-with-pipeline.png | Bin 0 -> 410476 bytes images/sklearn-workflow-title.png | Bin 0 -> 293488 bytes images/sklearn-workflow.png | Bin 0 -> 272659 bytes ...ts-6-step-ml-framework-tools-highlight.png | Bin 0 -> 480332 bytes ...lassification-jupyter-notebook-header.jpeg | Bin 0 -> 181024 bytes ...s-classification-shift-tab-on-function.png | Bin 0 -> 665353 bytes ...ts-regression-jupyter-notebook-header.jpeg | Bin 0 -> 221431 bytes ...jects-regression-shift-tab-on-function.png | Bin 0 -> 705413 bytes ...nstructured-data-colab-notebook-header.png | Bin 0 -> 798858 bytes ...ctured-data-colab-runtime-disconnected.png | Bin 0 -> 35535 bytes .../unstructured-data-docstring-in-colab.png | Bin 0 -> 658103 bytes images/unstructured-data-dog-photos.png | Bin 0 -> 29241 bytes .../unstructured-data-google-colab-icon.png | Bin 0 -> 5500 bytes ...uctured-data-google-drive-disconnected.png | Bin 0 -> 27732 bytes ...kaggle-dog-breed-identification Large.jpeg | Bin 0 -> 171024 bytes ...-data-kaggle-dog-breed-identification.jpeg | Bin 0 -> 171024 bytes images/unstructured-data-neural-network.png | Bin 0 -> 28618 bytes images/unstructured-data-nvidia-gpu.png | Bin 0 -> 144950 bytes ...ata-object-detection-self-driving-car.jpeg | Bin 0 -> 18437 bytes ...structured-data-object-detection-yolo.jpeg | Bin 0 -> 32176 bytes ...ctured-data-resnet50-backbone-at-tesla.png | Bin 0 -> 338643 bytes .../unstructured-data-tensorflow-guide.jpeg | Bin 0 -> 183357 bytes ...red-data-tensorflow-hub-logo-fullcolor.png | Bin 0 -> 10740 bytes ...red-data-tensorflow-hub-logo-fullcolor.svg | 1 + images/unstructured-data-tensorflow-logo.png | Bin 0 -> 15686 bytes .../unstructured-data-tensorflow-workflow.png | Bin 0 -> 249461 bytes .../unstructured-data-tesnorflow-workflow.png | Bin 0 -> 286928 bytes index.html | 520 + introduction-to-matplotlib/index.html | 8030 ++++++++ introduction-to-numpy/index.html | 8143 ++++++++ introduction-to-pandas/index.html | 9576 +++++++++ introduction-to-scikit-learn/index.html | 16082 ++++++++++++++++ search/search_index.json | 1 + sitemap.xml | 3 + sitemap.xml.gz | Bin 0 -> 127 bytes 137 files changed, 51206 insertions(+) create mode 100644 .nojekyll create mode 100644 404.html create mode 100644 a-6-step-framework-for-approaching-machine-learning-projects/index.html create mode 100644 assets/images/favicon.png create mode 100644 assets/javascripts/bundle.59e7e423.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ar.min.js create mode 100644 assets/javascripts/lunr/min/lunr.da.min.js create mode 100644 assets/javascripts/lunr/min/lunr.de.min.js create mode 100644 assets/javascripts/lunr/min/lunr.du.min.js create mode 100644 assets/javascripts/lunr/min/lunr.es.min.js create mode 100644 assets/javascripts/lunr/min/lunr.fi.min.js create mode 100644 assets/javascripts/lunr/min/lunr.fr.min.js create mode 100644 assets/javascripts/lunr/min/lunr.he.min.js create mode 100644 assets/javascripts/lunr/min/lunr.hi.min.js create mode 100644 assets/javascripts/lunr/min/lunr.hu.min.js create mode 100644 assets/javascripts/lunr/min/lunr.hy.min.js create mode 100644 assets/javascripts/lunr/min/lunr.it.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ja.min.js create mode 100644 assets/javascripts/lunr/min/lunr.jp.min.js create mode 100644 assets/javascripts/lunr/min/lunr.kn.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ko.min.js create mode 100644 assets/javascripts/lunr/min/lunr.multi.min.js create mode 100644 assets/javascripts/lunr/min/lunr.nl.min.js create mode 100644 assets/javascripts/lunr/min/lunr.no.min.js create mode 100644 assets/javascripts/lunr/min/lunr.pt.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ro.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ru.min.js create mode 100644 assets/javascripts/lunr/min/lunr.sa.min.js create mode 100644 assets/javascripts/lunr/min/lunr.stemmer.support.min.js create mode 100644 assets/javascripts/lunr/min/lunr.sv.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ta.min.js create mode 100644 assets/javascripts/lunr/min/lunr.te.min.js create mode 100644 assets/javascripts/lunr/min/lunr.th.min.js create mode 100644 assets/javascripts/lunr/min/lunr.tr.min.js create mode 100644 assets/javascripts/lunr/min/lunr.vi.min.js create mode 100644 assets/javascripts/lunr/min/lunr.zh.min.js create mode 100644 assets/javascripts/lunr/tinyseg.js create mode 100644 assets/javascripts/lunr/wordcut.js create mode 100644 assets/javascripts/workers/search.1e90e0fb.min.js create mode 100644 assets/stylesheets/main.13544b29.min.css create mode 100644 assets/stylesheets/palette.ab4e12ef.min.css create mode 100644 images/communicating-breaking-the-project-down.png create mode 100644 images/communicating-fan-not-fan.png create mode 100644 images/communicating-removing-roadblocks.jpeg create mode 100644 images/communicating-whos-it-for-what-do-they-need-to-know.png create mode 100644 images/dog-photo-1.jpeg create mode 100644 images/dog-photo-2.jpeg create mode 100644 images/dog-photo-3.jpeg create mode 100644 images/heart-disease-analysis.png create mode 100644 images/matplotlib-6-step-ml-framework-tools-matplotlib-highlight.png create mode 100644 images/matplotlib-anatomy-of-a-plot-with-code.png create mode 100644 images/matplotlib-anatomy-of-a-plot.png create mode 100644 images/matplotlib-heart-disease-analysis.png create mode 100644 images/matplotlib-heart-disease-chol-age-plot-cmap-change.png create mode 100644 images/matplotlib-heart-disease-chol-age-plot-saved.png create mode 100644 images/matplotlib-heart-disease-chol-age-plot-seaborn-whitegrid.png create mode 100644 images/matplotlib-heart-disease-chol-age-plot.png create mode 100644 images/matplotlib-simple-plot.png create mode 100644 images/ml101-6-step-ml-framework-tools.png create mode 100644 images/ml101-6-step-ml-framework.png create mode 100644 images/ml101-different-data-types.png create mode 100644 images/ml101-ml-inputs-and-outputs.png create mode 100644 images/ml101-steps-to-take-in-a-machine-learning-project.png create mode 100644 images/ml101-two-data-tables.png create mode 100644 images/numpy-6-step-ml-framework-tools-numpy-highlight.png create mode 100644 images/numpy-anatomy-of-a-numpy-array.png create mode 100644 images/numpy-anatomy-of-an-array-updated.png create mode 100644 images/numpy-car-photo.png create mode 100644 images/numpy-dog-photo.png create mode 100644 images/numpy-panda.jpeg create mode 100644 images/pandas-6-step-ml-framework-tools-highlight.png create mode 100644 images/pandas-anatomy-of-a-dataframe.png create mode 100644 images/pandas-car-sales-csv.png create mode 100644 images/pandas-car-sales-dataframe.png create mode 100644 images/pandas-dataframe-anatomy.png create mode 100644 images/pandas-dataframe-zero-indexed.png create mode 100644 images/pandas-docs-img.png create mode 100644 images/pandas-exported-car-sales-csv.png create mode 100644 images/pandas-exported-patient-data-csv.png create mode 100644 images/pandas-google-search-problem.png create mode 100644 images/pandas-jupyter-notebook.png create mode 100644 images/pandas-stack-overflow-question.png create mode 100644 images/pandas-stackoverflow-answers.png create mode 100644 images/pandas-steps-in-stack-overflow-process.png create mode 100644 images/simple-plot.png create mode 100644 images/sklearn-6-step-ml-framework-tools-scikit-learn-highlight.png create mode 100644 images/sklearn-classification-report.png create mode 100644 images/sklearn-confusion-matrix-anatomy.png create mode 100644 images/sklearn-cross-validation.png create mode 100644 images/sklearn-docstring.png create mode 100644 images/sklearn-hyperparameter-tuning-oven.png create mode 100644 images/sklearn-intro-jupyter-notebook-header.png create mode 100644 images/sklearn-ml-map-cheatsheet-boston-housing-ensemble.png create mode 100644 images/sklearn-ml-map-cheatsheet-boston-housing-ridge.png create mode 100644 images/sklearn-ml-map-cheatsheet-california-housing-ensemble.png create mode 100644 images/sklearn-ml-map-cheatsheet-california-housing-ridge.png create mode 100644 images/sklearn-ml-map-cheatsheet-heart-disease-ensemble.png create mode 100644 images/sklearn-ml-map-cheatsheet-heart-disease-linear-svc.png create mode 100644 images/sklearn-ml-map.png create mode 100644 images/sklearn-train-valid-test-annotated.png create mode 100644 images/sklearn-train-valid-test-sets.png create mode 100644 images/sklearn-user-guide.png create mode 100644 images/sklearn-whats-happening-with-pipeline.png create mode 100644 images/sklearn-workflow-title.png create mode 100644 images/sklearn-workflow.png create mode 100644 images/supervised-projects-6-step-ml-framework-tools-highlight.png create mode 100644 images/supervised-projects-classification-jupyter-notebook-header.jpeg create mode 100644 images/supervised-projects-classification-shift-tab-on-function.png create mode 100644 images/supervised-projects-regression-jupyter-notebook-header.jpeg create mode 100644 images/supervised-projects-regression-shift-tab-on-function.png create mode 100644 images/unstructured-data-colab-notebook-header.png create mode 100644 images/unstructured-data-colab-runtime-disconnected.png create mode 100644 images/unstructured-data-docstring-in-colab.png create mode 100644 images/unstructured-data-dog-photos.png create mode 100644 images/unstructured-data-google-colab-icon.png create mode 100644 images/unstructured-data-google-drive-disconnected.png create mode 100644 images/unstructured-data-kaggle-dog-breed-identification Large.jpeg create mode 100644 images/unstructured-data-kaggle-dog-breed-identification.jpeg create mode 100644 images/unstructured-data-neural-network.png create mode 100644 images/unstructured-data-nvidia-gpu.png create mode 100644 images/unstructured-data-object-detection-self-driving-car.jpeg create mode 100644 images/unstructured-data-object-detection-yolo.jpeg create mode 100644 images/unstructured-data-resnet50-backbone-at-tesla.png create mode 100644 images/unstructured-data-tensorflow-guide.jpeg create mode 100644 images/unstructured-data-tensorflow-hub-logo-fullcolor.png create mode 100644 images/unstructured-data-tensorflow-hub-logo-fullcolor.svg create mode 100644 images/unstructured-data-tensorflow-logo.png create mode 100644 images/unstructured-data-tensorflow-workflow.png create mode 100644 images/unstructured-data-tesnorflow-workflow.png create mode 100644 index.html create mode 100644 introduction-to-matplotlib/index.html create mode 100644 introduction-to-numpy/index.html create mode 100644 introduction-to-pandas/index.html create mode 100644 introduction-to-scikit-learn/index.html create mode 100644 search/search_index.json create mode 100644 sitemap.xml create mode 100644 sitemap.xml.gz diff --git a/.nojekyll b/.nojekyll new file mode 100644 index 000000000..e69de29bb diff --git a/404.html b/404.html new file mode 100644 index 000000000..fedfaf49e --- /dev/null +++ b/404.html @@ -0,0 +1,478 @@ + + + +
+ + + + + + + + + + + + + + + + + + + +Machine learning is broad. The media makes it sound like magic. Reading this article will change that. It will give you an overview of the most common types of problems machine learning can be used for. And at the same time give you a framework to approach your future machine learning proof of concept projects.
+First, we’ll clear up some definitions.
+How is machine learning, artificial intelligence and data science different?
+These three topics can be hard to understand because there are no formal definitions. Even after being a machine learning engineer for over a year, I don’t have a good answer to this question. I’d be suspicious of anyone who claims they do.
+To avoid confusion, we’ll keep it simple. For this article, you can consider machine learning the process of finding patterns in data to understand something more or to predict some kind of future event.
+The following steps have a bias towards building something and seeing how it works. Learning by doing.
+A machine learning pipeline can be broken down into three major steps. Data collection, data modelling and deployment. All influence one another.
+You may start a project by collecting data, model it, realise the data you collected was poor, go back to collecting data, model it again, find a good model, deploy it, find it doesn’t work, make another model, deploy it, find it doesn’t work again, go back to data collection. It’s a cycle.
+Wait, what does model mean? What’s does deploy mean? How do I collect data?
+Great questions.
+How you collect data will depend on your problem. We will look at examples in a minute. But one way could be your customer purchases in a spreadsheet.
+Modelling refers to using a machine learning algorithm to find insights within your collected data.
+What’s the difference between a normal algorithm and a machine learning algorithm?
+Like a cooking recipe for your favourite chicken dish, a normal algorithm is a set of instructions on how to turn a set of ingredients into that honey mustard masterpiece.
+What makes a machine learning algorithm different is instead of having the set of instructions, you start with the ingredients and the final dish ready to go. The machine learning algorithm then looks at the ingredients and the final dish and works out the set of instructions.
+There are many different types of machine learning algorithms and some perform better than others on different problems. But the premise remains, they all have the goal of finding patterns or sets of instructions in data.
+Deployment is taking your set of instructions and using it in an application. This application could be anything from recommending products to customers on your online store to a hospital trying to better predict disease presence.
+The specifics of these steps will be different for each project. But the principles within each remain similar.
+This article focuses on data modelling. It assumes you have already collected data, and are looking to build a machine learning proof of concept with it. Let’s break down how you might approach it.
++ |
---|
Machine learning projects can be broken into three steps, data collection, data modelling and deployment. This article focuses on steps within the data modelling phase and assumes you already have data. Full version on Whimsical. | +
Let’s dive a little deeper in each.
+To help decide whether or not your business could use machine learning, the first step is to match the business problem you’re trying to solve a machine learning problem.
+The four major types of machine learning are supervised learning, unsupervised learning, transfer learning and reinforcement learning (there’s semi-supervised as well but I’ve left it out for brevity). The three most used in business applications are supervised learning, unsupervised learning and transfer learning.
+Supervised learning, is called supervised because you have data and labels. A machine learning algorithm tries to learn what patterns in the data lead to the labels. The supervised part happens during training. If the algorithm guesses a wrong label, it tries to correct itself.
+For example, if you were trying to predict heart disease in a new patient. You may have the anonymised medical records of 100 patients as the data and whether or not they had heart disease as the label.
+A machine learning algorithm could look at the medical records (inputs) and whether or not a patient had heart disease (outputs) and then figure out what patterns in the medical records lead to heart disease.
+Once you’ve got a trained algorithm, you could pass through the medical records (input) of a new patient through it and get a prediction of whether or not they have heart disease (output). It’s important to remember this prediction isn’t certain. It comes back as a probability.
+The algorithm says, “based on what I’ve seen before, it looks like this new patients medical records are 70% aligned to those who have heart disease.”
+Unsupervised learning is when you have data but no labels. The data could be the purchase history of your online video game store customers. Using this data, you may want to group similar customers together so you can offer them specialised deals. You could use a machine learning algorithm to group your customers by purchase history.
+After inspecting the groups, you provide the labels. There may be a group interested in computer games, another group who prefer console games and another which only buy discounted older games. This is called clustering.
+What’s important to remember here is the algorithm did not provide these labels. It found the patterns between similar customers and using your domain knowledge, you provided the labels.
+Transfer learning is when you take the information an existing machine learning model has learned and adjust it to your own problem.
+Training a machine learning model from scratch can be expensive and time-consuming. The good news is, you don’t always have to. When machine learning algorithms find patterns in one kind of data, these patterns can be used in another type of data.
+Let’s say you’re a car insurance company and wanted to build a text classification model to classify whether or not someone submitting an insurance claim for a car accident is at fault (caused the accident) or not at fault (didn’t cause the accident).
+You could start with an existing text model, one which has read all of Wikipedia and has remembered all the patterns between different words, such as, which word is more likely to come next after another. Then using your car insurance claims (data) along with their outcomes (labels), you could tweak the existing text model to your own problem.
+If machine learning can be used in your business, it’s likely it’ll fall under one of these three types of learning. +But let’s break them down further into classification, regression and recommendation.
+Now you know these things, your next step is to define your business problem in machine learning terms.
+Let’s use the car insurance example from before. You receive thousands of claims per day which your staff read and decide whether or not the person sending in the claim is at fault or not.
+But now the number of claims are starting to come in faster than your staff can handle them. You’ve got thousands of examples of past claims which are labelled at fault or not at fault.
+Can machine learning help?
+You already know the answer. But let’s see. Does this problem fit into any of the three above? Classification, regression or recommendation?
+Let’s rephrase it.
+++We’re a car insurance company who want to classify incoming car insurance claims into at fault or not at fault.
+
See the keyword? Classify.
+It turns out, this could potentially be a machine learning classification problem. I say potentially because there’s a chance it might not work.
+When it comes to defining your business problem as a machine learning problem, start simple, more than one sentence is too much. Add complexity when required.
+The data you have or need to collect will depend on the problem you want to solve.
+If you already have data, it’s likely it will be in one of two forms. Structured or unstructured. Within each of these, you have static or streaming data.
+There are overlaps.
+Your static structured table of information may have columns which contain natural language text and photos and be updated constantly.
+For predicting heart disease, one column may be sex, another average heart rate, another average blood pressure, another chest pain intensity.
+For the insurance claim example, one column may be the text a customer has sent in for the claim, another may be the image they’ve sent in along with the text and a final a column being the outcome of the claim. This table gets updated with new claims or altered results of old claims daily.
++ |
---|
Two examples of structured data with different kinds of data within it. Table 1.0 has numerical and categorical data. Table 2.0 has unstructured data with images and natural language text but is presented in a structured manner. | +
The principle remains. You want to use the data you have to gains insights or predict something.
+For supervised learning, this involves using the feature variable(s) to predict the target variable(s). A feature variable for predicting heart disease could be sex with the target variable being whether or not the patient has heart disease.
++ |
---|
Table 1.0 broken into ID column (yellow, not used for building machine learning model), feature variables (orange) and target variables (green). A machine learning model finds the patterns in the feature variables and predicts the target variables. | +
For unsupervised learning, you won’t have labels. But you’ll still want to find patterns. Meaning, grouping together similar samples and finding samples which are outliers.
+For transfer learning, your problem stays a supervised learning problem, except you’re leveraging the patterns machine learning algorithms have learned from other data sources separate from your own.
+Remember, if you’re using a customers data to improve your business or to offer them a better service, it’s important to let them know. This is why you see “this site uses cookies” popups everywhere. The website uses how you browse the site, likely along with some kind of machine learning to improve their offering.
+You’ve defined your business problem in machine learning terms and you have data. Now define what defines success. +There are different evaluation metrics for classification, regression and recommendation problems. Which one you choose will depend on your goal.
+++For this project to be successful, the model needs to be over 95% accurate at whether someone is at fault or not at fault.
+
A 95% accurate model may sound pretty good for predicting who’s at fault in an insurance claim. But for predicting heart disease, you’ll likely want better results.
+Other things you should take into consideration for classification problems.
+For regression problems (where you want to predict a number), you’ll want to minimise the difference between what your model predicts and what the actual value is. If you’re trying to predict the price a house will sell for, you’ll want your model to get as close as possible to the actual price. To do this, use MAE or RMSE.
+Use RMSE if you want large errors to be more significant. Such as, predicting a house to be sold at $300,000 instead of $200,000 and being off by $100,000 is more than twice as bad as being off by $50,000. Or MAE if being off by $100,000 is twice as bad as being off by $50,000.
+Recommendation problems are harder to test in experimentation. One way to do so is to take a portion of your data and hide it away. When your model is built, use it to predict recommendations for the hidden data and see how it lines up.
+Let’s say you’re trying to recommend customers products on your online store. You have historical purchase data from 2010–2019. You could build a model on the 2010–2018 data and then use it to predict 2019 purchases. Then it becomes a classification problem because you’re trying to classify whether or not someone is likely to buy an item.
+However, traditional classification metrics aren’t the best for recommendation problems. Precision and recall have no concept of ordering.
+If your machine learning model returned back a list of 10 recommendations to be displayed to a customer on your website, you’d want the best ones to be displayed first right?
+To begin with, you may not have an exact figure for each of these. But knowing what metrics you should be paying attention to gives you an idea of how to evaluate your machine learning project.
+Not all data is the same. And when you hear someone referring to features, they’re referring to different kinds of data within data.
+The three main types of features are categorical, continuous (or numerical) and derived.
+Categorical features — One or the other(s). For example, in our heart disease problem, the sex of the patient. Or for an online store, whether or not someone has made a purchase or not.
+Continuous (or numerical) features — A numerical value such as average heart rate or the number of times logged in. +Derived features — Features you create from the data. Often referred to as feature engineering. Feature engineering is how a subject matter expert takes their knowledge and encodes it into the data. You might combine the number of times logged in with timestamps to make a feature called time since last login. Or turn dates from numbers into “is a weekday (yes)” and “is a weekday (no)”.
+Text, images and almost anything you can imagine can also be a feature. Regardless, they all get turned into numbers before a machine learning algorithm can model them.
+Some important things to remember when it comes to features.
+You can use features to create a simple baseline metric. A subject matter expert on customer churn may know someone is 80% likely to cancel their membership after 3 weeks of not logging in.
+Or a real estate agent who knows the sale prices of houses might know houses with over 5 bedrooms and 4 bathrooms sell for over $500,000.
+These are simplified and don’t have to be exact. But it’s what you’re going to use to see whether machine learning can improve upon or not.
+Once you’ve defined your problem, prepared your data, evaluation criteria and features it’s time to model.
+Modelling breaks into three parts, choosing a model, improving a model, comparing it with others.
+When choosing a model, you’ll want to take into consideration, interpretability and ease to debug, amount of data, training and prediction limitations.
+To address these, start simple. A state of the art model can be tempting to reach for. But if it requires 10x the compute resources to train and prediction times are 5x longer for a 2% boost in your evaluation metric, it might not be the best choice.
+Linear models such as logistic regression are usually easier to interpret, are very fast for training and predict faster than deeper models such as neural networks.
+But it’s likely your data is from the real world. Data from the real world isn’t always linear.
+What then?
+Ensembles of decision trees and gradient boosted algorithms (fancy words, definitions not important for now) usually work best on structured data, like Excel tables and dataframes. Look into random forests, XGBoost and CatBoost.
++ |
---|
A non-exhaustive example of all the different tools you can use for machine learning/data science. | +
Deep models such as neural networks generally work best on unstructured data like images, audio files and natural language text. However, the trade-off is they usually take longer to train, are harder to debug and prediction time takes longer. But this doesn’t mean you shouldn’t use them.
+Transfer learning is an approach which takes advantage of deep models and linear models. It involves taking a pre-trained deep model and using the patterns it has learned as the inputs to your linear model. This saves dramatically on training time and allows you to experiment faster.
+Where do I find pre-trained models?
+Pre-trained models are available on PyTorch hub, TensorFlow hub, model zoo and within the fast.ai framework. This is a good place to look first for building any kind of proof of concept.
+What about the other kinds of models?
+For building a proof of concept, it’s unlikely you’ll have to ever build your own machine learning model. People have already written code for these.
+What you’ll be focused on is preparing your inputs and outputs in a way they can be used with an existing model. This means having your data and labels strictly defined and understanding what problem you’re trying to solve.
+A model's first results isn’t its last. Like tuning a car, machine learning models can be tuned to improve performance.
+Tuning a model involves changing hyperparameters such as learning rate or optimizer. Or model-specific architecture factors such as number of trees for random forests and number of and type of layers for neural networks.
+These used to be something a practitioner would have to tune by hand but are increasingly becoming automated. And should be wherever possible.
+Using a pre-trained model through transfer learning often has the added benefit of all of these steps been done.
+The priority for tuning and improving models should be reproducibility and efficiency. Someone should be able to reproduce the steps you’ve taken to improve performance. And because your main bottleneck will be model training time, not new ideas to improve, your efforts should be dedicated towards efficiency.
+Compare apples to apples.
+Where model 1 and 2 can vary but not data X or data Y.
+This step involves all the other steps. Because machine learning is a highly iterative process, you’ll want to make sure your experiments are actionable.
+Your biggest goal should be minimising the time between offline experiments and online experiments.
+Offline experiments are steps you take when your project isn’t customer-facing yet. Online experiments happen when your machine learning model is in production.
+All experiments should be conducted on different portions of your data.
+These amounts can fluctuate slightly, depending on your problem and the data you have.
+Poor performance on training data means the model hasn’t learned properly. Try a different model, improve the existing one, collect more data, collect better data.
+Poor performance on test data means your model doesn’t generalise well. Your model may be overfitting the training data. Use a simpler model or collect more data.
+Poor performance once deployed (in the real world) means there’s a difference in what you trained and tested your model on and what is actually happening. Revisit step 1 & 2. Ensure your data matches up with the problem you’re trying to solve.
+When you implement a large experimental change, document what and why. Remember, like model tuning, someone, including your future self, should be able to reproduce what you’ve done.
+This means saving updated models and updated datasets regularly.
+Many businesses have heard of machine learning but aren’t sure where to start. One of the best places to start is to use the six steps above to build a proof of concept.
+A proof of concept should not be seen as something to fundamentally change how your business operates but as an exploration into whether machine learning can bring your business value.
+After all, you’re not after fancy solutions to keep up with the hype. You’re after solutions which add value.
+Put a timeline on a proof of concept, 2, 6 and 12 weeks are good amounts. With good data, a good machine learning and data science practitioner can get 80–90% of the final modelling results in a relatively small timeframe.
+Have your subject matter experts and machine learning engineers and data scientists work together. There is nothing worse than a machine learning engineer building a great model which models the wrong thing.
+If a web designer could improve the layout of an online store to help a machine learning experiment, they should know.
+Remember, due to the nature of proof of concepts, it may turn out machine learning isn’t something your business can take advantage of (unlikely). As a project manager, ensure you’re aware of this. If you are a machine learning engineer or data scientist, be willing to accept your conclusions lead nowhere.
+But all is not lost.
+The value in something not working is now you know what doesn’t work and can direct your efforts elsewhere. This is why setting a timeframe for experiments is helpful. There is never enough time but deadlines work wonders.
+If a machine learning proof of concept turns out well, take another step, if not, step back. Learning by doing is a faster process than thinking about something.
+Each of these steps could deserve an article on their own. I’ll work on it.
+In the meantime, there are some things to note.
+It’s always about the data. Without good data to begin with, no machine learning model will help you. If you want to use machine learning in your business, it starts with good data collection.
+Deployment changes everything. A good model offline doesn’t always mean a good model online. This article has focused on data modelling. Once you deploy a model, there’s infrastructure management, data verification, model retraining, analysis and more. Any cloud provider has services for these but putting them together is still a bit of a dark art. Pay your data engineers well. If you’re data engineer, share what you know.
+Data collection and model deployment are the longest parts of a machine learning pipeline. This article has only focused on modelling. And even then, it misses specifics on how to get your data ready to be modelled (other sections in this repo cover that).
+Tools of the trade vary. Machine learning is big tool comprised of many other tools. From code libraries and frameworks to different deployment architectures. There’s usually several different ways to do the same thing. Best practice is continually being changed. This article focuses on things which don’t.
+ + + + + + + +{"use strict";var za=/["'&<>]/;Xn.exports=qa;function qa(e){var t=""+e,r=za.exec(t);if(!r)return t;var o,n="",i=0,a=0;for(i=r.index;i YgycH(cS2qiCH+GZ@&_muUgA>oPm)+{O
z6lN4A<`a&IKG%O+(%#Nxz8PIEWpYWlk0_U$inZd7&)o=q){if(s=W.limit_backward,W.limit_backward=q,W.ket=W.cursor,e=W.find_among_b(P,7))switch(W.bra=W.cursor,e){case 1:if(l()){if(i=W.limit-W.cursor,!W.eq_s_b(1,"s")&&(W.cursor=W.limit-i,!W.eq_s_b(1,"t")))break;W.slice_del()}break;case 2:W.slice_from("i");break;case 3:W.slice_del();break;case 4:W.eq_s_b(2,"gu")&&W.slice_del()}W.limit_backward=s}}function b(){var e=W.limit-W.cursor;W.find_among_b(U,5)&&(W.cursor=W.limit-e,W.ket=W.cursor,W.cursor>W.limit_backward&&(W.cursor--,W.bra=W.cursor,W.slice_del()))}function d(){for(var e,r=1;W.out_grouping_b(F,97,251);)r--;if(r<=0){if(W.ket=W.cursor,e=W.limit-W.cursor,!W.eq_s_b(1,"é")&&(W.cursor=W.limit-e,!W.eq_s_b(1,"è")))return;W.bra=W.cursor,W.slice_from("e")}}function k(){if(!w()&&(W.cursor=W.limit,!f()&&(W.cursor=W.limit,!m())))return W.cursor=W.limit,void _();W.cursor=W.limit,W.ket=W.cursor,W.eq_s_b(1,"Y")?(W.bra=W.cursor,W.slice_from("i")):(W.cursor=W.limit,W.eq_s_b(1,"ç")&&(W.bra=W.cursor,W.slice_from("c")))}var p,g,q,v=[new r("col",-1,-1),new r("par",-1,-1),new r("tap",-1,-1)],h=[new r("",-1,4),new r("I",0,1),new r("U",0,2),new r("Y",0,3)],z=[new r("iqU",-1,3),new r("abl",-1,3),new r("Ièr",-1,4),new r("ièr",-1,4),new r("eus",-1,2),new r("iv",-1,1)],y=[new r("ic",-1,2),new r("abil",-1,1),new r("iv",-1,3)],C=[new r("iqUe",-1,1),new r("atrice",-1,2),new r("ance",-1,1),new r("ence",-1,5),new r("logie",-1,3),new r("able",-1,1),new r("isme",-1,1),new r("euse",-1,11),new r("iste",-1,1),new r("ive",-1,8),new r("if",-1,8),new r("usion",-1,4),new r("ation",-1,2),new r("ution",-1,4),new r("ateur",-1,2),new r("iqUes",-1,1),new r("atrices",-1,2),new r("ances",-1,1),new r("ences",-1,5),new r("logies",-1,3),new r("ables",-1,1),new r("ismes",-1,1),new r("euses",-1,11),new r("istes",-1,1),new r("ives",-1,8),new r("ifs",-1,8),new r("usions",-1,4),new r("ations",-1,2),new r("utions",-1,4),new r("ateurs",-1,2),new r("ments",-1,15),new r("ements",30,6),new r("issements",31,12),new r("ités",-1,7),new r("ment",-1,15),new r("ement",34,6),new r("issement",35,12),new r("amment",34,13),new r("emment",34,14),new r("aux",-1,10),new r("eaux",39,9),new r("eux",-1,1),new r("ité",-1,7)],x=[new r("ira",-1,1),new r("ie",-1,1),new r("isse",-1,1),new r("issante",-1,1),new r("i",-1,1),new r("irai",4,1),new r("ir",-1,1),new r("iras",-1,1),new r("ies",-1,1),new r("îmes",-1,1),new r("isses",-1,1),new r("issantes",-1,1),new r("îtes",-1,1),new r("is",-1,1),new r("irais",13,1),new r("issais",13,1),new r("irions",-1,1),new r("issions",-1,1),new r("irons",-1,1),new r("issons",-1,1),new r("issants",-1,1),new r("it",-1,1),new r("irait",21,1),new r("issait",21,1),new r("issant",-1,1),new r("iraIent",-1,1),new r("issaIent",-1,1),new r("irent",-1,1),new r("issent",-1,1),new r("iront",-1,1),new r("ît",-1,1),new r("iriez",-1,1),new r("issiez",-1,1),new r("irez",-1,1),new r("issez",-1,1)],I=[new r("a",-1,3),new r("era",0,2),new r("asse",-1,3),new r("ante",-1,3),new r("ée",-1,2),new r("ai",-1,3),new r("erai",5,2),new r("er",-1,2),new r("as",-1,3),new r("eras",8,2),new r("âmes",-1,3),new r("asses",-1,3),new r("antes",-1,3),new r("âtes",-1,3),new r("ées",-1,2),new r("ais",-1,3),new r("erais",15,2),new r("ions",-1,1),new r("erions",17,2),new r("assions",17,3),new r("erons",-1,2),new r("ants",-1,3),new r("és",-1,2),new r("ait",-1,3),new r("erait",23,2),new r("ant",-1,3),new r("aIent",-1,3),new r("eraIent",26,2),new r("èrent",-1,2),new r("assent",-1,3),new r("eront",-1,2),new r("ât",-1,3),new r("ez",-1,2),new r("iez",32,2),new r("eriez",33,2),new r("assiez",33,3),new r("erez",32,2),new r("é",-1,2)],P=[new r("e",-1,3),new r("Ière",0,2),new r("ière",0,2),new r("ion",-1,1),new r("Ier",-1,2),new r("ier",-1,2),new r("ë",-1,4)],U=[new r("ell",-1,-1),new r("eill",-1,-1),new r("enn",-1,-1),new r("onn",-1,-1),new r("ett",-1,-1)],F=[17,65,16,1,0,0,0,0,0,0,0,0,0,0,0,128,130,103,8,5],S=[1,65,20,0,0,0,0,0,0,0,0,0,0,0,0,0,128],W=new s;this.setCurrent=function(e){W.setCurrent(e)},this.getCurrent=function(){return W.getCurrent()},this.stem=function(){var e=W.cursor;return n(),W.cursor=e,u(),W.limit_backward=e,W.cursor=W.limit,k(),W.cursor=W.limit,b(),W.cursor=W.limit,d(),W.cursor=W.limit_backward,o(),!0}};return function(e){return"function"==typeof e.update?e.update(function(e){return i.setCurrent(e),i.stem(),i.getCurrent()}):(i.setCurrent(e),i.stem(),i.getCurrent())}}(),e.Pipeline.registerFunction(e.fr.stemmer,"stemmer-fr"),e.fr.stopWordFilter=e.generateStopWordFilter("ai aie aient aies ait as au aura aurai auraient aurais aurait auras aurez auriez aurions aurons auront aux avaient avais avait avec avez aviez avions avons ayant ayez ayons c ce ceci celà ces cet cette d dans de des du elle en es est et eu eue eues eurent eus eusse eussent eusses eussiez eussions eut eux eûmes eût eûtes furent fus fusse fussent fusses fussiez fussions fut fûmes fût fûtes ici il ils j je l la le les leur leurs lui m ma mais me mes moi mon même n ne nos notre nous on ont ou par pas pour qu que quel quelle quelles quels qui s sa sans se sera serai seraient serais serait seras serez seriez serions serons seront ses soi soient sois soit sommes son sont soyez soyons suis sur t ta te tes toi ton tu un une vos votre vous y à étaient étais était étant étiez étions été étée étées étés êtes".split(" ")),e.Pipeline.registerFunction(e.fr.stopWordFilter,"stopWordFilter-fr")}});
\ No newline at end of file
diff --git a/assets/javascripts/lunr/min/lunr.he.min.js b/assets/javascripts/lunr/min/lunr.he.min.js
new file mode 100644
index 000000000..b863d3eae
--- /dev/null
+++ b/assets/javascripts/lunr/min/lunr.he.min.js
@@ -0,0 +1 @@
+!function(e,r){"function"==typeof define&&define.amd?define(r):"object"==typeof exports?module.exports=r():r()(e.lunr)}(this,function(){return function(e){if(void 0===e)throw new Error("Lunr is not present. Please include / require Lunr before this script.");if(void 0===e.stemmerSupport)throw new Error("Lunr stemmer support is not present. Please include / require Lunr stemmer support before this script.");e.he=function(){this.pipeline.reset(),this.pipeline.add(e.he.trimmer,e.he.stopWordFilter,e.he.stemmer),this.searchPipeline&&(this.searchPipeline.reset(),this.searchPipeline.add(e.he.stemmer))},e.he.wordCharacters="֑-״א-תa-zA-Za-zA-Z0-90-9",e.he.trimmer=e.trimmerSupport.generateTrimmer(e.he.wordCharacters),e.Pipeline.registerFunction(e.he.trimmer,"trimmer-he"),e.he.stemmer=function(){var e=this;return e.result=!1,e.preRemoved=!1,e.sufRemoved=!1,e.pre={pre1:"ה ו י ת",pre2:"ב כ ל מ ש כש",pre3:"הב הכ הל המ הש בש לכ",pre4:"וב וכ ול ומ וש",pre5:"מה שה כל",pre6:"מב מכ מל ממ מש",pre7:"בה בו בי בת כה כו כי כת לה לו לי לת",pre8:"ובה ובו ובי ובת וכה וכו וכי וכת ולה ולו ולי ולת"},e.suf={suf1:"ך כ ם ן נ",suf2:"ים ות וך וכ ום ון ונ הם הן יכ יך ינ ים",suf3:"תי תך תכ תם תן תנ",suf4:"ותי ותך ותכ ותם ותן ותנ",suf5:"נו כם כן הם הן",suf6:"ונו וכם וכן והם והן",suf7:"תכם תכן תנו תהם תהן",suf8:"הוא היא הם הן אני אתה את אנו אתם אתן",suf9:"ני נו כי כו כם כן תי תך תכ תם תן",suf10:"י ך כ ם ן נ ת"},e.patterns=JSON.parse('{"hebrewPatterns": [{"pt1": [{"c": "ה", "l": 0}]}, {"pt2": [{"c": "ו", "l": 0}]}, {"pt3": [{"c": "י", "l": 0}]}, {"pt4": [{"c": "ת", "l": 0}]}, {"pt5": [{"c": "מ", "l": 0}]}, {"pt6": [{"c": "ל", "l": 0}]}, {"pt7": [{"c": "ב", "l": 0}]}, {"pt8": [{"c": "כ", "l": 0}]}, {"pt9": [{"c": "ש", "l": 0}]}, {"pt10": [{"c": "כש", "l": 0}]}, {"pt11": [{"c": "בה", "l": 0}]}, {"pt12": [{"c": "וב", "l": 0}]}, {"pt13": [{"c": "וכ", "l": 0}]}, {"pt14": [{"c": "ול", "l": 0}]}, {"pt15": [{"c": "ומ", "l": 0}]}, {"pt16": [{"c": "וש", "l": 0}]}, {"pt17": [{"c": "הב", "l": 0}]}, {"pt18": [{"c": "הכ", "l": 0}]}, {"pt19": [{"c": "הל", "l": 0}]}, {"pt20": [{"c": "המ", "l": 0}]}, {"pt21": [{"c": "הש", "l": 0}]}, {"pt22": [{"c": "מה", "l": 0}]}, {"pt23": [{"c": "שה", "l": 0}]}, {"pt24": [{"c": "כל", "l": 0}]}]}'),e.execArray=["cleanWord","removeDiacritics","removeStopWords","normalizeHebrewCharacters"],e.stem=function(){var r=0;for(e.result=!1,e.preRemoved=!1,e.sufRemoved=!1;r
=a&&(r=w.limit_backward,w.limit_backward=a,w.ket=w.cursor,e=w.find_among_b(m,29),w.limit_backward=r,e))switch(w.bra=w.cursor,e){case 1:w.slice_del();break;case 2:n=w.limit-w.cursor,w.in_grouping_b(c,98,122)?w.slice_del():(w.cursor=w.limit-n,w.eq_s_b(1,"k")&&w.out_grouping_b(d,97,248)&&w.slice_del());break;case 3:w.slice_from("er")}}function t(){var e,r=w.limit-w.cursor;w.cursor>=a&&(e=w.limit_backward,w.limit_backward=a,w.ket=w.cursor,w.find_among_b(u,2)?(w.bra=w.cursor,w.limit_backward=e,w.cursor=w.limit-r,w.cursor>w.limit_backward&&(w.cursor--,w.bra=w.cursor,w.slice_del())):w.limit_backward=e)}function o(){var e,r;w.cursor>=a&&(r=w.limit_backward,w.limit_backward=a,w.ket=w.cursor,e=w.find_among_b(l,11),e?(w.bra=w.cursor,w.limit_backward=r,1==e&&w.slice_del()):w.limit_backward=r)}var s,a,m=[new r("a",-1,1),new r("e",-1,1),new r("ede",1,1),new r("ande",1,1),new r("ende",1,1),new r("ane",1,1),new r("ene",1,1),new r("hetene",6,1),new r("erte",1,3),new r("en",-1,1),new r("heten",9,1),new r("ar",-1,1),new r("er",-1,1),new r("heter",12,1),new r("s",-1,2),new r("as",14,1),new r("es",14,1),new r("edes",16,1),new r("endes",16,1),new r("enes",16,1),new r("hetenes",19,1),new r("ens",14,1),new r("hetens",21,1),new r("ers",14,1),new r("ets",14,1),new r("et",-1,1),new r("het",25,1),new r("ert",-1,3),new r("ast",-1,1)],u=[new r("dt",-1,-1),new r("vt",-1,-1)],l=[new r("leg",-1,1),new r("eleg",0,1),new r("ig",-1,1),new r("eig",2,1),new r("lig",2,1),new r("elig",4,1),new r("els",-1,1),new r("lov",-1,1),new r("elov",7,1),new r("slov",7,1),new r("hetslov",9,1)],d=[17,65,16,1,0,0,0,0,0,0,0,0,0,0,0,0,48,0,128],c=[119,125,149,1],w=new n;this.setCurrent=function(e){w.setCurrent(e)},this.getCurrent=function(){return w.getCurrent()},this.stem=function(){var r=w.cursor;return e(),w.limit_backward=r,w.cursor=w.limit,i(),w.cursor=w.limit,t(),w.cursor=w.limit,o(),!0}};return function(e){return"function"==typeof e.update?e.update(function(e){return i.setCurrent(e),i.stem(),i.getCurrent()}):(i.setCurrent(e),i.stem(),i.getCurrent())}}(),e.Pipeline.registerFunction(e.no.stemmer,"stemmer-no"),e.no.stopWordFilter=e.generateStopWordFilter("alle at av bare begge ble blei bli blir blitt både båe da de deg dei deim deira deires dem den denne der dere deres det dette di din disse ditt du dykk dykkar då eg ein eit eitt eller elles en enn er et ett etter for fordi fra før ha hadde han hans har hennar henne hennes her hjå ho hoe honom hoss hossen hun hva hvem hver hvilke hvilken hvis hvor hvordan hvorfor i ikke ikkje ikkje ingen ingi inkje inn inni ja jeg kan kom korleis korso kun kunne kva kvar kvarhelst kven kvi kvifor man mange me med medan meg meget mellom men mi min mine mitt mot mykje ned no noe noen noka noko nokon nokor nokre nå når og også om opp oss over på samme seg selv si si sia sidan siden sin sine sitt sjøl skal skulle slik so som som somme somt så sånn til um upp ut uten var vart varte ved vere verte vi vil ville vore vors vort vår være være vært å".split(" ")),e.Pipeline.registerFunction(e.no.stopWordFilter,"stopWordFilter-no")}});
\ No newline at end of file
diff --git a/assets/javascripts/lunr/min/lunr.pt.min.js b/assets/javascripts/lunr/min/lunr.pt.min.js
new file mode 100644
index 000000000..6c16996d6
--- /dev/null
+++ b/assets/javascripts/lunr/min/lunr.pt.min.js
@@ -0,0 +1,18 @@
+/*!
+ * Lunr languages, `Portuguese` language
+ * https://github.com/MihaiValentin/lunr-languages
+ *
+ * Copyright 2014, Mihai Valentin
+ * http://www.mozilla.org/MPL/
+ */
+/*!
+ * based on
+ * Snowball JavaScript Library v0.3
+ * http://code.google.com/p/urim/
+ * http://snowball.tartarus.org/
+ *
+ * Copyright 2010, Oleg Mazko
+ * http://www.mozilla.org/MPL/
+ */
+
+!function(e,r){"function"==typeof define&&define.amd?define(r):"object"==typeof exports?module.exports=r():r()(e.lunr)}(this,function(){return function(e){if(void 0===e)throw new Error("Lunr is not present. Please include / require Lunr before this script.");if(void 0===e.stemmerSupport)throw new Error("Lunr stemmer support is not present. Please include / require Lunr stemmer support before this script.");e.pt=function(){this.pipeline.reset(),this.pipeline.add(e.pt.trimmer,e.pt.stopWordFilter,e.pt.stemmer),this.searchPipeline&&(this.searchPipeline.reset(),this.searchPipeline.add(e.pt.stemmer))},e.pt.wordCharacters="A-Za-zªºÀ-ÖØ-öø-ʸˠ-ˤᴀ-ᴥᴬ-ᵜᵢ-ᵥᵫ-ᵷᵹ-ᶾḀ-ỿⁱⁿₐ-ₜKÅℲⅎⅠ-ↈⱠ-ⱿꜢ-ꞇꞋ-ꞭꞰ-ꞷꟷ-ꟿꬰ-ꭚꭜ-ꭤff-stA-Za-z",e.pt.trimmer=e.trimmerSupport.generateTrimmer(e.pt.wordCharacters),e.Pipeline.registerFunction(e.pt.trimmer,"trimmer-pt"),e.pt.stemmer=function(){var r=e.stemmerSupport.Among,s=e.stemmerSupport.SnowballProgram,n=new function(){function e(){for(var e;;){if(z.bra=z.cursor,e=z.find_among(k,3))switch(z.ket=z.cursor,e){case 1:z.slice_from("a~");continue;case 2:z.slice_from("o~");continue;case 3:if(z.cursor>=z.limit)break;z.cursor++;continue}break}}function n(){if(z.out_grouping(y,97,250)){for(;!z.in_grouping(y,97,250);){if(z.cursor>=z.limit)return!0;z.cursor++}return!1}return!0}function i(){if(z.in_grouping(y,97,250))for(;!z.out_grouping(y,97,250);){if(z.cursor>=z.limit)return!1;z.cursor++}return g=z.cursor,!0}function o(){var e,r,s=z.cursor;if(z.in_grouping(y,97,250))if(e=z.cursor,n()){if(z.cursor=e,i())return}else g=z.cursor;if(z.cursor=s,z.out_grouping(y,97,250)){if(r=z.cursor,n()){if(z.cursor=r,!z.in_grouping(y,97,250)||z.cursor>=z.limit)return;z.cursor++}g=z.cursor}}function t(){for(;!z.in_grouping(y,97,250);){if(z.cursor>=z.limit)return!1;z.cursor++}for(;!z.out_grouping(y,97,250);){if(z.cursor>=z.limit)return!1;z.cursor++}return!0}function a(){var e=z.cursor;g=z.limit,b=g,h=g,o(),z.cursor=e,t()&&(b=z.cursor,t()&&(h=z.cursor))}function u(){for(var e;;){if(z.bra=z.cursor,e=z.find_among(q,3))switch(z.ket=z.cursor,e){case 1:z.slice_from("ã");continue;case 2:z.slice_from("õ");continue;case 3:if(z.cursor>=z.limit)break;z.cursor++;continue}break}}function w(){return g<=z.cursor}function m(){return b<=z.cursor}function c(){return h<=z.cursor}function l(){var e;if(z.ket=z.cursor,!(e=z.find_among_b(F,45)))return!1;switch(z.bra=z.cursor,e){case 1:if(!c())return!1;z.slice_del();break;case 2:if(!c())return!1;z.slice_from("log");break;case 3:if(!c())return!1;z.slice_from("u");break;case 4:if(!c())return!1;z.slice_from("ente");break;case 5:if(!m())return!1;z.slice_del(),z.ket=z.cursor,e=z.find_among_b(j,4),e&&(z.bra=z.cursor,c()&&(z.slice_del(),1==e&&(z.ket=z.cursor,z.eq_s_b(2,"at")&&(z.bra=z.cursor,c()&&z.slice_del()))));break;case 6:if(!c())return!1;z.slice_del(),z.ket=z.cursor,e=z.find_among_b(C,3),e&&(z.bra=z.cursor,1==e&&c()&&z.slice_del());break;case 7:if(!c())return!1;z.slice_del(),z.ket=z.cursor,e=z.find_among_b(P,3),e&&(z.bra=z.cursor,1==e&&c()&&z.slice_del());break;case 8:if(!c())return!1;z.slice_del(),z.ket=z.cursor,z.eq_s_b(2,"at")&&(z.bra=z.cursor,c()&&z.slice_del());break;case 9:if(!w()||!z.eq_s_b(1,"e"))return!1;z.slice_from("ir")}return!0}function f(){var e,r;if(z.cursor>=g){if(r=z.limit_backward,z.limit_backward=g,z.ket=z.cursor,e=z.find_among_b(S,120))return z.bra=z.cursor,1==e&&z.slice_del(),z.limit_backward=r,!0;z.limit_backward=r}return!1}function d(){var e;z.ket=z.cursor,(e=z.find_among_b(W,7))&&(z.bra=z.cursor,1==e&&w()&&z.slice_del())}function v(e,r){if(z.eq_s_b(1,e)){z.bra=z.cursor;var s=z.limit-z.cursor;if(z.eq_s_b(1,r))return z.cursor=z.limit-s,w()&&z.slice_del(),!1}return!0}function p(){var e;if(z.ket=z.cursor,e=z.find_among_b(L,4))switch(z.bra=z.cursor,e){case 1:w()&&(z.slice_del(),z.ket=z.cursor,z.limit-z.cursor,v("u","g")&&v("i","c"));break;case 2:z.slice_from("c")}}function _(){if(!l()&&(z.cursor=z.limit,!f()))return z.cursor=z.limit,void d();z.cursor=z.limit,z.ket=z.cursor,z.eq_s_b(1,"i")&&(z.bra=z.cursor,z.eq_s_b(1,"c")&&(z.cursor=z.limit,w()&&z.slice_del()))}var h,b,g,k=[new r("",-1,3),new r("ã",0,1),new r("õ",0,2)],q=[new r("",-1,3),new r("a~",0,1),new r("o~",0,2)],j=[new r("ic",-1,-1),new r("ad",-1,-1),new r("os",-1,-1),new r("iv",-1,1)],C=[new r("ante",-1,1),new r("avel",-1,1),new r("ível",-1,1)],P=[new r("ic",-1,1),new r("abil",-1,1),new r("iv",-1,1)],F=[new r("ica",-1,1),new r("ância",-1,1),new r("ência",-1,4),new r("ira",-1,9),new r("adora",-1,1),new r("osa",-1,1),new r("ista",-1,1),new r("iva",-1,8),new r("eza",-1,1),new r("logía",-1,2),new r("idade",-1,7),new r("ante",-1,1),new r("mente",-1,6),new r("amente",12,5),new r("ável",-1,1),new r("ível",-1,1),new r("ución",-1,3),new r("ico",-1,1),new r("ismo",-1,1),new r("oso",-1,1),new r("amento",-1,1),new r("imento",-1,1),new r("ivo",-1,8),new r("aça~o",-1,1),new r("ador",-1,1),new r("icas",-1,1),new r("ências",-1,4),new r("iras",-1,9),new r("adoras",-1,1),new r("osas",-1,1),new r("istas",-1,1),new r("ivas",-1,8),new r("ezas",-1,1),new r("logías",-1,2),new r("idades",-1,7),new r("uciones",-1,3),new r("adores",-1,1),new r("antes",-1,1),new r("aço~es",-1,1),new r("icos",-1,1),new r("ismos",-1,1),new r("osos",-1,1),new r("amentos",-1,1),new r("imentos",-1,1),new r("ivos",-1,8)],S=[new r("ada",-1,1),new r("ida",-1,1),new r("ia",-1,1),new r("aria",2,1),new r("eria",2,1),new r("iria",2,1),new r("ara",-1,1),new r("era",-1,1),new r("ira",-1,1),new r("ava",-1,1),new r("asse",-1,1),new r("esse",-1,1),new r("isse",-1,1),new r("aste",-1,1),new r("este",-1,1),new r("iste",-1,1),new r("ei",-1,1),new r("arei",16,1),new r("erei",16,1),new r("irei",16,1),new r("am",-1,1),new r("iam",20,1),new r("ariam",21,1),new r("eriam",21,1),new r("iriam",21,1),new r("aram",20,1),new r("eram",20,1),new r("iram",20,1),new r("avam",20,1),new r("em",-1,1),new r("arem",29,1),new r("erem",29,1),new r("irem",29,1),new r("assem",29,1),new r("essem",29,1),new r("issem",29,1),new r("ado",-1,1),new r("ido",-1,1),new r("ando",-1,1),new r("endo",-1,1),new r("indo",-1,1),new r("ara~o",-1,1),new r("era~o",-1,1),new r("ira~o",-1,1),new r("ar",-1,1),new r("er",-1,1),new r("ir",-1,1),new r("as",-1,1),new r("adas",47,1),new r("idas",47,1),new r("ias",47,1),new r("arias",50,1),new r("erias",50,1),new r("irias",50,1),new r("aras",47,1),new r("eras",47,1),new r("iras",47,1),new r("avas",47,1),new r("es",-1,1),new r("ardes",58,1),new r("erdes",58,1),new r("irdes",58,1),new r("ares",58,1),new r("eres",58,1),new r("ires",58,1),new r("asses",58,1),new r("esses",58,1),new r("isses",58,1),new r("astes",58,1),new r("estes",58,1),new r("istes",58,1),new r("is",-1,1),new r("ais",71,1),new r("eis",71,1),new r("areis",73,1),new r("ereis",73,1),new r("ireis",73,1),new r("áreis",73,1),new r("éreis",73,1),new r("íreis",73,1),new r("ásseis",73,1),new r("ésseis",73,1),new r("ísseis",73,1),new r("áveis",73,1),new r("íeis",73,1),new r("aríeis",84,1),new r("eríeis",84,1),new r("iríeis",84,1),new r("ados",-1,1),new r("idos",-1,1),new r("amos",-1,1),new r("áramos",90,1),new r("éramos",90,1),new r("íramos",90,1),new r("ávamos",90,1),new r("íamos",90,1),new r("aríamos",95,1),new r("eríamos",95,1),new r("iríamos",95,1),new r("emos",-1,1),new r("aremos",99,1),new r("eremos",99,1),new r("iremos",99,1),new r("ássemos",99,1),new r("êssemos",99,1),new r("íssemos",99,1),new r("imos",-1,1),new r("armos",-1,1),new r("ermos",-1,1),new r("irmos",-1,1),new r("ámos",-1,1),new r("arás",-1,1),new r("erás",-1,1),new r("irás",-1,1),new r("eu",-1,1),new r("iu",-1,1),new r("ou",-1,1),new r("ará",-1,1),new r("erá",-1,1),new r("irá",-1,1)],W=[new r("a",-1,1),new r("i",-1,1),new r("o",-1,1),new r("os",-1,1),new r("á",-1,1),new r("í",-1,1),new r("ó",-1,1)],L=[new r("e",-1,1),new r("ç",-1,2),new r("é",-1,1),new r("ê",-1,1)],y=[17,65,16,0,0,0,0,0,0,0,0,0,0,0,0,0,3,19,12,2],z=new s;this.setCurrent=function(e){z.setCurrent(e)},this.getCurrent=function(){return z.getCurrent()},this.stem=function(){var r=z.cursor;return e(),z.cursor=r,a(),z.limit_backward=r,z.cursor=z.limit,_(),z.cursor=z.limit,p(),z.cursor=z.limit_backward,u(),!0}};return function(e){return"function"==typeof e.update?e.update(function(e){return n.setCurrent(e),n.stem(),n.getCurrent()}):(n.setCurrent(e),n.stem(),n.getCurrent())}}(),e.Pipeline.registerFunction(e.pt.stemmer,"stemmer-pt"),e.pt.stopWordFilter=e.generateStopWordFilter("a ao aos aquela aquelas aquele aqueles aquilo as até com como da das de dela delas dele deles depois do dos e ela elas ele eles em entre era eram essa essas esse esses esta estamos estas estava estavam este esteja estejam estejamos estes esteve estive estivemos estiver estivera estiveram estiverem estivermos estivesse estivessem estivéramos estivéssemos estou está estávamos estão eu foi fomos for fora foram forem formos fosse fossem fui fôramos fôssemos haja hajam hajamos havemos hei houve houvemos houver houvera houveram houverei houverem houveremos houveria houveriam houvermos houverá houverão houveríamos houvesse houvessem houvéramos houvéssemos há hão isso isto já lhe lhes mais mas me mesmo meu meus minha minhas muito na nas nem no nos nossa nossas nosso nossos num numa não nós o os ou para pela pelas pelo pelos por qual quando que quem se seja sejam sejamos sem serei seremos seria seriam será serão seríamos seu seus somos sou sua suas são só também te tem temos tenha tenham tenhamos tenho terei teremos teria teriam terá terão teríamos teu teus teve tinha tinham tive tivemos tiver tivera tiveram tiverem tivermos tivesse tivessem tivéramos tivéssemos tu tua tuas tém tínhamos um uma você vocês vos à às éramos".split(" ")),e.Pipeline.registerFunction(e.pt.stopWordFilter,"stopWordFilter-pt")}});
\ No newline at end of file
diff --git a/assets/javascripts/lunr/min/lunr.ro.min.js b/assets/javascripts/lunr/min/lunr.ro.min.js
new file mode 100644
index 000000000..727714018
--- /dev/null
+++ b/assets/javascripts/lunr/min/lunr.ro.min.js
@@ -0,0 +1,18 @@
+/*!
+ * Lunr languages, `Romanian` language
+ * https://github.com/MihaiValentin/lunr-languages
+ *
+ * Copyright 2014, Mihai Valentin
+ * http://www.mozilla.org/MPL/
+ */
+/*!
+ * based on
+ * Snowball JavaScript Library v0.3
+ * http://code.google.com/p/urim/
+ * http://snowball.tartarus.org/
+ *
+ * Copyright 2010, Oleg Mazko
+ * http://www.mozilla.org/MPL/
+ */
+
+!function(e,i){"function"==typeof define&&define.amd?define(i):"object"==typeof exports?module.exports=i():i()(e.lunr)}(this,function(){return function(e){if(void 0===e)throw new Error("Lunr is not present. Please include / require Lunr before this script.");if(void 0===e.stemmerSupport)throw new Error("Lunr stemmer support is not present. Please include / require Lunr stemmer support before this script.");e.ro=function(){this.pipeline.reset(),this.pipeline.add(e.ro.trimmer,e.ro.stopWordFilter,e.ro.stemmer),this.searchPipeline&&(this.searchPipeline.reset(),this.searchPipeline.add(e.ro.stemmer))},e.ro.wordCharacters="A-Za-zªºÀ-ÖØ-öø-ʸˠ-ˤᴀ-ᴥᴬ-ᵜᵢ-ᵥᵫ-ᵷᵹ-ᶾḀ-ỿⁱⁿₐ-ₜKÅℲⅎⅠ-ↈⱠ-ⱿꜢ-ꞇꞋ-ꞭꞰ-ꞷꟷ-ꟿꬰ-ꭚꭜ-ꭤff-stA-Za-z",e.ro.trimmer=e.trimmerSupport.generateTrimmer(e.ro.wordCharacters),e.Pipeline.registerFunction(e.ro.trimmer,"trimmer-ro"),e.ro.stemmer=function(){var i=e.stemmerSupport.Among,r=e.stemmerSupport.SnowballProgram,n=new function(){function e(e,i){L.eq_s(1,e)&&(L.ket=L.cursor,L.in_grouping(W,97,259)&&L.slice_from(i))}function n(){for(var i,r;;){if(i=L.cursor,L.in_grouping(W,97,259)&&(r=L.cursor,L.bra=r,e("u","U"),L.cursor=r,e("i","I")),L.cursor=i,L.cursor>=L.limit)break;L.cursor++}}function t(){if(L.out_grouping(W,97,259)){for(;!L.in_grouping(W,97,259);){if(L.cursor>=L.limit)return!0;L.cursor++}return!1}return!0}function a(){if(L.in_grouping(W,97,259))for(;!L.out_grouping(W,97,259);){if(L.cursor>=L.limit)return!0;L.cursor++}return!1}function o(){var e,i,r=L.cursor;if(L.in_grouping(W,97,259)){if(e=L.cursor,!t())return void(h=L.cursor);if(L.cursor=e,!a())return void(h=L.cursor)}L.cursor=r,L.out_grouping(W,97,259)&&(i=L.cursor,t()&&(L.cursor=i,L.in_grouping(W,97,259)&&L.cursor=e;r--){var n=this.uncheckedNodes[r],i=n.child.toString();i in this.minimizedNodes?n.parent.edges[n.char]=this.minimizedNodes[i]:(n.child._str=i,this.minimizedNodes[i]=n.child),this.uncheckedNodes.pop()}};t.Index=function(e){this.invertedIndex=e.invertedIndex,this.fieldVectors=e.fieldVectors,this.tokenSet=e.tokenSet,this.fields=e.fields,this.pipeline=e.pipeline},t.Index.prototype.search=function(e){return this.query(function(r){var n=new t.QueryParser(e,r);n.parse()})},t.Index.prototype.query=function(e){for(var r=new t.Query(this.fields),n=Object.create(null),i=Object.create(null),s=Object.create(null),o=Object.create(null),a=Object.create(null),u=0;uq&(51smC3s!?#=Jq>KWOQ4|K@`v;qmvg&PtC6vQArR6pD0Vh%DnaR1
zMEdLPt@RXNTkK(MO2o?ZXBhL5vIsr3(2r>Q5pt(9>MXf(4nqZDx$Ovem560(HDg1>
z5C(bCp7}=S@{2&vr21IRZmb$uOt9e$R_8t9WKiAzJwzqu;mc@
zUGVqLw?fGJH(z3pL;-lyS}Zc2uApW)CqSs#M|$!RMIXB*-4~cOU5Ts9A?Q#7BaAh8
z>B}r>eIp$Pu>)YGt}DY;t~Mi#=sqDH;r=v-kbAi59)x>zi~(Ea%Mmv*t3Jniq3P@B
zO(uVfmT^1aW}sIs*xcy`1t=@SN|D*7un2%(vj{_RvoN)(g
z@SE-;Y<8h*Mo}iS~MZ1i{n$^pQ#5)AzE+>5m83_*~IorOwk>c1R`*EaI2+_;
zgW*?yq
@fl?M-g%CRflj2ref{J5xhL}dq*
zN~@U5F+(5+`w6JlXIJmJmoxN4BXaFv(PiOB^)a2+xJx6>?~f>4ah0|D_qO*B$bU!G
z%atS#mXfr8PNp)kGR}4A6-uS?=q(2z4R2~mKjDkuzf+$DYMCx36hUueMHVz}+tv8!
z0jueQ5&ralK>JCGRr^$3{s#~FZz+6?(6yQ3B6QpS5xW`6w>1DN
z*s3?|lT9Jtk|F0tpi0as8)$kKvdjgK-|E(Pug~mdipJ52H#0(kQmTaD!-sxSZ21hu
z+8__<^1OnzdL^nM3Op}(q2%^$dfPUr}ht~d*+GlLK4R>N$
ze^O7)fg%Vp(TU}+YJLMUKY5MT9{~T7l$4Z02PNuA-Xa~HXq0x$U_mjEF*R5S5;>C@
zsw5L!9<9U?Svz`C#7eXGJmD9s-QcHCHzR|zQg`~^WtTry83hIM9GfJQm!W$0&`6jq
z&!QDlqmuZkLRg~A!Q%?E7PfXQqj9f+l{R8Vm!&1@Vl_-t^X+WYHNBtTe