RubyGems - galaaz - Versions diffs - 0.4.6 → 0.5.0 - Mend

galaaz 0.4.6 → 0.5.0

Files changed (181) hide show

checksums.yaml +5 -5
data/README.md +3575 -118
data/Rakefile +21 -4
data/bin/gknit +152 -6
data/bin/gknit-draft +105 -0
data/bin/gknit-draft.rb +28 -0
data/bin/gknit_Rscript +127 -0
data/bin/grun +27 -1
data/bin/gstudio +47 -4
data/bin/{gstudio.rb → gstudio_irb.rb} +0 -0
data/bin/gstudio_pry.rb +7 -0
data/blogs/galaaz_ggplot/galaaz_ggplot.Rmd +3 -12
data/blogs/galaaz_ggplot/galaaz_ggplot.html +77 -222
data/blogs/galaaz_ggplot/galaaz_ggplot.md +4 -31
data/blogs/galaaz_ggplot/galaaz_ggplot.pdf +0 -0
data/blogs/galaaz_ggplot/galaaz_ggplot_files/figure-html/midwest_rb.png +0 -0
data/blogs/galaaz_ggplot/galaaz_ggplot_files/figure-html/scatter_plot_rb.png +0 -0
data/blogs/galaaz_ggplot/midwest.Rmd +1 -9
data/blogs/gknit/gknit.Rmd +232 -123
data/blogs/{dev/dev.html → gknit/gknit.html} +1897 -33
data/blogs/gknit/gknit.pdf +0 -0
data/blogs/gknit/lst.rds +0 -0
data/blogs/gknit/stats.bib +27 -0
data/blogs/manual/lst.rds +0 -0
data/blogs/manual/manual.Rmd +1893 -47
data/blogs/manual/manual.html +3153 -347
data/blogs/manual/manual.md +3575 -118
data/blogs/manual/manual.pdf +0 -0
data/blogs/manual/manual.tex +4026 -0
data/blogs/manual/manual_files/figure-html/bubble-1.png +0 -0
data/blogs/manual/manual_files/figure-html/diverging_bar.png +0 -0
data/blogs/manual/manual_files/figure-latex/bubble-1.png +0 -0
data/blogs/manual/manual_files/figure-latex/diverging_bar.pdf +0 -0
data/blogs/{dev → manual}/model.rb +0 -0
data/blogs/nse_dplyr/nse_dplyr.Rmd +849 -0
data/blogs/nse_dplyr/nse_dplyr.html +878 -0
data/blogs/nse_dplyr/nse_dplyr.md +1198 -0
data/blogs/nse_dplyr/nse_dplyr.pdf +0 -0
data/blogs/oh_my/oh_my.html +274 -386
data/blogs/oh_my/oh_my.md +208 -205
data/blogs/ruby_plot/ruby_plot.Rmd +64 -84
data/blogs/ruby_plot/ruby_plot.html +235 -208
data/blogs/ruby_plot/ruby_plot.md +239 -34
data/blogs/ruby_plot/ruby_plot.pdf +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/dose_len.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/facet_by_delivery.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/facet_by_dose.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/facets_by_delivery_color.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/facets_by_delivery_color2.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/facets_with_decorations.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/facets_with_jitter.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/facets_with_points.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/final_box_plot.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/final_violin_plot.png +0 -0
data/blogs/ruby_plot/ruby_plot_files/figure-html/violin_with_jitter.png +0 -0
data/examples/Bibliography/master.bib +50 -0
data/examples/Bibliography/stats.bib +72 -0
data/examples/islr/ch2.spec.rb +1 -1
data/examples/islr/ch3_boston.rb +4 -4
data/examples/islr/x_y_rnorm.jpg +0 -0
data/examples/latex_templates/Test-acm_article/Makefile +16 -0
data/examples/latex_templates/Test-acm_article/Test-acm_article.Rmd +65 -0
data/examples/latex_templates/Test-acm_article/acm_proc_article-sp.cls +1670 -0
data/examples/latex_templates/Test-acm_article/sensys-abstract.cls +703 -0
data/examples/latex_templates/Test-acm_article/sigproc.bib +59 -0
data/examples/latex_templates/Test-acs_article/Test-acs_article.Rmd +260 -0
data/examples/latex_templates/Test-acs_article/Test-acs_article.pdf +0 -0
data/examples/latex_templates/Test-acs_article/acs-Test-acs_article.bib +11 -0
data/examples/latex_templates/Test-acs_article/acs-my_output.bib +11 -0
data/examples/latex_templates/Test-acs_article/acstest.bib +17 -0
data/examples/latex_templates/Test-aea_article/AEA.cls +1414 -0
data/examples/latex_templates/Test-aea_article/BibFile.bib +0 -0
data/examples/latex_templates/Test-aea_article/Test-aea_article.Rmd +108 -0
data/examples/latex_templates/Test-aea_article/Test-aea_article.pdf +0 -0
data/examples/latex_templates/Test-aea_article/aea.bst +1269 -0
data/examples/latex_templates/Test-aea_article/multicol.sty +853 -0
data/examples/latex_templates/Test-aea_article/references.bib +0 -0
data/examples/latex_templates/Test-aea_article/setspace.sty +546 -0
data/examples/latex_templates/Test-amq_article/Test-amq_article.Rmd +256 -0
data/examples/latex_templates/Test-amq_article/Test-amq_article.pdf +0 -0
data/examples/latex_templates/Test-amq_article/Test-amq_article.pdfsync +3397 -0
data/examples/latex_templates/Test-amq_article/pics/Figure2.pdf +0 -0
data/examples/latex_templates/Test-ams_article/Test-ams_article.Rmd +215 -0
data/examples/latex_templates/Test-ams_article/amstest.bib +436 -0
data/examples/latex_templates/Test-asa_article/Test-asa_article.Rmd +153 -0
data/examples/latex_templates/Test-asa_article/Test-asa_article.pdf +0 -0
data/examples/latex_templates/Test-asa_article/agsm.bst +1353 -0
data/examples/latex_templates/Test-asa_article/bibliography.bib +233 -0
data/examples/latex_templates/Test-ieee_article/IEEEtran.bst +2409 -0
data/examples/latex_templates/Test-ieee_article/IEEEtran.cls +6346 -0
data/examples/latex_templates/Test-ieee_article/Test-ieee_article.Rmd +175 -0
data/examples/latex_templates/Test-ieee_article/Test-ieee_article.pdf +0 -0
data/examples/latex_templates/Test-ieee_article/mybibfile.bib +20 -0
data/examples/latex_templates/Test-rjournal_article/RJournal.sty +335 -0
data/examples/latex_templates/Test-rjournal_article/RJreferences.bib +18 -0
data/examples/latex_templates/Test-rjournal_article/RJwrapper.pdf +0 -0
data/examples/latex_templates/Test-rjournal_article/Test-rjournal_article.Rmd +52 -0
data/examples/latex_templates/Test-springer_article/Test-springer_article.Rmd +65 -0
data/examples/latex_templates/Test-springer_article/Test-springer_article.pdf +0 -0
data/examples/latex_templates/Test-springer_article/bibliography.bib +26 -0
data/examples/latex_templates/Test-springer_article/spbasic.bst +1658 -0
data/examples/latex_templates/Test-springer_article/spmpsci.bst +1512 -0
data/examples/latex_templates/Test-springer_article/spphys.bst +1443 -0
data/examples/latex_templates/Test-springer_article/svglov3.clo +113 -0
data/examples/latex_templates/Test-springer_article/svjour3.cls +1431 -0
data/examples/misc/moneyball.rb +1 -1
data/examples/misc/subsetting.rb +37 -37
data/examples/rmarkdown/svm-rmarkdown-anon-ms-example/svm-rmarkdown-anon-ms-example.Rmd +73 -0
data/examples/rmarkdown/svm-rmarkdown-anon-ms-example/svm-rmarkdown-anon-ms-example.pdf +0 -0
data/examples/rmarkdown/svm-rmarkdown-article-example/svm-rmarkdown-article-example.Rmd +382 -0
data/examples/rmarkdown/svm-rmarkdown-article-example/svm-rmarkdown-article-example.pdf +0 -0
data/examples/rmarkdown/svm-rmarkdown-beamer-example/svm-rmarkdown-beamer-example.Rmd +164 -0
data/examples/rmarkdown/svm-rmarkdown-beamer-example/svm-rmarkdown-beamer-example.pdf +0 -0
data/examples/rmarkdown/svm-rmarkdown-cv/svm-rmarkdown-cv.Rmd +92 -0
data/examples/rmarkdown/svm-rmarkdown-cv/svm-rmarkdown-cv.pdf +0 -0
data/examples/rmarkdown/svm-rmarkdown-syllabus-example/attend-grade-relationships.csv +482 -0
data/examples/rmarkdown/svm-rmarkdown-syllabus-example/svm-rmarkdown-syllabus-example.Rmd +280 -0
data/examples/rmarkdown/svm-rmarkdown-syllabus-example/svm-rmarkdown-syllabus-example.pdf +0 -0
data/examples/rmarkdown/svm-xaringan-example/svm-xaringan-example.Rmd +386 -0
data/lib/R_interface/r.rb +2 -2
data/lib/R_interface/r_libs.R +6 -1
data/lib/R_interface/r_methods.rb +12 -2
data/lib/R_interface/rdata_frame.rb +8 -17
data/lib/R_interface/rindexed_object.rb +1 -2
data/lib/R_interface/rlist.rb +1 -0
data/lib/R_interface/robject.rb +20 -23
data/lib/R_interface/rpkg.rb +15 -6
data/lib/R_interface/rsupport.rb +13 -19
data/lib/R_interface/ruby_extensions.rb +14 -18
data/lib/R_interface/rvector.rb +0 -12
data/lib/gknit.rb +2 -0
data/lib/gknit/draft.rb +105 -0
data/lib/gknit/knitr_engine.rb +6 -37
data/lib/util/exec_ruby.rb +22 -84
data/lib/util/inline_file.rb +7 -3
data/specs/figures/bg.jpeg +0 -0
data/specs/figures/bg.png +0 -0
data/specs/figures/bg.svg +2 -2
data/specs/figures/dose_len.png +0 -0
data/specs/figures/no_args.jpeg +0 -0
data/specs/figures/no_args.png +0 -0
data/specs/figures/no_args.svg +2 -2
data/specs/figures/width_height.jpeg +0 -0
data/specs/figures/width_height.png +0 -0
data/specs/figures/width_height_units1.jpeg +0 -0
data/specs/figures/width_height_units1.png +0 -0
data/specs/figures/width_height_units2.jpeg +0 -0
data/specs/figures/width_height_units2.png +0 -0
data/specs/r_dataframe.spec.rb +184 -11
data/specs/r_list.spec.rb +4 -4
data/specs/r_list_apply.spec.rb +11 -10
data/specs/ruby_expression.spec.rb +3 -11
data/specs/tmp.rb +106 -34
data/version.rb +1 -1
metadata +96 -33
data/bin/gknit_old_r +0 -236
data/blogs/dev/dev.Rmd +0 -77
data/blogs/dev/dev.md +0 -87
data/blogs/dev/dev_files/figure-html/bubble-1.png +0 -0
data/blogs/dev/dev_files/figure-html/diverging_bar. +0 -0
data/blogs/dev/dev_files/figure-html/diverging_bar.png +0 -0
data/blogs/dplyr/dplyr.rb +0 -63
data/blogs/galaaz_ggplot/galaaz_ggplot.aux +0 -43
data/blogs/galaaz_ggplot/galaaz_ggplot.log +0 -640
data/blogs/galaaz_ggplot/galaaz_ggplot.out +0 -10
data/blogs/galaaz_ggplot/galaaz_ggplot.tex +0 -481
data/blogs/galaaz_ggplot/midwest.png +0 -0
data/blogs/galaaz_ggplot/scatter_plot.png +0 -0
data/blogs/ruby_plot/ruby_plot.Rmd_external_figs +0 -662
data/blogs/ruby_plot/ruby_plot.tex +0 -1077
data/blogs/ruby_plot/ruby_plot_files/figure-html/dose_len.svg +0 -57
data/blogs/ruby_plot/ruby_plot_files/figure-html/facet_by_delivery.svg +0 -106
data/blogs/ruby_plot/ruby_plot_files/figure-html/facet_by_dose.svg +0 -110
data/blogs/ruby_plot/ruby_plot_files/figure-html/facets_by_delivery_color.svg +0 -174
data/blogs/ruby_plot/ruby_plot_files/figure-html/facets_by_delivery_color2.svg +0 -236
data/blogs/ruby_plot/ruby_plot_files/figure-html/facets_with_jitter.svg +0 -296
data/blogs/ruby_plot/ruby_plot_files/figure-html/facets_with_points.svg +0 -236
data/blogs/ruby_plot/ruby_plot_files/figure-html/final_box_plot.svg +0 -218
data/blogs/ruby_plot/ruby_plot_files/figure-html/final_violin_plot.svg +0 -128
data/blogs/ruby_plot/ruby_plot_files/figure-html/violin_with_jitter.svg +0 -150
data/examples/paper/paper.rb +0 -36

Binary file

@@ -0,0 +1,4026 @@
+\documentclass[11pt,]{article}
+\usepackage{lmodern}
+\usepackage{amssymb,amsmath}
+\usepackage{ifxetex,ifluatex}
+\usepackage{fixltx2e} % provides \textsubscript
+\ifnum 0\ifxetex 1\fi\ifluatex 1\fi=0 % if pdftex
+  \usepackage[T1]{fontenc}
+  \usepackage[utf8]{inputenc}
+\else % if luatex or xelatex
+  \ifxetex
+    \usepackage{mathspec}
+  \else
+    \usepackage{fontspec}
+  \fi
+  \defaultfontfeatures{Ligatures=TeX,Scale=MatchLowercase}
+\fi
+% use upquote if available, for straight quotes in verbatim environments
+\IfFileExists{upquote.sty}{\usepackage{upquote}}{}
+% use microtype if available
+\IfFileExists{microtype.sty}{%
+\usepackage{microtype}
+\UseMicrotypeSet[protrusion]{basicmath} % disable protrusion for tt fonts
+}{}
+\usepackage[margin=1in]{geometry}
+\usepackage{hyperref}
+\hypersetup{unicode=true,
+            pdftitle={Galaaz Manual},
+            pdfauthor={Rodrigo Botafogo},
+            pdfborder={0 0 0},
+            breaklinks=true}
+\urlstyle{same}  % don't use monospace font for urls
+\usepackage{color}
+\usepackage{fancyvrb}
+\newcommand{\VerbBar}{|}
+\newcommand{\VERB}{\Verb[commandchars=\\\{\}]}
+\DefineVerbatimEnvironment{Highlighting}{Verbatim}{commandchars=\\\{\}}
+% Add ',fontsize=\small' for more characters per line
+\usepackage{framed}
+\definecolor{shadecolor}{RGB}{248,248,248}
+\newenvironment{Shaded}{\begin{snugshade}}{\end{snugshade}}
+\newcommand{\KeywordTok}[1]{\textcolor[rgb]{0.13,0.29,0.53}{\textbf{#1}}}
+\newcommand{\DataTypeTok}[1]{\textcolor[rgb]{0.13,0.29,0.53}{#1}}
+\newcommand{\DecValTok}[1]{\textcolor[rgb]{0.00,0.00,0.81}{#1}}
+\newcommand{\BaseNTok}[1]{\textcolor[rgb]{0.00,0.00,0.81}{#1}}
+\newcommand{\FloatTok}[1]{\textcolor[rgb]{0.00,0.00,0.81}{#1}}
+\newcommand{\ConstantTok}[1]{\textcolor[rgb]{0.00,0.00,0.00}{#1}}
+\newcommand{\CharTok}[1]{\textcolor[rgb]{0.31,0.60,0.02}{#1}}
+\newcommand{\SpecialCharTok}[1]{\textcolor[rgb]{0.00,0.00,0.00}{#1}}
+\newcommand{\StringTok}[1]{\textcolor[rgb]{0.31,0.60,0.02}{#1}}
+\newcommand{\VerbatimStringTok}[1]{\textcolor[rgb]{0.31,0.60,0.02}{#1}}
+\newcommand{\SpecialStringTok}[1]{\textcolor[rgb]{0.31,0.60,0.02}{#1}}
+\newcommand{\ImportTok}[1]{#1}
+\newcommand{\CommentTok}[1]{\textcolor[rgb]{0.56,0.35,0.01}{\textit{#1}}}
+\newcommand{\DocumentationTok}[1]{\textcolor[rgb]{0.56,0.35,0.01}{\textbf{\textit{#1}}}}
+\newcommand{\AnnotationTok}[1]{\textcolor[rgb]{0.56,0.35,0.01}{\textbf{\textit{#1}}}}
+\newcommand{\CommentVarTok}[1]{\textcolor[rgb]{0.56,0.35,0.01}{\textbf{\textit{#1}}}}
+\newcommand{\OtherTok}[1]{\textcolor[rgb]{0.56,0.35,0.01}{#1}}
+\newcommand{\FunctionTok}[1]{\textcolor[rgb]{0.00,0.00,0.00}{#1}}
+\newcommand{\VariableTok}[1]{\textcolor[rgb]{0.00,0.00,0.00}{#1}}
+\newcommand{\ControlFlowTok}[1]{\textcolor[rgb]{0.13,0.29,0.53}{\textbf{#1}}}
+\newcommand{\OperatorTok}[1]{\textcolor[rgb]{0.81,0.36,0.00}{\textbf{#1}}}
+\newcommand{\BuiltInTok}[1]{#1}
+\newcommand{\ExtensionTok}[1]{#1}
+\newcommand{\PreprocessorTok}[1]{\textcolor[rgb]{0.56,0.35,0.01}{\textit{#1}}}
+\newcommand{\AttributeTok}[1]{\textcolor[rgb]{0.77,0.63,0.00}{#1}}
+\newcommand{\RegionMarkerTok}[1]{#1}
+\newcommand{\InformationTok}[1]{\textcolor[rgb]{0.56,0.35,0.01}{\textbf{\textit{#1}}}}
+\newcommand{\WarningTok}[1]{\textcolor[rgb]{0.56,0.35,0.01}{\textbf{\textit{#1}}}}
+\newcommand{\AlertTok}[1]{\textcolor[rgb]{0.94,0.16,0.16}{#1}}
+\newcommand{\ErrorTok}[1]{\textcolor[rgb]{0.64,0.00,0.00}{\textbf{#1}}}
+\newcommand{\NormalTok}[1]{#1}
+\usepackage{longtable,booktabs}
+\usepackage{graphicx,grffile}
+\makeatletter
+\def\maxwidth{\ifdim\Gin@nat@width>\linewidth\linewidth\else\Gin@nat@width\fi}
+\def\maxheight{\ifdim\Gin@nat@height>\textheight\textheight\else\Gin@nat@height\fi}
+\makeatother
+% Scale images if necessary, so that they will not overflow the page
+% margins by default, and it is still possible to overwrite the defaults
+% using explicit options in \includegraphics[width, height, ...]{}
+\setkeys{Gin}{width=\maxwidth,height=\maxheight,keepaspectratio}
+\IfFileExists{parskip.sty}{%
+\usepackage{parskip}
+}{% else
+\setlength{\parindent}{0pt}
+\setlength{\parskip}{6pt plus 2pt minus 1pt}
+}
+\setlength{\emergencystretch}{3em}  % prevent overfull lines
+\providecommand{\tightlist}{%
+  \setlength{\itemsep}{0pt}\setlength{\parskip}{0pt}}
+\setcounter{secnumdepth}{5}
+% Redefines (sub)paragraphs to behave more like sections
+\ifx\paragraph\undefined\else
+\let\oldparagraph\paragraph
+\renewcommand{\paragraph}[1]{\oldparagraph{#1}\mbox{}}
+\fi
+\ifx\subparagraph\undefined\else
+\let\oldsubparagraph\subparagraph
+\renewcommand{\subparagraph}[1]{\oldsubparagraph{#1}\mbox{}}
+\fi
+%%% Use protect on footnotes to avoid problems with footnotes in titles
+\let\rmarkdownfootnote\footnote%
+\def\footnote{\protect\rmarkdownfootnote}
+%%% Change title format to be more compact
+\usepackage{titling}
+% Create subtitle command for use in maketitle
+\newcommand{\subtitle}[1]{
+  \posttitle{
+    \begin{center}\large#1\end{center}
+    }
+}
+\setlength{\droptitle}{-2em}
+  \title{Galaaz Manual}
+    \pretitle{\vspace{\droptitle}\centering\huge}
+  \posttitle{\par}
+  \subtitle{How to tightly couple Ruby and R in GraalVM}
+  \author{Rodrigo Botafogo}
+    \preauthor{\centering\large\emph}
+  \postauthor{\par}
+      \predate{\centering\large\emph}
+  \postdate{\par}
+    \date{2019}
+% usar portugues do Brasil
+% \usepackage[brazilian]{babel}
+\usepackage[utf8]{inputenc}
+\usepackage{geometry}
+\geometry{a4paper, top=1in}
+% needed for kableExtra
+\usepackage{longtable}
+\usepackage{multirow}
+\usepackage[table]{xcolor}
+\usepackage{wrapfig}
+\usepackage{float}
+\usepackage{colortbl}
+\usepackage{pdflscape}
+\usepackage{tabu}
+\usepackage{threeparttable}
+\usepackage[normalem]{ulem}
+\usepackage{bbm}
+\usepackage{booktabs}
+\usepackage{expex}
+\usepackage{graphicx}
+\usepackage{fancyhdr}
+% set the header and foot style
+% style 'fancy' adds the section name on the header
+% and the page number on the footer
+\pagestyle{fancy}
+% style 'fancyhf' leaves header and footer empty
+%\fancyhf{}
+% sets the left head element to \rightmark, which contains the
+% current section (\leftmark is the current chapter)
+%\fancyhead[L]{\rightmark} .
+% sets the right head element to the page number.
+% \fancyhead[R]{\thepage}
+% lets the head rule disappear.
+% \renewcommand{\headrulewidth}{0pt}
+% Possible selectors for the optional argument of \fancyhead/\fancyfoot
+% are L (left), C (center) or R (right) for the position of the element
+% and E (even) or O (odd) to distinguish even and odd pages. If you omit
+% E/O the element is set for all pages.
+% \usepackage{lipsum}
+% make available command lastpage
+\usepackage{lastpage}
+% default fontsize 11pt better to add
+% fontsize on the yaml header
+% \usepackage[fontsize=11pt]{scrextend}
+% comandos para formatar uma tabela
+\usepackage{array}
+\newcolumntype{L}[1]{>{\raggedright\let\newline\\\arraybackslash\hspace{0pt}}m{#1}}
+\newcolumntype{C}[1]{>{\centering\let\newline\\\arraybackslash\hspace{0pt}}m{#1}}
+\newcolumntype{R}[1]{>{\raggedleft\let\newline\\\arraybackslash\hspace{0pt}}m{#1}}
+% needed if we want to import other LaTeX documents
+\usepackage{import}
+% Command to import an R variable to latex
+\newcommand{\RtoLatex}[2]{\newcommand{#1}{#2}}
+%
+%\newcommand{\atraso}[1]{\color{red} \textbf {Tempo desde a Assinatura do Contrato: #1 dias}}
+\usepackage{booktabs}
+\usepackage{longtable}
+\usepackage{array}
+\usepackage{multirow}
+\usepackage{wrapfig}
+\usepackage{float}
+\usepackage{colortbl}
+\usepackage{pdflscape}
+\usepackage{tabu}
+\usepackage{threeparttable}
+\usepackage{threeparttablex}
+\usepackage[normalem]{ulem}
+\usepackage{makecell}
+\usepackage{xcolor}
+\begin{document}
+\maketitle
+{
+\setcounter{tocdepth}{3}
+\tableofcontents
+}
+\section{Introduction}\label{introduction}
+Galaaz is a system for tightly coupling Ruby and R. Ruby is a powerful
+language, with a large community, a very large set of libraries and
+great for web development. However, it lacks libraries for data science,
+statistics, scientific plotting and machine learning. On the other hand,
+R is considered one of the most powerful languages for solving all of
+the above problems. Maybe the strongest competitor to R is Python with
+libraries such as NumPy, Pandas, SciPy, SciKit-Learn and a couple more.
+With Galaaz we do not intend to re-implement any of the scientific
+libraries in R; instead, we allow for very tight coupling between the two
+languages to the point that the Ruby developer does not need to know
+that there is an R engine running.
+According to Wikipedia ``Ruby is a dynamic, interpreted, reflective,
+object-oriented, general-purpose programming language. It was designed
+and developed in the mid-1990s by Yukihiro `Matz' Matsumoto in Japan.''
+It reached high popularity with the development of Ruby on Rails (RoR)
+by David Heinemeier Hansson. RoR is a web application framework first
+released around 2005. It makes extensive use of Ruby's metaprogramming
+features. With RoR, Ruby became very popular. According to
+\href{https://www.tiobe.com/tiobe-index/ruby/}{Ruby's Tiobe index} it
+peaked in popularity around 2008, then declined until 2015 when it
+started picking up again. At the time of this writing (November 2018),
+the Tiobe index puts Ruby in 16th position as most popular language.
+Python, a language similar to Ruby, ranks 4th in the index. Java, C and
+C++ take the first three positions. Ruby is often criticized for its
+focus on web applications. But Ruby can do
+\href{https://github.com/markets/awesome-ruby}{much more} than just web
+applications. Yet, for scientific computing, Ruby lags way behind Python
+and R. Python has Django framework for web, NumPy for numerical arrays,
+Pandas for data analysis. R is a free software environment for
+statistical computing and graphics with thousands of libraries for data
+analysis.
+Until recently, there was no real perspective for Ruby to bridge this
+gap. Implementing a complete scientific computing infrastructure would
+take too long. Enter \href{https://www.graalvm.org/}{Oracle's GraalVM}:
+\begin{quote}
+GraalVM is a universal virtual machine for running applications written
+in JavaScript, Python 3, Ruby, R, JVM-based languages like Java, Scala,
+Kotlin, and LLVM-based languages such as C and C++.
+GraalVM removes the isolation between programming languages and enables
+interoperability in a shared runtime. It can run either standalone or in
+the context of OpenJDK, Node.js, Oracle Database, or MySQL.
+GraalVM allows you to write polyglot applications with a seamless way to
+pass values from one language to another. With GraalVM there is no
+copying or marshaling necessary as it is with other polyglot systems.
+This lets you achieve high performance when language boundaries are
+crossed. Most of the time there is no additional cost for crossing a
+language boundary at all.
+Often developers have to make uncomfortable compromises that require
+them to rewrite their software in other languages. For example:
+\begin{itemize}
+\tightlist
+\item
+  That library is not available in my language. I need to rewrite it.
+\item
+  That language would be the perfect fit for my problem, but we cannot
+  run it in our environment.
+\item
+  That problem is already solved in my language, but the language is too
+  slow.
+\end{itemize}
+With GraalVM we aim to allow developers to freely choose the right
+language for the task at hand without making compromises.
+\end{quote}
+As stated above, GraalVM is a \emph{universal} virtual machine that
+allows Ruby and R (and other languages) to run on the same environment.
+GraalVM allows polyglot applications to \emph{seamlessly} interact with
+one another and pass values from one language to the other. Although a
+great idea, GraalVM still requires application writers to know several
+languages. To eliminate that requirement, we built Galaaz, a gem for
+Ruby, to tightly couple Ruby and R and allow those languages to interact
+in a way that the user will be unaware of such interaction. In other
+words, a Ruby programmer will be able to use all the capabilities of R
+without knowing the R syntax.
+Library wrapping is a usual way of bringing features from one language
+into another. To improve performance, Python often wraps more efficient
+C libraries. For the Python developer, the existence of such C libraries
+is hidden. The problem with library wrapping is that for any new
+library, there is the need to handcraft a new wrapper.
+Galaaz, instead of wrapping a single C or R library, wraps the whole R
+language in Ruby. Doing so, all thousands of R libraries are available
+immediately to Ruby developers without any new wrapping effort.
+\subsection{What does Galaaz mean}\label{what-does-galaaz-mean}
+Galaaz is the Portuguese name for ``Galahad''. From Wikipedia:
+\begin{verbatim}
+Sir Galahad (sometimes referred to as Galeas or Galath),
+in Arthurian legend, is a knight of King Arthur's Round Table and one
+of the three achievers of the Holy Grail. He is the illegitimate son
+of Sir Lancelot and Elaine of Corbenic, and is renowned for his
+gallantry and purity as the most perfect of all knights. Emerging quite
+late in the medieval Arthurian tradition, Sir Galahad first appears in the
+Lancelot–Grail cycle, and his story is taken up in later works such as
+the Post-Vulgate Cycle and Sir Thomas Malory's Le Morte d'Arthur.
+His name should not be mistaken with Galehaut, a different knight from
+Arthurian legend.
+\end{verbatim}
+\section{System Compatibility}\label{system-compatibility}
+\begin{itemize}
+\tightlist
+\item
+  Oracle Linux 7
+\item
+  Ubuntu 18.04 LTS
+\item
+  Ubuntu 16.04 LTS
+\item
+  Fedora 28
+\item
+  macOS 10.14 (Mojave)
+\item
+  macOS 10.13 (High Sierra)
+\end{itemize}
+\section{Dependencies}\label{dependencies}
+\begin{itemize}
+\tightlist
+\item
+  TruffleRuby
+\item
+  FastR
+\end{itemize}
+\section{Installation}\label{installation}
+\begin{itemize}
+\tightlist
+\item
+  Install GraalVM (\url{http://www.graalvm.org/})
+\item
+  Install Ruby (gu install Ruby)
+\item
+  Install FastR (gu install R)
+\item
+  Install rake if you want to run the specs and examples (gem install
+  rake)
+\end{itemize}
+\section{Usage}\label{usage}
+\begin{itemize}
+\tightlist
+\item
+  Interactive shell: use `gstudio' on the command line
+\end{itemize}
+\begin{quote}
+gstudio
+\end{quote}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{  vec = R.c(}\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{, }\DecValTok{4}\NormalTok{)}
+\NormalTok{  puts vec}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1 2 3 4
+\end{verbatim}
+\begin{itemize}
+\tightlist
+\item
+  Run all specs
+\end{itemize}
+\begin{quote}
+galaaz specs:all
+\end{quote}
+\begin{itemize}
+\tightlist
+\item
+  Run graphics slideshow (80+ graphics)
+\end{itemize}
+\begin{quote}
+galaaz sthda:all
+\end{quote}
+\begin{itemize}
+\tightlist
+\item
+  Run labs from Introduction to Statistical Learning with R
+\end{itemize}
+\begin{quote}
+galaaz islr:all
+\end{quote}
+\begin{itemize}
+\tightlist
+\item
+  See all available examples
+\end{itemize}
+\begin{quote}
+galaaz -T
+\end{quote}
+Shows a list with all available executable tasks. To execute a task,
+substitute the `rake' word in the list with `galaaz'. For instance, the
+following line shows up after `galaaz -T'
+rake master\_list:scatter\_plot \# scatter\_plot from:\ldots{}.
+execute
+\begin{quote}
+galaaz master\_list:scatter\_plot
+\end{quote}
+\section{Accessing R from Ruby}\label{accessing-r-from-ruby}
+One of the nice aspects of Galaaz on GraalVM, is that variables and
+functions defined in R, can be easily accessed from Ruby. For instance,
+to access the `mtcars' data frame from R in Ruby, we use the `:mtcars'
+symbol preceded by the `\textasciitilde{}' operator, thus
+`\textasciitilde{}:mtcars' retrieves the value of the `mtcars' variable.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts ~}\StringTok{:mtcars}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##                      mpg cyl  disp  hp drat    wt  qsec vs am gear carb
+## Mazda RX4           21.0   6 160.0 110 3.90 2.620 16.46  0  1    4    4
+## Mazda RX4 Wag       21.0   6 160.0 110 3.90 2.875 17.02  0  1    4    4
+## Datsun 710          22.8   4 108.0  93 3.85 2.320 18.61  1  1    4    1
+## Hornet 4 Drive      21.4   6 258.0 110 3.08 3.215 19.44  1  0    3    1
+## Hornet Sportabout   18.7   8 360.0 175 3.15 3.440 17.02  0  0    3    2
+## Valiant             18.1   6 225.0 105 2.76 3.460 20.22  1  0    3    1
+## Duster 360          14.3   8 360.0 245 3.21 3.570 15.84  0  0    3    4
+## Merc 240D           24.4   4 146.7  62 3.69 3.190 20.00  1  0    4    2
+## Merc 230            22.8   4 140.8  95 3.92 3.150 22.90  1  0    4    2
+## Merc 280            19.2   6 167.6 123 3.92 3.440 18.30  1  0    4    4
+## Merc 280C           17.8   6 167.6 123 3.92 3.440 18.90  1  0    4    4
+## Merc 450SE          16.4   8 275.8 180 3.07 4.070 17.40  0  0    3    3
+## Merc 450SL          17.3   8 275.8 180 3.07 3.730 17.60  0  0    3    3
+## Merc 450SLC         15.2   8 275.8 180 3.07 3.780 18.00  0  0    3    3
+## Cadillac Fleetwood  10.4   8 472.0 205 2.93 5.250 17.98  0  0    3    4
+## Lincoln Continental 10.4   8 460.0 215 3.00 5.424 17.82  0  0    3    4
+## Chrysler Imperial   14.7   8 440.0 230 3.23 5.345 17.42  0  0    3    4
+## Fiat 128            32.4   4  78.7  66 4.08 2.200 19.47  1  1    4    1
+## Honda Civic         30.4   4  75.7  52 4.93 1.615 18.52  1  1    4    2
+## Toyota Corolla      33.9   4  71.1  65 4.22 1.835 19.90  1  1    4    1
+## Toyota Corona       21.5   4 120.1  97 3.70 2.465 20.01  1  0    3    1
+## Dodge Challenger    15.5   8 318.0 150 2.76 3.520 16.87  0  0    3    2
+## AMC Javelin         15.2   8 304.0 150 3.15 3.435 17.30  0  0    3    2
+## Camaro Z28          13.3   8 350.0 245 3.73 3.840 15.41  0  0    3    4
+## Pontiac Firebird    19.2   8 400.0 175 3.08 3.845 17.05  0  0    3    2
+## Fiat X1-9           27.3   4  79.0  66 4.08 1.935 18.90  1  1    4    1
+## Porsche 914-2       26.0   4 120.3  91 4.43 2.140 16.70  0  1    5    2
+## Lotus Europa        30.4   4  95.1 113 3.77 1.513 16.90  1  1    5    2
+## Ford Pantera L      15.8   8 351.0 264 4.22 3.170 14.50  0  1    5    4
+## Ferrari Dino        19.7   6 145.0 175 3.62 2.770 15.50  0  1    5    6
+## Maserati Bora       15.0   8 301.0 335 3.54 3.570 14.60  0  1    5    8
+## Volvo 142E          21.4   4 121.0 109 4.11 2.780 18.60  1  1    4    2
+\end{verbatim}
+To access an R function from Ruby, the R function needs to be preceded
+by `R.' scoping. Below we see an example of creating an R::Vector by
+calling the `c' R function
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec = R.c(}\FloatTok{1.0}\NormalTok{, }\FloatTok{2.0}\NormalTok{, }\FloatTok{3.0}\NormalTok{, }\FloatTok{4.0}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1 2 3 4
+\end{verbatim}
+Note that `vec' is an object of type R::Vector:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec.class}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## R::Vector
+\end{verbatim}
+Every object created by a call to an R function will be of a type that
+inherits from R::Object. In R, there is also a function `class'. In
+order to access that function we can call method `rclass' in the
+R::Object:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec.rclass}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] "numeric"
+\end{verbatim}
+When working with R::Object(s), it is possible to use the `.' operator
+to pipe operations. When using `.', the object to which the `.' is
+applied becomes the first argument of the corresponding R function. For
+instance, function `c' in R, can be used to concatenate two or more
+vectors (in R, there are no scalar values; scalars are converted to
+vectors of size 1. Within Galaaz, a scalar parameter is converted to a
+size one vector):
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts R.c(vec, }\DecValTok{10}\NormalTok{, }\DecValTok{20}\NormalTok{, }\DecValTok{30}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1]  1  2  3  4 10 20 30
+\end{verbatim}
+The call above to the `c' function can also be done using `.' notation:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec.c(}\DecValTok{10}\NormalTok{, }\DecValTok{20}\NormalTok{, }\DecValTok{30}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1]  1  2  3  4 10 20 30
+\end{verbatim}
+We will talk about vector indexing in a later section. But notice here
+that indexing an R::Vector will return another R::Vector:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec[}\DecValTok{1}\NormalTok{]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1
+\end{verbatim}
+Sometimes we want to index an R::Object and get back a Ruby object that
+is not wrapped in an R::Object, but the native Ruby object. For this, we
+can index the R object with the `\textgreater{}\textgreater{}' operator:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec >> }\DecValTok{0}
+\NormalTok{puts vec >> }\DecValTok{2}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## 1.0
+## 3.0
+\end{verbatim}
+It is also possible to call an R function with named arguments, by
+creating the function in Galaaz with named parameters. For instance,
+here is an example of creating a `list' with named elements:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts R.list(}\StringTok{first_name: "Rodrigo"}\NormalTok{, }\StringTok{last_name: "Botafogo"}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## $first_name
+## [1] "Rodrigo"
+##
+## $last_name
+## [1] "Botafogo"
+\end{verbatim}
+Many R functions receive another function as argument. For instance,
+method `map' applies a function to every element of a vector. With
+Galaaz, it is possible to pass a Proc, Method or Lambda in place of the
+expected R function. In this next example, we will add 2 to every
+element of our previously created vector:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec.map \{ |x| x + }\DecValTok{2}\NormalTok{ \}}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 3
+## [1] 4
+## [1] 5
+## [1] 6
+\end{verbatim}
+\section{gKnitting a Document}\label{gknitting-a-document}
+This manual has been formatted using gKnit. gKnit uses Knitr and R
+markdown to knit a document in Ruby or R and output it in any of the
+available formats for R markdown. gKnit runs atop GraalVM and
+Galaaz. In gKnit, Ruby variables are persisted between chunks, making it
+an ideal solution for literate programming. Also, since it is based on
+Galaaz, Ruby chunks can have access to R variables and Polyglot
+Programming with Ruby and R is quite natural.
+The idea of ``literate programming'' was first introduced by Donald
+Knuth in the 1980's (Knuth 1984). The main intention of this approach
+was to develop software interspersing macro snippets, traditional source
+code, and a natural language such as English in a document that could be
+compiled into executable code and at the same time easily read by a
+human developer. According to Knuth ``The practitioner of literate
+programming can be regarded as an essayist, whose main concern is with
+exposition and excellence of style.''
+The idea of literate programming evolved into the idea of reproducible
+research, in which all the data, software code, documentation, graphics
+etc. needed to reproduce the research and its reports could be included
+in a single document or set of documents that when distributed to peers
+could be rerun generating the same output and reports.
+The R community has put a great deal of effort in reproducible research.
+In 2002, Sweave was introduced and it allowed mixing R code with Latex
+generating high quality PDF documents. A Sweave document could include
+code, the results of executing the code, graphics and text such that it
+contained the whole narrative to reproduce the research. In 2012, Knitr,
+developed by Yihui Xie from RStudio was released to replace Sweave and
+to consolidate in one single package the many extensions and add-on
+packages that were necessary for Sweave.
+With Knitr, \textbf{R markdown} was also developed, an extension to the
+Markdown format. With \textbf{R markdown} and Knitr it is possible to
+generate reports in a multitude of formats such as HTML, markdown,
+Latex, PDF, dvi, etc. \textbf{R markdown} also allows the use of
+multiple programming languages such as R, Ruby, Python, etc. in the same
+document.
+In \textbf{R markdown}, text is interspersed with code chunks that can
+be executed and both the code and its results can become part of the
+final report. Although \textbf{R markdown} allows multiple programming
+languages in the same document, only R and Python (with the reticulate
+package) can persist variables between chunks. For other languages, such
+as Ruby, every chunk will start a new process and thus all data is lost
+between chunks, unless it is somehow stored in a data file that is read
+by the next chunk.
+Being able to persist data between chunks is critical for literate
+programming otherwise the flow of the narrative is lost by all the
+effort of having to save data and then reload it. Although this might,
+at first, seem like a small nuisance, not being able to persist data
+between chunks is a major issue. For example, let's take a look at the
+following simple example in which we want to show how to create a list
+and then use it. Let's first assume that data cannot be persisted between
+chunks. In the next chunk we create a list, then we would need to save
+it to file, but to save it, we need somehow to marshal the data into a
+binary format:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{lst = R.list(}\StringTok{a: }\DecValTok{1}\NormalTok{, }\StringTok{b: }\DecValTok{2}\NormalTok{, }\StringTok{c: }\DecValTok{3}\NormalTok{)}
+\NormalTok{lst.saveRDS(}\StringTok{"lst.rds"}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+then, on the next chunk, where variable `lst' is used, we need to read
+back its value:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{lst = R.readRDS(}\StringTok{"lst.rds"}\NormalTok{)}
+\NormalTok{puts lst}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## $a
+## [1] 1
+##
+## $b
+## [1] 2
+##
+## $c
+## [1] 3
+\end{verbatim}
+Now, any real program has dozens of variables that we might want to use
+and reuse between chunks. Clearly, such an approach becomes quickly
+unmanageable. Probably, because of this problem, it is very rare to see
+any \textbf{R markdown} document in the Ruby community.
+When variables can be used across chunks, then no overhead is needed:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{lst = R.list(}\StringTok{a: }\DecValTok{1}\NormalTok{, }\StringTok{b: }\DecValTok{2}\NormalTok{, }\StringTok{c: }\DecValTok{3}\NormalTok{)}
+\CommentTok{# any other code can be added here}
+\end{Highlighting}
+\end{Shaded}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts lst}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## $a
+## [1] 1
+##
+## $b
+## [1] 2
+##
+## $c
+## [1] 3
+\end{verbatim}
+In the Python community, the same effort to have code and text in an
+integrated environment started around the first decade of 2000. In 2006
+iPython 0.7.2 was released. In 2014, Fernando Pérez spun off project
+Jupyter from iPython creating a web-based interactive computation
+environment. Jupyter can now be used with many languages, including Ruby
+with the iruby gem (\url{https://github.com/SciRuby/iruby}). In order to
+have multiple languages in a Jupyter notebook the SoS kernel was
+developed (\url{https://vatlab.github.io/sos-docs/}).
+\subsection{\texorpdfstring{gKnit and \textbf{R
+markdown}}{gKnit and R markdown}}\label{gknit-and-r-markdown}
+gKnit is based on knitr and \textbf{R markdown} and can knit a document
+written both in Ruby and/or R and output it in any of the available
+formats of \textbf{R markdown}. gKnit allows ruby developers to do
+literate programming and reproducible research by allowing them to have
+in a single document, text and code.
+In gKnit, Ruby variables are persisted between chunks, making it an
+ideal solution for literate programming in this language. Also, since it
+is based on Galaaz, Ruby chunks can have access to R variables and
+Polyglot Programming with Ruby and R is quite natural.
+This is not a blog post on \textbf{R markdown}, and the interested user
+is directed to the following links for detailed information on its
+capabilities and use.
+\begin{itemize}
+\tightlist
+\item
+  \url{https://rmarkdown.rstudio.com/} or
+\item
+  \url{https://bookdown.org/yihui/rmarkdown/}
+\end{itemize}
+In this post, we will describe just the main aspects of \textbf{R
+markdown}, so the user can start gKnitting Ruby and R documents quickly.
+\subsection{The Yaml header}\label{the-yaml-header}
+An \textbf{R markdown} document should start with a Yaml header and be
+stored in a file with `.Rmd' extension. This document has the following
+header for gKnitting an HTML document.
+\begin{verbatim}
+---
+title: "How to do reproducible research in Ruby with gKnit"
+author:
+    - "Rodrigo Botafogo"
+    - "Daniel Mossé - University of Pittsburgh"
+tags: [Tech, Data Science, Ruby, R, GraalVM]
+date: "20/02/2019"
+output:
+  html_document:
+    self_contained: true
+    keep_md: true
+  pdf_document:
+    includes:
+      in_header: ["../../sty/galaaz.sty"]
+    number_sections: yes
+---
+\end{verbatim}
+For more information on the options in the Yaml header,
+\href{https://bookdown.org/yihui/rmarkdown/html-document.html}{check
+here}.
+\subsection{\texorpdfstring{\textbf{R Markdown}
+formatting}{R Markdown formatting}}\label{r-markdown-formatting}
+Document formatting can be done with simple markups such as:
+\subsection{Headers}\label{headers}
+\begin{verbatim}
+# Header 1
+## Header 2
+### Header 3
+\end{verbatim}
+\subsection{Lists}\label{lists}
+\begin{verbatim}
+Unordered lists:
+* Item 1
+* Item 2
+    + Item 2a
+    + Item 2b
+\end{verbatim}
+\begin{verbatim}
+Ordered Lists
+1. Item 1
+2. Item 2
+3. Item 3
+    + Item 3a
+    + Item 3b
+\end{verbatim}
+For more R markdown formatting go to
+\url{https://rmarkdown.rstudio.com/authoring_basics.html}.
+\subsection{R chunks}\label{r-chunks}
+Running and executing Ruby and R code is actually what really interests
+us in this blog.\\
+Inserting a code chunk is done by adding code in a block delimited by
+three back ticks followed by an open curly brace (`\{') followed with
+the engine name (r, ruby, rb, include, \ldots{}), and any optional
+chunk\_label and options, as shown below:
+\begin{verbatim}
+```{engine_name [chunk_label], [chunk_options]}
+```
+\end{verbatim}
+for instance, let's add an R chunk to the document labeled
+`first\_r\_chunk'. This is a very simple code just to create a variable
+and print it out, as follows:
+\begin{verbatim}
+```{r first_r_chunk}
+vec <- c(1, 2, 3)
+print(vec)
+```
+\end{verbatim}
+If this block is added to an \textbf{R markdown} document and gKnitted
+the result will be:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{vec <-}\StringTok{ }\KeywordTok{c}\NormalTok{(}\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{)}
+\KeywordTok{print}\NormalTok{(vec)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1 2 3
+\end{verbatim}
+Now let's say that we want to do some analysis in the code, but just
+print the result and not the code itself. For this, we need to add the
+option `echo = FALSE'.
+\begin{verbatim}
+```{r second_r_chunk, echo = FALSE}
+vec2 <- c(10, 20, 30)
+vec3 <- vec * vec2
+print(vec3)
+```
+\end{verbatim}
+Here is how this block will show up in the document. Observe that the
+code is not shown and we only see the execution result in a white box
+\begin{verbatim}
+## [1] 10 40 90
+\end{verbatim}
+A description of the available chunk options can be found in
+\url{https://yihui.name/knitr/}.
+Let's add another R chunk with a function definition. In this example, a
+vector `r\_vec' is created and a new function `reduce\_sum' is defined.
+The chunk specification is
+\begin{verbatim}
+```{r data_creation}
+r_vec <- c(1, 2, 3, 4, 5)
+reduce_sum <- function(...) {
+  Reduce(sum, as.list(...))
+}
+```
+\end{verbatim}
+and this is what it will look like once executed. From now on, to be
+concise in the presentation we will not show chunk definitions any
+longer.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{r_vec <-}\StringTok{ }\KeywordTok{c}\NormalTok{(}\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{, }\DecValTok{4}\NormalTok{, }\DecValTok{5}\NormalTok{)}
+\NormalTok{reduce_sum <-}\StringTok{ }\ControlFlowTok{function}\NormalTok{(...) \{}
+  \KeywordTok{Reduce}\NormalTok{(sum, }\KeywordTok{as.list}\NormalTok{(...))}
+\NormalTok{\}}
+\end{Highlighting}
+\end{Shaded}
+We can, possibly in another chunk, access the vector and call the
+function as follows:
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{print}\NormalTok{(r_vec)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1 2 3 4 5
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{print}\NormalTok{(}\KeywordTok{reduce_sum}\NormalTok{(r_vec))}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 15
+\end{verbatim}
+\subsection{R Graphics with ggplot}\label{r-graphics-with-ggplot}
+In the following chunk, we create a bubble chart in R using ggplot and
+include it in this document. Note that there is no directive in the code
+to include the image, this occurs automatically. The `mpg' dataframe is
+natively available to R and to Galaaz as well.
+For the reader not knowledgeable of ggplot, ggplot is a graphics library
+based on ``the grammar of graphics'' (Wilkinson 2005). The idea of the
+grammar of graphics is to build a graphics by adding layers to the plot.
+More information can be found in
+\url{https://towardsdatascience.com/a-comprehensive-guide-to-the-grammar-of-graphics-for-effective-visualization-of-multi-dimensional-1f92b4ed4149}.
+In the plot below the `mpg' dataset from base R is used. ``The data
+concerns city-cycle fuel consumption in miles per gallon, to be
+predicted in terms of 3 multivalued discrete and 5 continuous
+attributes.'' (Quinlan, 1993)
+First, the `mpg' dataset is filtered to extract only cars from the
+following manufacturers: Audi, Ford, Honda, and Hyundai and stored in the
+`mpg\_select' variable. Then, the selected dataframe is passed to the
+ggplot function specifying in the aesthetic method (aes) that
+`displacement' (displ) should be plotted in the `x' axis and `city
+mileage' (cty) should be on the `y' axis. In the `labs' layer we pass the
+`title' and `subtitle' for the plot. To the basic plot `g', geom\_jitter
+is added, that plots cars from the same manufacturer with the same color
+(col=manufacturer) and the size of the car point equal to its highway
+consumption (size = hwy). Finally, a last layer is plotted containing a
+linear regression line (method = ``lm'') for every manufacturer.
+\begin{Shaded}
+\begin{Highlighting}[]
+\CommentTok{# load package and data}
+\KeywordTok{library}\NormalTok{(ggplot2)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## Message:
+##  Registered S3 methods overwritten by 'ggplot2':
+##   method         from
+##   [.quosures     rlang
+##   c.quosures     rlang
+##   print.quosures rlang
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{data}\NormalTok{(mpg, }\DataTypeTok{package=}\StringTok{"ggplot2"}\NormalTok{)}
+\NormalTok{mpg_select <-}\StringTok{ }\NormalTok{mpg[mpg}\OperatorTok{$}\NormalTok{manufacturer }\OperatorTok{%in%}\StringTok{ }\KeywordTok{c}\NormalTok{(}\StringTok{"audi"}\NormalTok{, }\StringTok{"ford"}\NormalTok{, }\StringTok{"honda"}\NormalTok{, }\StringTok{"hyundai"}\NormalTok{), ]}
+\CommentTok{# Scatterplot}
+\KeywordTok{theme_set}\NormalTok{(}\KeywordTok{theme_bw}\NormalTok{())  }\CommentTok{# pre-set the bw theme.}
+\NormalTok{g <-}\StringTok{ }\KeywordTok{ggplot}\NormalTok{(mpg_select, }\KeywordTok{aes}\NormalTok{(displ, cty)) }\OperatorTok{+}\StringTok{ }
+\StringTok{  }\KeywordTok{labs}\NormalTok{(}\DataTypeTok{subtitle=}\StringTok{"mpg: Displacement vs City Mileage"}\NormalTok{,}
+       \DataTypeTok{title=}\StringTok{"Bubble chart"}\NormalTok{)}
+\NormalTok{g }\OperatorTok{+}\StringTok{ }\KeywordTok{geom_jitter}\NormalTok{(}\KeywordTok{aes}\NormalTok{(}\DataTypeTok{col=}\NormalTok{manufacturer, }\DataTypeTok{size=}\NormalTok{hwy)) }\OperatorTok{+}\StringTok{ }
+\StringTok{  }\KeywordTok{geom_smooth}\NormalTok{(}\KeywordTok{aes}\NormalTok{(}\DataTypeTok{col=}\NormalTok{manufacturer), }\DataTypeTok{method=}\StringTok{"lm"}\NormalTok{, }\DataTypeTok{se=}\NormalTok{F)}
+\end{Highlighting}
+\end{Shaded}
+\includegraphics{manual_files/figure-latex/bubble-1.png}
+\subsection{Ruby chunks}\label{ruby-chunks}
+Including a Ruby chunk is just as easy as including an R chunk in the
+document: just change the name of the engine to `ruby'. It is also
+possible to pass chunk options to the Ruby engine; however, this version
+does not accept all the options that are available to R chunks. Future
+versions will add those options.
+\begin{verbatim}
+```{ruby first_ruby_chunk}
+```
+\end{verbatim}
+In this example, the ruby chunk is called `first\_ruby\_chunk'. One
+important aspect of chunk labels is that they cannot be duplicated. If a
+chunk label is duplicated, gKnit will stop with an error.
+In the following chunk, variables `a', `b' and `c' are standard Ruby
+variables and `vec' and `vec2' are two vectors created by calling the
+`c' method on the R module.
+In Galaaz, the R module allows us to access R functions transparently.
+The `c' function in R, is a function that concatenates its arguments
+making a vector.
+It should be clear that there is no requirement in gknit to call or use
+any R functions. gKnit will knit standard Ruby code, or even general
+text without any code.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{a = [}\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{]}
+\NormalTok{b = }\StringTok{"US$ 250.000"}
+\NormalTok{c = }\StringTok{"The 'outputs' function"}
+\NormalTok{vec = R.c(}\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{)}
+\NormalTok{vec2 = R.c(}\DecValTok{10}\NormalTok{, }\DecValTok{20}\NormalTok{, }\DecValTok{30}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+In the next block, variables `a', `vec' and `vec2' are used and printed.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts a}
+\NormalTok{puts vec * vec2}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## 1
+## 2
+## 3
+## [1] 10 40 90
+\end{verbatim}
+Note that `a' is a standard Ruby Array and `vec' and `vec2' are vectors
+that behave accordingly, where multiplication works as expected.
+\subsection{Inline Ruby code}\label{inline-ruby-code}
+When using a Ruby chunk, the code and the output are formatted in blocks
+as seen above. This formatting is not always desired. Sometimes, we want
+to have the results of the Ruby evaluation included in the middle of a
+phrase. gKnit allows adding inline Ruby code with the `rb' engine. The
+following chunk specification will create an inline Ruby text:
+\begin{verbatim}
+This is some text with inline Ruby accessing variable 'b' which has value:
+```{rb puts b}
+```
+and is followed by some other text!
+\end{verbatim}
+This is some text with inline Ruby accessing variable `b' which has
+value: US\$ 250.000 and is followed by some other text!
+Note that it is important not to add any new line before or after the
+code block if we want everything to be in only one line, resulting in
+the following sentence with inline Ruby code.
+\subsubsection{\texorpdfstring{The `outputs'
+function}{The outputs function}}\label{the-outputs-function}
+We have previously used the standard `puts' method in Ruby chunks in
+order to produce output. The result of a `puts', as seen in all previous
+chunks that use it, is formatted inside a white box that follows the
+code block. Many times however, we would like to do some processing in
+the Ruby chunk and have the result of this processing generate an
+output that is ``included'' in the document as if we had typed it in
+the \textbf{R markdown} document.
+For example, suppose we want to create a new heading in our document,
+but the heading phrase is the result of some code processing: maybe it's
+the first line of a file we are going to read. Method `outputs' adds its
+output as if typed in the \textbf{R markdown} document.
+Take a look now at variable `c', which was defined in a previous block
+above as c = ``The `outputs' function''. ``The `outputs' function'' is
+actually the name of this section and it was created using the `outputs'
+function inside a Ruby chunk.
+The ruby chunk to generate this heading is:
+\begin{verbatim}
+```{ruby heading}
+outputs "### #{c}"
+```
+\end{verbatim}
+The three `\#\#\#' is the way we add a Heading 3 in \textbf{R markdown}.
+\subsubsection{HTML Output from Ruby
+Chunks}\label{html-output-from-ruby-chunks}
+We've just seen the use of method `outputs' to add text to the
+\textbf{R markdown} document. This technique can also be used to add
+HTML code to the document. In \textbf{R markdown}, any html code typed
+directly in the document will be properly rendered.\\
+Here, for instance, is a table definition in HTML and its output in the
+document:
+\begin{verbatim}
+<table style="width:100%">
+  <tr>
+    <th>Firstname</th>
+    <th>Lastname</th>
+    <th>Age</th>
+  </tr>
+  <tr>
+    <td>Jill</td>
+    <td>Smith</td>
+    <td>50</td>
+  </tr>
+  <tr>
+    <td>Eve</td>
+    <td>Jackson</td>
+    <td>94</td>
+  </tr>
+</table>
+\end{verbatim}
+\begin{verbatim}
+<th>Firstname</th>
+<th>Lastname</th>
+<th>Age</th>
+\end{verbatim}
+\begin{verbatim}
+<td>Jill</td>
+<td>Smith</td>
+<td>50</td>
+\end{verbatim}
+\begin{verbatim}
+<td>Eve</td>
+<td>Jackson</td>
+<td>94</td>
+\end{verbatim}
+But manually creating HTML output is not always easy or desirable,
+especially if we intend the document to be rendered in other formats, for
+example, as Latex. Also, the above table looks ugly. The `kableExtra'
+library is a great library for creating beautiful tables. Take a look at
+\url{https://cran.r-project.org/web/packages/kableExtra/vignettes/awesome_table_in_html.html}
+In the next chunk, we output the `mtcars' dataframe from R in a nicely
+formatted table. Note that we retrieve the mtcars dataframe by using
+`\textasciitilde{}:mtcars'.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{R.install_and_loads(}\StringTok{'kableExtra'}\NormalTok{)}
+\NormalTok{outputs (~}\StringTok{:mtcars}\NormalTok{).kable.kable_styling}
+\end{Highlighting}
+\end{Shaded}
+\begin{table}[H]
+\centering
+\begin{tabular}{l|r|r|r|r|r|r|r|r|r|r|r}
+\hline
+  & mpg & cyl & disp & hp & drat & wt & qsec & vs & am & gear & carb\\
+\hline
+Mazda RX4 & 21.0 & 6 & 160.0 & 110 & 3.90 & 2.620 & 16.46 & 0 & 1 & 4 & 4\\
+\hline
+Mazda RX4 Wag & 21.0 & 6 & 160.0 & 110 & 3.90 & 2.875 & 17.02 & 0 & 1 & 4 & 4\\
+\hline
+Datsun 710 & 22.8 & 4 & 108.0 & 93 & 3.85 & 2.320 & 18.61 & 1 & 1 & 4 & 1\\
+\hline
+Hornet 4 Drive & 21.4 & 6 & 258.0 & 110 & 3.08 & 3.215 & 19.44 & 1 & 0 & 3 & 1\\
+\hline
+Hornet Sportabout & 18.7 & 8 & 360.0 & 175 & 3.15 & 3.440 & 17.02 & 0 & 0 & 3 & 2\\
+\hline
+Valiant & 18.1 & 6 & 225.0 & 105 & 2.76 & 3.460 & 20.22 & 1 & 0 & 3 & 1\\
+\hline
+Duster 360 & 14.3 & 8 & 360.0 & 245 & 3.21 & 3.570 & 15.84 & 0 & 0 & 3 & 4\\
+\hline
+Merc 240D & 24.4 & 4 & 146.7 & 62 & 3.69 & 3.190 & 20.00 & 1 & 0 & 4 & 2\\
+\hline
+Merc 230 & 22.8 & 4 & 140.8 & 95 & 3.92 & 3.150 & 22.90 & 1 & 0 & 4 & 2\\
+\hline
+Merc 280 & 19.2 & 6 & 167.6 & 123 & 3.92 & 3.440 & 18.30 & 1 & 0 & 4 & 4\\
+\hline
+Merc 280C & 17.8 & 6 & 167.6 & 123 & 3.92 & 3.440 & 18.90 & 1 & 0 & 4 & 4\\
+\hline
+Merc 450SE & 16.4 & 8 & 275.8 & 180 & 3.07 & 4.070 & 17.40 & 0 & 0 & 3 & 3\\
+\hline
+Merc 450SL & 17.3 & 8 & 275.8 & 180 & 3.07 & 3.730 & 17.60 & 0 & 0 & 3 & 3\\
+\hline
+Merc 450SLC & 15.2 & 8 & 275.8 & 180 & 3.07 & 3.780 & 18.00 & 0 & 0 & 3 & 3\\
+\hline
+Cadillac Fleetwood & 10.4 & 8 & 472.0 & 205 & 2.93 & 5.250 & 17.98 & 0 & 0 & 3 & 4\\
+\hline
+Lincoln Continental & 10.4 & 8 & 460.0 & 215 & 3.00 & 5.424 & 17.82 & 0 & 0 & 3 & 4\\
+\hline
+Chrysler Imperial & 14.7 & 8 & 440.0 & 230 & 3.23 & 5.345 & 17.42 & 0 & 0 & 3 & 4\\
+\hline
+Fiat 128 & 32.4 & 4 & 78.7 & 66 & 4.08 & 2.200 & 19.47 & 1 & 1 & 4 & 1\\
+\hline
+Honda Civic & 30.4 & 4 & 75.7 & 52 & 4.93 & 1.615 & 18.52 & 1 & 1 & 4 & 2\\
+\hline
+Toyota Corolla & 33.9 & 4 & 71.1 & 65 & 4.22 & 1.835 & 19.90 & 1 & 1 & 4 & 1\\
+\hline
+Toyota Corona & 21.5 & 4 & 120.1 & 97 & 3.70 & 2.465 & 20.01 & 1 & 0 & 3 & 1\\
+\hline
+Dodge Challenger & 15.5 & 8 & 318.0 & 150 & 2.76 & 3.520 & 16.87 & 0 & 0 & 3 & 2\\
+\hline
+AMC Javelin & 15.2 & 8 & 304.0 & 150 & 3.15 & 3.435 & 17.30 & 0 & 0 & 3 & 2\\
+\hline
+Camaro Z28 & 13.3 & 8 & 350.0 & 245 & 3.73 & 3.840 & 15.41 & 0 & 0 & 3 & 4\\
+\hline
+Pontiac Firebird & 19.2 & 8 & 400.0 & 175 & 3.08 & 3.845 & 17.05 & 0 & 0 & 3 & 2\\
+\hline
+Fiat X1-9 & 27.3 & 4 & 79.0 & 66 & 4.08 & 1.935 & 18.90 & 1 & 1 & 4 & 1\\
+\hline
+Porsche 914-2 & 26.0 & 4 & 120.3 & 91 & 4.43 & 2.140 & 16.70 & 0 & 1 & 5 & 2\\
+\hline
+Lotus Europa & 30.4 & 4 & 95.1 & 113 & 3.77 & 1.513 & 16.90 & 1 & 1 & 5 & 2\\
+\hline
+Ford Pantera L & 15.8 & 8 & 351.0 & 264 & 4.22 & 3.170 & 14.50 & 0 & 1 & 5 & 4\\
+\hline
+Ferrari Dino & 19.7 & 6 & 145.0 & 175 & 3.62 & 2.770 & 15.50 & 0 & 1 & 5 & 6\\
+\hline
+Maserati Bora & 15.0 & 8 & 301.0 & 335 & 3.54 & 3.570 & 14.60 & 0 & 1 & 5 & 8\\
+\hline
+Volvo 142E & 21.4 & 4 & 121.0 & 109 & 4.11 & 2.780 & 18.60 & 1 & 1 & 4 & 2\\
+\hline
+\end{tabular}
+\end{table}
+\subsection{Including Ruby files in a
+chunk}\label{including-ruby-files-in-a-chunk}
+R is a language that was created to be easy and fast for statisticians
+to use. As far as I know, it was not a language to be used for
+developing large systems. Of course, there are large systems and
+libraries in R, but the focus of the language is on developing
+statistical models and distributing them to peers.
+Ruby on the other hand, is a language for large software development.
+Systems written in Ruby will have dozens, hundreds or even thousands of
+files. To document a large system with literate programming, we cannot
+expect the developer to add all the files in a single `.Rmd' file. gKnit
+provides the `include' chunk engine to include a Ruby file as if it had
+been typed in the `.Rmd' file.
+To include a file, the following chunk should be created, where
+\textless{}filename\textgreater{} is the name of the file to be
+included and where the extension, if it is `.rb',
+does not need to be added. If the `relative' option is not included,
+then it is treated as TRUE. When `relative' is true, ruby's
+`require\_relative' semantics is used to load the file, when false,
+Ruby's \$LOAD\_PATH is searched to find the file and it is 'require'd.
+\begin{verbatim}
+```{include <filename>, relative = <TRUE/FALSE>}
+```
+\end{verbatim}
+Below we include file `model.rb', which is in the same directory as
+this blog.\\
+This code uses R's `caret' package to split a dataset into train and test
+sets. The `caret' package is a very important and useful package for doing
+Data Analysis, it has hundreds of functions for all steps of the Data
+Analysis workflow. To use `caret' just to split a dataset is like using
+the proverbial cannon to kill the fly. We use it here only to show that
+integrating Ruby and R and using even a very complex package as `caret'
+is trivial with Galaaz.
+A word of advice: the `caret' package has lots of dependencies and
+installing it in a Linux system is a time consuming operation. Method
+`R.install\_and\_loads' will install the package if it is not already
+installed and can take a while.
+\begin{verbatim}
+```{include model}
+```
+\end{verbatim}
+\begin{verbatim}
+require 'galaaz'
+# Loads the R 'caret' package.  If not present, installs it
+R.install_and_loads 'caret'
+class Model
+  attr_reader :data
+  attr_reader :test
+  attr_reader :train
+  #==========================================================
+  #
+  #==========================================================
+  def initialize(data, percent_train:, seed: 123)
+    R.set__seed(seed)
+    @data = data
+    @percent_train = percent_train
+    @seed = seed
+  end
+  #==========================================================
+  #
+  #==========================================================
+  def partition(field)
+    train_index =
+      R.createDataPartition(@data.send(field), p: @percet_train,
+                            list: false, times: 1)
+    @train = @data[train_index, :all]
+    @test = @data[-train_index, :all]
+  end
+end
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{mtcars = ~}\StringTok{:mtcars}
+\NormalTok{model = }\DataTypeTok{Model}\NormalTok{.new(mtcars, }\StringTok{percent_train: }\FloatTok{0.8}\NormalTok{)}
+\NormalTok{model.partition(}\StringTok{:mpg}\NormalTok{)}
+\NormalTok{puts model.train.head}
+\NormalTok{puts model.test.head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##                mpg cyl  disp  hp drat    wt  qsec vs am gear carb
+## Mazda RX4     21.0   6 160.0 110 3.90 2.620 16.46  0  1    4    4
+## Mazda RX4 Wag 21.0   6 160.0 110 3.90 2.875 17.02  0  1    4    4
+## Valiant       18.1   6 225.0 105 2.76 3.460 20.22  1  0    3    1
+## Merc 280      19.2   6 167.6 123 3.92 3.440 18.30  1  0    4    4
+## Merc 280C     17.8   6 167.6 123 3.92 3.440 18.90  1  0    4    4
+## Merc 450SE    16.4   8 275.8 180 3.07 4.070 17.40  0  0    3    3
+##                    mpg cyl  disp  hp drat    wt  qsec vs am gear carb
+## Datsun 710        22.8   4 108.0  93 3.85 2.320 18.61  1  1    4    1
+## Hornet 4 Drive    21.4   6 258.0 110 3.08 3.215 19.44  1  0    3    1
+## Hornet Sportabout 18.7   8 360.0 175 3.15 3.440 17.02  0  0    3    2
+## Duster 360        14.3   8 360.0 245 3.21 3.570 15.84  0  0    3    4
+## Merc 240D         24.4   4 146.7  62 3.69 3.190 20.00  1  0    4    2
+## Merc 230          22.8   4 140.8  95 3.92 3.150 22.90  1  0    4    2
+\end{verbatim}
+\subsection{Documenting Gems}\label{documenting-gems}
+gKnit also allows developers to document and load files that are not in
+the same directory of the `.Rmd' file.
+Here is an example of loading the `find.rb' file from TruffleRuby. In
+this example, relative is set to FALSE, so Ruby will look for the file
+in its \$LOAD\_PATH, and the user does not need to know its directory.
+\begin{verbatim}
+```{include find, relative = FALSE}
+```
+\end{verbatim}
+\begin{verbatim}
+# frozen_string_literal: true
+#
+# find.rb: the Find module for processing all files under a given directory.
+#
+#
+# The +Find+ module supports the top-down traversal of a set of file paths.
+#
+# For example, to total the size of all files under your home directory,
+# ignoring anything in a "dot" directory (e.g. $HOME/.ssh):
+#
+#   require 'find'
+#
+#   total_size = 0
+#
+#   Find.find(ENV["HOME"]) do |path|
+#     if FileTest.directory?(path)
+#       if File.basename(path)[0] == ?.
+#         Find.prune       # Don't look any further into this directory.
+#       else
+#         next
+#       end
+#     else
+#       total_size += FileTest.size(path)
+#     end
+#   end
+#
+module Find
+  #
+  # Calls the associated block with the name of every file and directory listed
+  # as arguments, then recursively on their subdirectories, and so on.
+  #
+  # Returns an enumerator if no block is given.
+  #
+  # See the +Find+ module documentation for an example.
+  #
+  def find(*paths, ignore_error: true) # :yield: path
+    block_given? or return enum_for(__method__, *paths, ignore_error: ignore_error)
+    fs_encoding = Encoding.find("filesystem")
+    paths.collect!{|d| raise Errno::ENOENT, d unless File.exist?(d); d.dup}.each do |path|
+      path = path.to_path if path.respond_to? :to_path
+      enc = path.encoding == Encoding::US_ASCII ? fs_encoding : path.encoding
+      ps = [path]
+      while file = ps.shift
+        catch(:prune) do
+          yield file.dup.taint
+          begin
+            s = File.lstat(file)
+          rescue Errno::ENOENT, Errno::EACCES, Errno::ENOTDIR, Errno::ELOOP, Errno::ENAMETOOLONG
+            raise unless ignore_error
+            next
+          end
+          if s.directory? then
+            begin
+              fs = Dir.children(file, encoding: enc)
+            rescue Errno::ENOENT, Errno::EACCES, Errno::ENOTDIR, Errno::ELOOP, Errno::ENAMETOOLONG
+              raise unless ignore_error
+              next
+            end
+            fs.sort!
+            fs.reverse_each {|f|
+              f = File.join(file, f)
+              ps.unshift f.untaint
+            }
+          end
+        end
+      end
+    end
+    nil
+  end
+  #
+  # Skips the current file or directory, restarting the loop with the next
+  # entry. If the current file is a directory, that directory will not be
+  # recursively entered. Meaningful only within the block associated with
+  # Find::find.
+  #
+  # See the +Find+ module documentation for an example.
+  #
+  def prune
+    throw :prune
+  end
+  module_function :find, :prune
+end
+\end{verbatim}
+\subsection{Converting to PDF}\label{converting-to-pdf}
+One of the beauties of knitr is that the same input can be converted to
+many different outputs. One very useful format is, of course, PDF. In
+order to convert an \textbf{R markdown} file to PDF it is necessary to
+have LaTeX installed on the system. We will not explain here how to
+install LaTeX as there are plenty of documents on the web showing how to
+proceed.
+gKnit comes with a simple LaTeX style file for gknitting this blog as a
+PDF document. Here is the Yaml header to generate this blog in PDF
+format instead of HTML:
+\begin{verbatim}
+---
+title: "gKnit - Ruby and R Knitting with Galaaz in GraalVM"
+author: "Rodrigo Botafogo"
+tags: [Galaaz, Ruby, R, TruffleRuby, FastR, GraalVM, knitr, gknit]
+date: "29 October 2018"
+output:
+  pdf\_document:
+    includes:
+      in\_header: ["../../sty/galaaz.sty"]
+    number\_sections: yes
+---
+\end{verbatim}
+\subsection{Template based documents
+generation}\label{template-based-documents-generation}
+When a document is converted to PDF it follows a certain conversion
+template. We've seen above the use of `galaaz.sty' as a basic template
+to generate a PDF document. Using the `gknit-draft' app that comes with
+Galaaz, the same .Rmd file can be compiled to different looking PDF
+documents. Galaaz automatically loads the `rticles' R package that comes
+with templates for the following journals with the respective template
+name:
+\begin{itemize}
+\tightlist
+\item
+  ACM articles: acm\_article
+\item
+  ACS articles: acs\_article
+\item
+  AEA journal submissions: aea\_article
+\item
+  AGU journal submissions: ????
+\item
+  AMS articles: ams\_article
+\item
+  American Statistical Association: asa\_article
+\item
+  Biometrics articles: biometrics\_article
+\item
+  Bulletin de l'AMQ journal submissions: amq\_article
+\item
+  CTeX documents: ctex
+\item
+  Elsevier journal submissions: elsevier\_article
+\item
+  IEEE Transaction journal submissions: ieee\_article
+\item
+  JSS articles: jss\_article
+\item
+  MDPI journal submissions: mdpi\_article
+\item
+  Monthly Notices of the Royal Astronomical Society articles:
+  mnras\_article
+\item
+  NNRAS journal submissions: nmras\_article
+\item
+  PeerJ articles: peerj\_article
+\item
+  Royal Society Open Science journal submissions: rsos\_article
+\item
+  Royal Statistical Society: rss\_article
+\item
+  Sage journal submissions: sage\_article
+\item
+  Springer journal submissions: springer\_article
+\item
+  Statistics in Medicine journal submissions: sim\_article
+\item
+  Copernicus Publications journal submissions: copernicus\_article
+\item
+  The R Journal articles: rjournal\_article
+\item
+  Frontiers articles: ???
+\item
+  Taylor \& Francis articles: ???
+\item
+  Bulletin De L'AMQ: amq\_article
+\item
+  PLOS journal: plos\_article
+\item
+  Proceedings of the National Academy of Sciences of the USA:
+  pnas\_article
+\end{itemize}
+In order to create a document with one of those templates, use the
+following command:
+\begin{verbatim}
+gknit-draft --filename <my_document> --template <template> --package <package>
+            --create_dir
+\end{verbatim}
+So, in order to create a template for writing an R Journal, use:
+\begin{verbatim}
+gknit-draft --filename my_r_article --template rjournal_article --package rticles
+            --create_dir
+\end{verbatim}
+\section{Accessing R variables}\label{accessing-r-variables}
+Galaaz allows Ruby to access variables created in R. For example, the
+`mtcars' data set is available in R and can be accessed from Ruby by
+using the `tilde' operator followed by the symbol for the variable, in
+this case `:mtcars'. In the code below method `outputs' is used to
+output the `mtcars' data set nicely formatted in HTML by use of the
+`kable' and `kable\_styling' functions. Method `outputs' is only
+available when used with `gknit'.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{outputs (~}\StringTok{:mtcars}\NormalTok{).kable.kable_styling}
+\end{Highlighting}
+\end{Shaded}
+\begin{table}[H]
+\centering
+\begin{tabular}{l|r|r|r|r|r|r|r|r|r|r|r}
+\hline
+  & mpg & cyl & disp & hp & drat & wt & qsec & vs & am & gear & carb\\
+\hline
+Mazda RX4 & 21.0 & 6 & 160.0 & 110 & 3.90 & 2.620 & 16.46 & 0 & 1 & 4 & 4\\
+\hline
+Mazda RX4 Wag & 21.0 & 6 & 160.0 & 110 & 3.90 & 2.875 & 17.02 & 0 & 1 & 4 & 4\\
+\hline
+Datsun 710 & 22.8 & 4 & 108.0 & 93 & 3.85 & 2.320 & 18.61 & 1 & 1 & 4 & 1\\
+\hline
+Hornet 4 Drive & 21.4 & 6 & 258.0 & 110 & 3.08 & 3.215 & 19.44 & 1 & 0 & 3 & 1\\
+\hline
+Hornet Sportabout & 18.7 & 8 & 360.0 & 175 & 3.15 & 3.440 & 17.02 & 0 & 0 & 3 & 2\\
+\hline
+Valiant & 18.1 & 6 & 225.0 & 105 & 2.76 & 3.460 & 20.22 & 1 & 0 & 3 & 1\\
+\hline
+Duster 360 & 14.3 & 8 & 360.0 & 245 & 3.21 & 3.570 & 15.84 & 0 & 0 & 3 & 4\\
+\hline
+Merc 240D & 24.4 & 4 & 146.7 & 62 & 3.69 & 3.190 & 20.00 & 1 & 0 & 4 & 2\\
+\hline
+Merc 230 & 22.8 & 4 & 140.8 & 95 & 3.92 & 3.150 & 22.90 & 1 & 0 & 4 & 2\\
+\hline
+Merc 280 & 19.2 & 6 & 167.6 & 123 & 3.92 & 3.440 & 18.30 & 1 & 0 & 4 & 4\\
+\hline
+Merc 280C & 17.8 & 6 & 167.6 & 123 & 3.92 & 3.440 & 18.90 & 1 & 0 & 4 & 4\\
+\hline
+Merc 450SE & 16.4 & 8 & 275.8 & 180 & 3.07 & 4.070 & 17.40 & 0 & 0 & 3 & 3\\
+\hline
+Merc 450SL & 17.3 & 8 & 275.8 & 180 & 3.07 & 3.730 & 17.60 & 0 & 0 & 3 & 3\\
+\hline
+Merc 450SLC & 15.2 & 8 & 275.8 & 180 & 3.07 & 3.780 & 18.00 & 0 & 0 & 3 & 3\\
+\hline
+Cadillac Fleetwood & 10.4 & 8 & 472.0 & 205 & 2.93 & 5.250 & 17.98 & 0 & 0 & 3 & 4\\
+\hline
+Lincoln Continental & 10.4 & 8 & 460.0 & 215 & 3.00 & 5.424 & 17.82 & 0 & 0 & 3 & 4\\
+\hline
+Chrysler Imperial & 14.7 & 8 & 440.0 & 230 & 3.23 & 5.345 & 17.42 & 0 & 0 & 3 & 4\\
+\hline
+Fiat 128 & 32.4 & 4 & 78.7 & 66 & 4.08 & 2.200 & 19.47 & 1 & 1 & 4 & 1\\
+\hline
+Honda Civic & 30.4 & 4 & 75.7 & 52 & 4.93 & 1.615 & 18.52 & 1 & 1 & 4 & 2\\
+\hline
+Toyota Corolla & 33.9 & 4 & 71.1 & 65 & 4.22 & 1.835 & 19.90 & 1 & 1 & 4 & 1\\
+\hline
+Toyota Corona & 21.5 & 4 & 120.1 & 97 & 3.70 & 2.465 & 20.01 & 1 & 0 & 3 & 1\\
+\hline
+Dodge Challenger & 15.5 & 8 & 318.0 & 150 & 2.76 & 3.520 & 16.87 & 0 & 0 & 3 & 2\\
+\hline
+AMC Javelin & 15.2 & 8 & 304.0 & 150 & 3.15 & 3.435 & 17.30 & 0 & 0 & 3 & 2\\
+\hline
+Camaro Z28 & 13.3 & 8 & 350.0 & 245 & 3.73 & 3.840 & 15.41 & 0 & 0 & 3 & 4\\
+\hline
+Pontiac Firebird & 19.2 & 8 & 400.0 & 175 & 3.08 & 3.845 & 17.05 & 0 & 0 & 3 & 2\\
+\hline
+Fiat X1-9 & 27.3 & 4 & 79.0 & 66 & 4.08 & 1.935 & 18.90 & 1 & 1 & 4 & 1\\
+\hline
+Porsche 914-2 & 26.0 & 4 & 120.3 & 91 & 4.43 & 2.140 & 16.70 & 0 & 1 & 5 & 2\\
+\hline
+Lotus Europa & 30.4 & 4 & 95.1 & 113 & 3.77 & 1.513 & 16.90 & 1 & 1 & 5 & 2\\
+\hline
+Ford Pantera L & 15.8 & 8 & 351.0 & 264 & 4.22 & 3.170 & 14.50 & 0 & 1 & 5 & 4\\
+\hline
+Ferrari Dino & 19.7 & 6 & 145.0 & 175 & 3.62 & 2.770 & 15.50 & 0 & 1 & 5 & 6\\
+\hline
+Maserati Bora & 15.0 & 8 & 301.0 & 335 & 3.54 & 3.570 & 14.60 & 0 & 1 & 5 & 8\\
+\hline
+Volvo 142E & 21.4 & 4 & 121.0 & 109 & 4.11 & 2.780 & 18.60 & 1 & 1 & 4 & 2\\
+\hline
+\end{tabular}
+\end{table}
+\section{Basic Data Types}\label{basic-data-types}
+\subsection{Vector}\label{vector}
+Vectors can be thought of as contiguous cells containing data. Cells are
+accessed through indexing operations such as x{[}5{]}. Galaaz has six
+basic (`atomic') vector types: logical, integer, real, complex, string
+(or character) and raw. The modes and storage modes for the different
+vector types are listed in the following table.
+\begin{longtable}[]{@{}lcr@{}}
+\toprule
+typeof & mode & storage.mode\tabularnewline
+\midrule
+\endhead
+logical & logical & logical\tabularnewline
+integer & numeric & integer\tabularnewline
+double & numeric & double\tabularnewline
+complex & complex & complex\tabularnewline
+character & character & character\tabularnewline
+raw & raw & raw\tabularnewline
+\bottomrule
+\end{longtable}
+Single numbers, such as 4.2, and strings, such as ``four point two'' are
+still vectors, of length 1; there are no more basic types. Vectors with
+length zero are possible (and useful). String vectors have mode and
+storage mode ``character''. A single element of a character vector is
+often referred to as a character string.
+To create a vector the `c' (concatenate) method from the `R' module
+should be used:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{vec = R.c(}\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{)}
+\NormalTok{puts vec}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1 2 3
+\end{verbatim}
+Let's take a look at the type, mode and storage.mode of our vector vec.
+In order to print this out, we are creating a data frame `df' and
+printing it out. A data frame, for those not familiar with it, is
+basically a table. Here we create the data frame and add the column name
+by passing named parameters for each column, such as `typeof:', `mode:'
+and `storage\_\_mode:'. You should also note here that the double
+underscore is converted to a `.'. So, when printed `storage\_\_mode' will
+actually print as `storage.mode'.
+Data frames will later be more carefully described. In R, the method
+used to create a data frame is `data.frame', in Galaaz we use
+`data\_\_frame'.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{df = R.data__frame(}\StringTok{typeof: }\NormalTok{vec.typeof, }\StringTok{mode: }\NormalTok{vec.mode, }\StringTok{storage__mode: }\NormalTok{vec.storage__mode)}
+\NormalTok{puts df}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##    typeof    mode storage.mode
+## 1 integer numeric      integer
+\end{verbatim}
+If you want to create a vector with floating point numbers, then we need
+at least one of the vector's elements to be a float, such as 1.0. R users
+should be careful, since in R a number like `1' is converted to float
+and to have an integer the R developer will use `1L'. Galaaz follows
+normal Ruby rules and the number 1 is an integer and 1.0 is a float.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{vec = R.c(}\FloatTok{1.0}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{)}
+\NormalTok{puts vec}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1 2 3
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{df = R.data__frame(}\StringTok{typeof: }\NormalTok{vec.typeof, }\StringTok{mode: }\NormalTok{vec.mode, }\StringTok{storage__mode: }\NormalTok{vec.storage__mode)}
+\NormalTok{outputs df.kable.kable_styling}
+\end{Highlighting}
+\end{Shaded}
+\begin{table}[H]
+\centering
+\begin{tabular}{l|l|l}
+\hline
+typeof & mode & storage.mode\\
+\hline
+double & numeric & double\\
+\hline
+\end{tabular}
+\end{table}
+In this next example we try to create a vector with a variable `hello'
+that has not yet been defined. This will raise an exception that is
+printed out. We get two return blocks, the first with a message
+explaining what went wrong and the second with the full backtrace of the
+error.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{vec = R.c(}\DecValTok{1}\NormalTok{, hello, }\DecValTok{5}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## Message:
+##  undefined local variable or method `hello' for #<RC:0x3d8 @out_list=nil>:RC
+\end{verbatim}
+\begin{verbatim}
+## Message:
+##  /home/rbotafogo/desenv/galaaz/lib/util/exec_ruby.rb:103:in `get_binding'
+## /home/rbotafogo/desenv/galaaz/lib/util/exec_ruby.rb:102:in `eval'
+## /home/rbotafogo/desenv/galaaz/lib/util/exec_ruby.rb:102:in `exec_ruby'
+## /home/rbotafogo/desenv/galaaz/lib/gknit/knitr_engine.rb:650:in `block in initialize'
+## /home/rbotafogo/desenv/galaaz/lib/R_interface/ruby_callback.rb:77:in `call'
+## /home/rbotafogo/desenv/galaaz/lib/R_interface/ruby_callback.rb:77:in `callback'
+## (eval):3:in `function(...) {\n          rb_method(...)'
+## unknown.r:1:in `in_dir'
+## unknown.r:1:in `block_exec'
+## /usr/local/lib/graalvm-ce-java11-20.0.0/languages/R/library/knitr/R/block.R:92:in `call_block'
+## /usr/local/lib/graalvm-ce-java11-20.0.0/languages/R/library/knitr/R/block.R:6:in `process_group.block'
+## /usr/local/lib/graalvm-ce-java11-20.0.0/languages/R/library/knitr/R/block.R:3:in `<no source>'
+## unknown.r:1:in `withCallingHandlers'
+## unknown.r:1:in `process_file'
+## unknown.r:1:in `<no source>'
+## unknown.r:1:in `<no source>'
+## <REPL>:4:in `<repl wrapper>'
+## <REPL>:1
+\end{verbatim}
+Here is a vector with logical values
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{vec = R.c(}\DecValTok{true}\NormalTok{, }\DecValTok{true}\NormalTok{, }\DecValTok{false}\NormalTok{, }\DecValTok{false}\NormalTok{, }\DecValTok{true}\NormalTok{)}
+\NormalTok{puts vec}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1]  TRUE  TRUE FALSE FALSE  TRUE
+\end{verbatim}
+\subsubsection{Combining Vectors}\label{combining-vectors}
+The `c' function used to create vectors can also be used to combine two
+vectors:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{vec1 = R.c(}\FloatTok{10.0}\NormalTok{, }\FloatTok{20.0}\NormalTok{, }\FloatTok{30.0}\NormalTok{)}
+\NormalTok{vec2 = R.c(}\FloatTok{4.0}\NormalTok{, }\FloatTok{5.0}\NormalTok{, }\FloatTok{6.0}\NormalTok{)}
+\NormalTok{vec = R.c(vec1, vec2)}
+\NormalTok{puts vec}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 10 20 30  4  5  6
+\end{verbatim}
+In Galaaz, methods can be chained (somewhat like the pipe operator in R
+\%\textgreater{}\%, but more generic). In this next example, method `c'
+is chained after `vec1'. This also looks like `c' is a method of the
+vector, but in reality, this is actually closer to the pipe operator.
+When Galaaz identifies that `c' is not a method of `vec1' it actually
+tries to call `R.c' with `vec1' as the first argument concatenated with
+all the other available arguments. The code below is automatically
+converted to the code above.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{vec = vec1.c(vec2)}
+\NormalTok{puts vec}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 10 20 30  4  5  6
+\end{verbatim}
+\subsubsection{Vector Arithmetic}\label{vector-arithmetic}
+Arithmetic operations on vectors are performed element by element:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec1 + vec2}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 14 25 36
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec1 * }\DecValTok{5}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1]  50 100 150
+\end{verbatim}
+When vectors have different lengths, a recycling rule is applied to the
+shorter vector:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{vec3 = R.c(}\FloatTok{1.0}\NormalTok{, }\FloatTok{2.0}\NormalTok{, }\FloatTok{3.0}\NormalTok{, }\FloatTok{4.0}\NormalTok{, }\FloatTok{5.0}\NormalTok{, }\FloatTok{6.0}\NormalTok{, }\FloatTok{7.0}\NormalTok{, }\FloatTok{8.0}\NormalTok{, }\FloatTok{9.0}\NormalTok{)}
+\NormalTok{puts vec4 = vec1 + vec3}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 11 22 33 14 25 36 17 28 39
+\end{verbatim}
+\subsubsection{Vector Indexing}\label{vector-indexing}
+Vectors can be indexed by using the `{[}{]}' operator:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec4[}\DecValTok{3}\NormalTok{]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 33
+\end{verbatim}
+We can also index a vector with another vector. For example, in the code
+below, we take elements 1, 3, 5, and 7 from vec4:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec4[R.c(}\DecValTok{1}\NormalTok{, }\DecValTok{3}\NormalTok{, }\DecValTok{5}\NormalTok{, }\DecValTok{7}\NormalTok{)]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 11 33 25 17
+\end{verbatim}
+Repeating an index and having indices out of order is valid code:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec4[R.c(}\DecValTok{1}\NormalTok{, }\DecValTok{3}\NormalTok{, }\DecValTok{3}\NormalTok{, }\DecValTok{1}\NormalTok{)]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 11 33 33 11
+\end{verbatim}
+It is also possible to index a vector with a negative number or negative
+vector. In these cases the indexed values are not returned:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec4[-}\DecValTok{3}\NormalTok{]}
+\NormalTok{puts vec4[-R.c(}\DecValTok{1}\NormalTok{, }\DecValTok{3}\NormalTok{, }\DecValTok{5}\NormalTok{, }\DecValTok{7}\NormalTok{)]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 11 22 14 25 36 17 28 39
+## [1] 22 14 36 28 39
+\end{verbatim}
+If an index is out of range, a missing value (NA) will be reported.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec4[}\DecValTok{30}\NormalTok{]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] NA
+\end{verbatim}
+It is also possible to index a vector by range:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec4[(}\DecValTok{2}\NormalTok{..}\DecValTok{5}\NormalTok{)]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 22 33 14 25
+\end{verbatim}
+Elements in a vector can be named using the `names' attribute of a
+vector:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{full_name = R.c(}\StringTok{"Rodrigo"}\NormalTok{, }\StringTok{"A"}\NormalTok{, }\StringTok{"Botafogo"}\NormalTok{)}
+\NormalTok{full_name.names = R.c(}\StringTok{"First"}\NormalTok{, }\StringTok{"Middle"}\NormalTok{, }\StringTok{"Last"}\NormalTok{)}
+\NormalTok{puts full_name}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##      First     Middle       Last
+##  "Rodrigo"        "A" "Botafogo"
+\end{verbatim}
+Or it can also be named by using the `c' function with named
+parameters:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{full_name = R.c(}\DataTypeTok{First}\NormalTok{: }\StringTok{"Rodrigo"}\NormalTok{, }\DataTypeTok{Middle}\NormalTok{: }\StringTok{"A"}\NormalTok{, }\DataTypeTok{Last}\NormalTok{: }\StringTok{"Botafogo"}\NormalTok{)}
+\NormalTok{puts full_name}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##      First     Middle       Last
+##  "Rodrigo"        "A" "Botafogo"
+\end{verbatim}
+\subsubsection{Extracting Native Ruby Types from a
+Vector}\label{extracting-native-ruby-types-from-a-vector}
+Vectors created with `R.c' are of class R::Vector. You might have
+noticed that when indexing a vector, a new vector is returned, even if
+this vector has one single element. In order to use R::Vector with other
+ruby classes it might be necessary to extract the actual Ruby native
+type from the vector. In order to do this extraction the
+`\textgreater{}\textgreater{}' operator is used.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts vec4}
+\NormalTok{puts vec4 >> }\DecValTok{0}
+\NormalTok{puts vec4 >> }\DecValTok{4}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 11 22 33 14 25 36 17 28 39
+## 11.0
+## 25.0
+\end{verbatim}
+Note that indexing with `\textgreater{}\textgreater{}' starts at 0 and
+not at 1, also, we cannot do negative indexing.
+\subsection{Matrix}\label{matrix}
+A matrix is a collection of elements organized as a two dimensional
+table. A matrix can be created by the `matrix' function:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{mat = R.matrix(R.c(}\FloatTok{1.0}\NormalTok{, }\FloatTok{2.0}\NormalTok{, }\FloatTok{3.0}\NormalTok{, }\FloatTok{4.0}\NormalTok{, }\FloatTok{5.0}\NormalTok{, }\FloatTok{6.0}\NormalTok{, }\FloatTok{7.0}\NormalTok{, }\FloatTok{8.0}\NormalTok{, }\FloatTok{9.0}\NormalTok{),}
+               \StringTok{nrow: }\DecValTok{3}\NormalTok{,}
+               \StringTok{ncol: }\DecValTok{3}\NormalTok{)}
+\NormalTok{puts mat}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##      [,1] [,2] [,3]
+## [1,]    1    4    7
+## [2,]    2    5    8
+## [3,]    3    6    9
+\end{verbatim}
+Note that matrix data is organized by column first. It is possible to
+organize the matrix memory by row first passing an extra argument to the
+`matrix' function:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{mat_row = R.matrix(R.c(}\FloatTok{1.0}\NormalTok{, }\FloatTok{2.0}\NormalTok{, }\FloatTok{3.0}\NormalTok{, }\FloatTok{4.0}\NormalTok{, }\FloatTok{5.0}\NormalTok{, }\FloatTok{6.0}\NormalTok{, }\FloatTok{7.0}\NormalTok{, }\FloatTok{8.0}\NormalTok{, }\FloatTok{9.0}\NormalTok{),}
+                   \StringTok{nrow: }\DecValTok{3}\NormalTok{,}
+                   \StringTok{ncol: }\DecValTok{3}\NormalTok{,}
+                   \StringTok{byrow: }\DecValTok{true}\NormalTok{)}
+\NormalTok{puts mat_row}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##      [,1] [,2] [,3]
+## [1,]    1    2    3
+## [2,]    4    5    6
+## [3,]    7    8    9
+\end{verbatim}
+\subsubsection{Indexing a Matrix}\label{indexing-a-matrix}
+A matrix can be indexed by {[}row, column{]}:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts mat_row[}\DecValTok{1}\NormalTok{, }\DecValTok{1}\NormalTok{]}
+\NormalTok{puts mat_row[}\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1
+## [1] 6
+\end{verbatim}
+It is possible to index an entire row or column with the `:all' keyword
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts mat_row[}\DecValTok{1}\NormalTok{, }\StringTok{:all}\NormalTok{]}
+\NormalTok{puts mat_row[}\StringTok{:all}\NormalTok{, }\DecValTok{2}\NormalTok{]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1 2 3
+## [1] 2 5 8
+\end{verbatim}
+Indexing with a vector is also possible for matrices. In the following
+example we want rows 1 and 3 and columns 2 and 3 building a 2 x 2
+matrix.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts mat_row[R.c(}\DecValTok{1}\NormalTok{, }\DecValTok{3}\NormalTok{), R.c(}\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{)]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##      [,1] [,2]
+## [1,]    2    3
+## [2,]    8    9
+\end{verbatim}
+Matrices can be combined with functions `rbind':
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts mat_row.rbind(mat)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##      [,1] [,2] [,3]
+## [1,]    1    2    3
+## [2,]    4    5    6
+## [3,]    7    8    9
+## [4,]    1    4    7
+## [5,]    2    5    8
+## [6,]    3    6    9
+\end{verbatim}
+and `cbind':
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts mat_row.cbind(mat)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##      [,1] [,2] [,3] [,4] [,5] [,6]
+## [1,]    1    2    3    1    4    7
+## [2,]    4    5    6    2    5    8
+## [3,]    7    8    9    3    6    9
+\end{verbatim}
+\subsection{List}\label{list}
+A list is a data structure that can contain sublists of different types,
+while vector and matrix can only hold one type of element.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{nums = R.c(}\FloatTok{1.0}\NormalTok{, }\FloatTok{2.0}\NormalTok{, }\FloatTok{3.0}\NormalTok{)}
+\NormalTok{strs = R.c(}\StringTok{"a"}\NormalTok{, }\StringTok{"b"}\NormalTok{, }\StringTok{"c"}\NormalTok{, }\StringTok{"d"}\NormalTok{)}
+\NormalTok{bool = R.c(}\DecValTok{true}\NormalTok{, }\DecValTok{true}\NormalTok{, }\DecValTok{false}\NormalTok{)}
+\NormalTok{lst = R.list(}\StringTok{nums: }\NormalTok{nums, }\StringTok{strs: }\NormalTok{strs, }\StringTok{bool: }\NormalTok{bool)}
+\NormalTok{puts lst}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## $nums
+## [1] 1 2 3
+##
+## $strs
+## [1] "a" "b" "c" "d"
+##
+## $bool
+## [1]  TRUE  TRUE FALSE
+\end{verbatim}
+Note that `lst' elements are named elements.
+\subsubsection{List Indexing}\label{list-indexing}
+List indexing, also called slicing, is done using the `{[}{]}' operator
+and the `{[}{[}{]}{]}' operator. Let's first start with the `{[}{]}'
+operator. The list above has three sublists; indexing with `{[}{]}' will
+return one of the sublists.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts lst[}\DecValTok{1}\NormalTok{]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## $nums
+## [1] 1 2 3
+\end{verbatim}
+Note that when using `{[}{]}' a new list is returned. When using the
+double square bracket operator the value returned is the actual element
+of the list in the given position and not a slice of the original list
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts lst[[}\DecValTok{1}\NormalTok{]]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 1 2 3
+\end{verbatim}
+When elements are named, as done with lst, indexing can be done by
+name:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts lst[[}\StringTok{'bool'}\NormalTok{]][[}\DecValTok{1}\NormalTok{]] >> }\DecValTok{0}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## true
+\end{verbatim}
+In this example, first the `bool' element of the list was extracted, not
+as a list, but as a vector, then the first element of the vector was
+extracted (note that vectors also accept the `{[}{[}{]}{]}' operator)
+and then the vector was indexed by its first element, extracting the
+native Ruby type.
+\subsection{Data Frame}\label{data-frame}
+A data frame is a table like structure in which each column has the same
+number of rows. Data frames are the basic structure for storing data for
+data analysis. We have already seen a data frame previously when we
+accessed variable `\textasciitilde{}:mtcars'. In order to create a data
+frame, function `data\_\_frame' is used:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{df = R.data__frame(}
+  \StringTok{year: }\NormalTok{R.c(}\DecValTok{2010}\NormalTok{, }\DecValTok{2011}\NormalTok{, }\DecValTok{2012}\NormalTok{),}
+  \StringTok{income: }\NormalTok{R.c(}\FloatTok{1000.0}\NormalTok{, }\FloatTok{1500.0}\NormalTok{, }\FloatTok{2000.0}\NormalTok{))}
+\NormalTok{puts df}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   year income
+## 1 2010   1000
+## 2 2011   1500
+## 3 2012   2000
+\end{verbatim}
+\subsubsection{Data Frame Indexing}\label{data-frame-indexing}
+A data frame can be indexed the same way as a matrix, by using `{[}row,
+column{]}', where row and column can either be a numeric or the name of
+the row or column
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts (~}\StringTok{:mtcars}\NormalTok{).head}
+\NormalTok{puts (~}\StringTok{:mtcars}\NormalTok{)[}\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{]}
+\NormalTok{puts (~}\StringTok{:mtcars}\NormalTok{)[}\StringTok{'Datsun 710'}\NormalTok{, }\StringTok{'mpg'}\NormalTok{]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##                    mpg cyl disp  hp drat    wt  qsec vs am gear carb
+## Mazda RX4         21.0   6  160 110 3.90 2.620 16.46  0  1    4    4
+## Mazda RX4 Wag     21.0   6  160 110 3.90 2.875 17.02  0  1    4    4
+## Datsun 710        22.8   4  108  93 3.85 2.320 18.61  1  1    4    1
+## Hornet 4 Drive    21.4   6  258 110 3.08 3.215 19.44  1  0    3    1
+## Hornet Sportabout 18.7   8  360 175 3.15 3.440 17.02  0  0    3    2
+## Valiant           18.1   6  225 105 2.76 3.460 20.22  1  0    3    1
+## [1] 6
+## [1] 22.8
+\end{verbatim}
+Extracting a column from a data frame as a vector can be done by using
+the double square bracket operator:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts (~}\StringTok{:mtcars}\NormalTok{)[[}\StringTok{'mpg'}\NormalTok{]]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##  [1] 21.0 21.0 22.8 21.4 18.7 18.1 14.3 24.4 22.8 19.2 17.8 16.4 17.3 15.2
+## [15] 10.4 10.4 14.7 32.4 30.4 33.9 21.5 15.5 15.2 13.3 19.2 27.3 26.0 30.4
+## [29] 15.8 19.7 15.0 21.4
+\end{verbatim}
+A data frame column can also be accessed as if it were an instance
+variable of the data frame:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts (~}\StringTok{:mtcars}\NormalTok{).mpg}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##  [1] 21.0 21.0 22.8 21.4 18.7 18.1 14.3 24.4 22.8 19.2 17.8 16.4 17.3 15.2
+## [15] 10.4 10.4 14.7 32.4 30.4 33.9 21.5 15.5 15.2 13.3 19.2 27.3 26.0 30.4
+## [29] 15.8 19.7 15.0 21.4
+\end{verbatim}
+Slicing a data frame can be done by indexing it with a vector (we use
+`head' to reduce the output):
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts (~}\StringTok{:mtcars}\NormalTok{)[R.c(}\StringTok{'mpg'}\NormalTok{, }\StringTok{'hp'}\NormalTok{)].head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##                    mpg  hp
+## Mazda RX4         21.0 110
+## Mazda RX4 Wag     21.0 110
+## Datsun 710        22.8  93
+## Hornet 4 Drive    21.4 110
+## Hornet Sportabout 18.7 175
+## Valiant           18.1 105
+\end{verbatim}
+A row slice can be obtained by indexing by row and using the `:all'
+keyword for the column:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts (~}\StringTok{:mtcars}\NormalTok{)[R.c(}\StringTok{'Datsun 710'}\NormalTok{, }\StringTok{'Camaro Z28'}\NormalTok{), }\StringTok{:all}\NormalTok{]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##             mpg cyl disp  hp drat   wt  qsec vs am gear carb
+## Datsun 710 22.8   4  108  93 3.85 2.32 18.61  1  1    4    1
+## Camaro Z28 13.3   8  350 245 3.73 3.84 15.41  0  0    3    4
+\end{verbatim}
+Finally, a data frame can also be indexed with a logical vector. In this
+next example, the `am' column of :mtcars is compared with 0 (with method
+`eq'). When `am' is equal to 0 the car is automatic. So, by doing
+`(\textasciitilde{}:mtcars).am.eq 0' a logical vector is created with
+`true' whenever `am' is 0 and `false' otherwise.
+\begin{Shaded}
+\begin{Highlighting}[]
+\CommentTok{# obtain a vector with 'true' for cars with automatic transmission}
+\NormalTok{automatic = (~}\StringTok{:mtcars}\NormalTok{).am.eq }\DecValTok{0}
+\NormalTok{puts automatic}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##  [1] FALSE FALSE FALSE  TRUE  TRUE  TRUE  TRUE  TRUE  TRUE  TRUE  TRUE
+## [12]  TRUE  TRUE  TRUE  TRUE  TRUE  TRUE FALSE FALSE FALSE  TRUE  TRUE
+## [23]  TRUE  TRUE  TRUE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
+\end{verbatim}
+Using this logical vector, the data frame is indexed, returning a new
+data frame in which all cars have automatic transmission.
+\begin{Shaded}
+\begin{Highlighting}[]
+\CommentTok{# slice the data frame by using this vector}
+\NormalTok{puts (~}\StringTok{:mtcars}\NormalTok{)[automatic, }\StringTok{:all}\NormalTok{]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##                      mpg cyl  disp  hp drat    wt  qsec vs am gear carb
+## Hornet 4 Drive      21.4   6 258.0 110 3.08 3.215 19.44  1  0    3    1
+## Hornet Sportabout   18.7   8 360.0 175 3.15 3.440 17.02  0  0    3    2
+## Valiant             18.1   6 225.0 105 2.76 3.460 20.22  1  0    3    1
+## Duster 360          14.3   8 360.0 245 3.21 3.570 15.84  0  0    3    4
+## Merc 240D           24.4   4 146.7  62 3.69 3.190 20.00  1  0    4    2
+## Merc 230            22.8   4 140.8  95 3.92 3.150 22.90  1  0    4    2
+## Merc 280            19.2   6 167.6 123 3.92 3.440 18.30  1  0    4    4
+## Merc 280C           17.8   6 167.6 123 3.92 3.440 18.90  1  0    4    4
+## Merc 450SE          16.4   8 275.8 180 3.07 4.070 17.40  0  0    3    3
+## Merc 450SL          17.3   8 275.8 180 3.07 3.730 17.60  0  0    3    3
+## Merc 450SLC         15.2   8 275.8 180 3.07 3.780 18.00  0  0    3    3
+## Cadillac Fleetwood  10.4   8 472.0 205 2.93 5.250 17.98  0  0    3    4
+## Lincoln Continental 10.4   8 460.0 215 3.00 5.424 17.82  0  0    3    4
+## Chrysler Imperial   14.7   8 440.0 230 3.23 5.345 17.42  0  0    3    4
+## Toyota Corona       21.5   4 120.1  97 3.70 2.465 20.01  1  0    3    1
+## Dodge Challenger    15.5   8 318.0 150 2.76 3.520 16.87  0  0    3    2
+## AMC Javelin         15.2   8 304.0 150 3.15 3.435 17.30  0  0    3    2
+## Camaro Z28          13.3   8 350.0 245 3.73 3.840 15.41  0  0    3    4
+## Pontiac Firebird    19.2   8 400.0 175 3.08 3.845 17.05  0  0    3    2
+\end{verbatim}
+\section{Writing Expressions in
+Galaaz}\label{writing-expressions-in-galaaz}
+Galaaz extends Ruby to work with complex expressions, similar to R's
+expressions built with `quote' (base R) or `quo' (tidyverse). Let's take
+a look at some of those expressions.
+\subsection{Expressions from
+operators}\label{expressions-from-operators}
+The code below creates an expression summing two symbols
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp1 = }\StringTok{:a}\NormalTok{ + }\StringTok{:b}
+\NormalTok{puts exp1}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## a + b
+\end{verbatim}
+We can build any complex mathematical expression
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp2 = (}\StringTok{:a}\NormalTok{ + }\StringTok{:b}\NormalTok{) * }\FloatTok{2.0}\NormalTok{ + }\StringTok{:c}\NormalTok{ ** }\DecValTok{2}\NormalTok{ / }\StringTok{:z}
+\NormalTok{puts exp2}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## (a + b) * 2 + c^2L/z
+\end{verbatim}
+It is also possible to use inequality operators in building expressions
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp3 = (}\StringTok{:a}\NormalTok{ + }\StringTok{:b}\NormalTok{) >= }\StringTok{:z}
+\NormalTok{puts exp3}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## a + b >= z
+\end{verbatim}
+Galaaz provides both symbolic representations for operators, such as
+(\textgreater{}, \textless{}, !=), and functional notation for those
+operators, such as (.gt, .ge, etc.). So the same expression written above
+can also be written as
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp4 = (}\StringTok{:a}\NormalTok{ + }\StringTok{:b}\NormalTok{).ge }\StringTok{:z}
+\NormalTok{puts exp4}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## a + b >= z
+\end{verbatim}
+Two types of expressions can only be created with the functional
+representation of the operators: those are expressions involving `=='
+and `='. In order to write an expression involving `==' we need to use
+the method `.eq' and for `=' we need the function `.assign'
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp5 = (}\StringTok{:a}\NormalTok{ + }\StringTok{:b}\NormalTok{).eq }\StringTok{:z}
+\NormalTok{puts exp5}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## a + b == z
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp6 = }\StringTok{:y}\NormalTok{.assign }\StringTok{:a}\NormalTok{ + }\StringTok{:b}
+\NormalTok{puts exp6}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## y <- a + b
+\end{verbatim}
+In general we think that using the functional notation is preferable to
+using the symbolic notation as otherwise, we end up writing invalid
+expressions such as
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp_wrong = (}\StringTok{:a}\NormalTok{ + }\StringTok{:b}\NormalTok{) == }\StringTok{:z}
+\NormalTok{puts exp_wrong}
+\end{Highlighting}
+\end{Shaded}
+and it might be difficult to understand what is going on here. The
+problem lies with the fact that when using `==' we are comparing
+expression (:a + :b) to expression :z with `=='. When the comparison is
+executed, the system tries to evaluate :a, :b and :z, and those symbols
+at this time are not bound to anything and we get an ``object `a' not
+found'' message. If we only use functional notation, this type of error
+will not occur.
+\subsection{Expressions with R
+methods}\label{expressions-with-r-methods}
+It is often necessary to create an expression that uses a method or
+function. For instance, in mathematics, it's quite natural to write an
+expression such as \(y = sin(x)\). In this case, the `sin' function is
+part of the expression and should not be immediately executed. Now, let's
+say that `x' is an angle of 45\(^\circ\) and we actually want our
+expression to be \(y = 0.850...\). When we want the function to be part
+of the expression, we call the function preceding it by the letter E,
+such as `E.sin(x)'
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp7 = }\StringTok{:y}\NormalTok{.assign E.sin(}\StringTok{:x}\NormalTok{)}
+\NormalTok{puts exp7}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## y <- sin(x)
+\end{verbatim}
+Expressions can also be written using `.' notation:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp8 = }\StringTok{:y}\NormalTok{.assign }\StringTok{:x}\NormalTok{.sin}
+\NormalTok{puts exp8}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## y <- sin(x)
+\end{verbatim}
+When a function has multiple arguments, the first one can be used before
+the `.':
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp9 = }\StringTok{:x}\NormalTok{.c(}\StringTok{:y}\NormalTok{)}
+\NormalTok{puts exp9}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## c(x, y)
+\end{verbatim}
+\subsection{Evaluating an Expression}\label{evaluating-an-expression}
+Expressions can be evaluated by calling function `eval' with a binding.
+A binding can be provided with a list:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{exp = (}\StringTok{:a}\NormalTok{ + }\StringTok{:b}\NormalTok{) * }\FloatTok{2.0}\NormalTok{ + }\StringTok{:c}\NormalTok{ ** }\DecValTok{2}\NormalTok{ / }\StringTok{:z}
+\NormalTok{puts exp.eval(R.list(}\StringTok{a: }\DecValTok{10}\NormalTok{, }\StringTok{b: }\DecValTok{20}\NormalTok{, }\StringTok{c: }\DecValTok{30}\NormalTok{, }\StringTok{z: }\DecValTok{40}\NormalTok{))}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 82.5
+\end{verbatim}
+\ldots{} with a data frame:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{df = R.data__frame(}
+  \StringTok{a: }\NormalTok{R.c(}\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{3}\NormalTok{),}
+  \StringTok{b: }\NormalTok{R.c(}\DecValTok{10}\NormalTok{, }\DecValTok{20}\NormalTok{, }\DecValTok{30}\NormalTok{),}
+  \StringTok{c: }\NormalTok{R.c(}\DecValTok{100}\NormalTok{, }\DecValTok{200}\NormalTok{, }\DecValTok{300}\NormalTok{),}
+  \StringTok{z: }\NormalTok{R.c(}\DecValTok{1000}\NormalTok{, }\DecValTok{2000}\NormalTok{, }\DecValTok{3000}\NormalTok{))}
+\NormalTok{puts exp.eval(df)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1] 32 64 96
+\end{verbatim}
+\section{Manipulating Data}\label{manipulating-data}
+One of the major benefits of Galaaz is to bring strong data manipulation
+to Ruby. The following examples were extracted from Hadley Wickham's ``R for
+Data Science'' (\url{https://r4ds.had.co.nz/}). This is a highly
+recommended book for those not already familiar with the `tidyverse'
+style of programming in R. In the sections to follow, we will limit
+ourselves to converting the R code to Galaaz.
+For these examples, we will investigate the nycflights13 data set
+available on the package by the same name. We use function
+`R.install\_and\_loads' that checks if the library is available locally,
+and if not, installs it. This data frame contains all 336,776 flights
+that departed from New York City in 2013. The data comes from the US
+Bureau of Transportation Statistics.
+Dplyr uses `tibbles' in place of data frames; unfortunately, tibbles do
+not yet print properly in Galaaz due to a bug in fastR. In order to
+print a tibble we need to convert it to a data frame using the
+`as\_\_data\_\_frame' method.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{R.install_and_loads(}\StringTok{'nycflights13'}\NormalTok{)}
+\NormalTok{R.library(}\StringTok{'dplyr'}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{flights = ~}\StringTok{:flights}
+\NormalTok{puts flights.head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 19
+##    year month   day dep_time sched_dep_time dep_delay arr_time
+##   <int> <int> <int>    <int>          <int>     <dbl>    <int>
+## 1  2013     1     1      517            515         2      830
+## 2  2013     1     1      533            529         4      850
+## 3  2013     1     1      542            540         2      923
+## 4  2013     1     1      544            545        -1     1004
+## 5  2013     1     1      554            600        -6      812
+## 6  2013     1     1      554            558        -4      740
+## # ... with 12 more variables: sched_arr_time <int>, arr_delay <dbl>,
+## #   carrier <chr>, flight <int>, tailnum <chr>, origin <chr>, dest <chr>,
+## #   air_time <dbl>, distance <dbl>, hour <dbl>, minute <dbl>,
+## #   time_hour <dttm>
+\end{verbatim}
+\subsection{Filtering rows with
+Filter}\label{filtering-rows-with-filter}
+In this example we filter the flights data set by giving the filter
+function two expressions: the first is `:month.eq 1' and the second is `:day.eq 1'.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.filter((}\StringTok{:month}\NormalTok{.eq }\DecValTok{1}\NormalTok{), (}\StringTok{:day}\NormalTok{.eq }\DecValTok{1}\NormalTok{)).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 19
+##    year month   day dep_time sched_dep_time dep_delay arr_time
+##   <int> <int> <int>    <int>          <int>     <dbl>    <int>
+## 1  2013     1     1      517            515         2      830
+## 2  2013     1     1      533            529         4      850
+## 3  2013     1     1      542            540         2      923
+## 4  2013     1     1      544            545        -1     1004
+## 5  2013     1     1      554            600        -6      812
+## 6  2013     1     1      554            558        -4      740
+## # ... with 12 more variables: sched_arr_time <int>, arr_delay <dbl>,
+## #   carrier <chr>, flight <int>, tailnum <chr>, origin <chr>, dest <chr>,
+## #   air_time <dbl>, distance <dbl>, hour <dbl>, minute <dbl>,
+## #   time_hour <dttm>
+\end{verbatim}
+\subsection{Logical Operators}\label{logical-operators}
+All flights that departed in November or December
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.filter((}\StringTok{:month}\NormalTok{.eq }\DecValTok{11}\NormalTok{) | (}\StringTok{:month}\NormalTok{.eq }\DecValTok{12}\NormalTok{)).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 19
+##    year month   day dep_time sched_dep_time dep_delay arr_time
+##   <int> <int> <int>    <int>          <int>     <dbl>    <int>
+## 1  2013    11     1        5           2359         6      352
+## 2  2013    11     1       35           2250       105      123
+## 3  2013    11     1      455            500        -5      641
+## 4  2013    11     1      539            545        -6      856
+## 5  2013    11     1      542            545        -3      831
+## 6  2013    11     1      549            600       -11      912
+## # ... with 12 more variables: sched_arr_time <int>, arr_delay <dbl>,
+## #   carrier <chr>, flight <int>, tailnum <chr>, origin <chr>, dest <chr>,
+## #   air_time <dbl>, distance <dbl>, hour <dbl>, minute <dbl>,
+## #   time_hour <dttm>
+\end{verbatim}
+The same as above, but using the `in' operator. In R, it is possible to
+define custom infix operators by writing their name between percent signs
+(\%name\%). The \%in\% operator checks if a
+value is in a vector. In order to use those operators from Galaaz the
+`.\_' method is used, where the first argument is the operator's symbol,
+in this case `:in', and the second argument is the vector:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.filter(}\StringTok{:month}\NormalTok{._ }\StringTok{:in}\NormalTok{, R.c(}\DecValTok{11}\NormalTok{, }\DecValTok{12}\NormalTok{)).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 19
+##    year month   day dep_time sched_dep_time dep_delay arr_time
+##   <int> <int> <int>    <int>          <int>     <dbl>    <int>
+## 1  2013    11     1        5           2359         6      352
+## 2  2013    11     1       35           2250       105      123
+## 3  2013    11     1      455            500        -5      641
+## 4  2013    11     1      539            545        -6      856
+## 5  2013    11     1      542            545        -3      831
+## 6  2013    11     1      549            600       -11      912
+## # ... with 12 more variables: sched_arr_time <int>, arr_delay <dbl>,
+## #   carrier <chr>, flight <int>, tailnum <chr>, origin <chr>, dest <chr>,
+## #   air_time <dbl>, distance <dbl>, hour <dbl>, minute <dbl>,
+## #   time_hour <dttm>
+\end{verbatim}
+\subsection{Filtering with NA (Not
+Available)}\label{filtering-with-na-not-available}
+Let's first create a `tibble' with a Not Available value (R::NA).
+Tibbles are a modern version of a data frame and operate very similarly
+to one. They differ in how they output values and in the result of some
+subsetting operations, which are more consistent than what is obtained
+from a data frame.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{df = R.tibble(}\StringTok{x: }\NormalTok{R.c(}\DecValTok{1}\NormalTok{, R::}\DataTypeTok{NA}\NormalTok{, }\DecValTok{3}\NormalTok{))}
+\NormalTok{puts df}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 3 x 1
+##       x
+##   <int>
+## 1     1
+## 2
+## 3     3
+\end{verbatim}
+Now filtering by :x \textgreater{} 1 shows all rows that satisfy this
+condition; the row with R::NA does not.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts df.filter(}\StringTok{:x}\NormalTok{ > }\DecValTok{1}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 1 x 1
+##       x
+##   <int>
+## 1     3
+\end{verbatim}
+To match an NA use method `is\_\_na'
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts df.filter((}\StringTok{:x}\NormalTok{.is__na) | (}\StringTok{:x}\NormalTok{ > }\DecValTok{1}\NormalTok{))}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 2 x 1
+##       x
+##   <int>
+## 1
+## 2     3
+\end{verbatim}
+\subsection{Arrange Rows with arrange}\label{arrange-rows-with-arrange}
+Arrange reorders the rows of a data frame by the given arguments.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.arrange(}\StringTok{:year}\NormalTok{, }\StringTok{:month}\NormalTok{, }\StringTok{:day}\NormalTok{).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 19
+##    year month   day dep_time sched_dep_time dep_delay arr_time
+##   <int> <int> <int>    <int>          <int>     <dbl>    <int>
+## 1  2013     1     1      517            515         2      830
+## 2  2013     1     1      533            529         4      850
+## 3  2013     1     1      542            540         2      923
+## 4  2013     1     1      544            545        -1     1004
+## 5  2013     1     1      554            600        -6      812
+## 6  2013     1     1      554            558        -4      740
+## # ... with 12 more variables: sched_arr_time <int>, arr_delay <dbl>,
+## #   carrier <chr>, flight <int>, tailnum <chr>, origin <chr>, dest <chr>,
+## #   air_time <dbl>, distance <dbl>, hour <dbl>, minute <dbl>,
+## #   time_hour <dttm>
+\end{verbatim}
+To arrange in descending order, use function `desc'
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.arrange(}\StringTok{:dep_delay}\NormalTok{.desc).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 19
+##    year month   day dep_time sched_dep_time dep_delay arr_time
+##   <int> <int> <int>    <int>          <int>     <dbl>    <int>
+## 1  2013     1     9      641            900      1301     1242
+## 2  2013     6    15     1432           1935      1137     1607
+## 3  2013     1    10     1121           1635      1126     1239
+## 4  2013     9    20     1139           1845      1014     1457
+## 5  2013     7    22      845           1600      1005     1044
+## 6  2013     4    10     1100           1900       960     1342
+## # ... with 12 more variables: sched_arr_time <int>, arr_delay <dbl>,
+## #   carrier <chr>, flight <int>, tailnum <chr>, origin <chr>, dest <chr>,
+## #   air_time <dbl>, distance <dbl>, hour <dbl>, minute <dbl>,
+## #   time_hour <dttm>
+\end{verbatim}
+\subsection{Selecting columns}\label{selecting-columns}
+To select specific columns from a dataset we use function `select':
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.select(}\StringTok{:year}\NormalTok{, }\StringTok{:month}\NormalTok{, }\StringTok{:day}\NormalTok{).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 3
+##    year month   day
+##   <int> <int> <int>
+## 1  2013     1     1
+## 2  2013     1     1
+## 3  2013     1     1
+## 4  2013     1     1
+## 5  2013     1     1
+## 6  2013     1     1
+\end{verbatim}
+It is also possible to select columns in a given range
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.select(}\StringTok{:year}\NormalTok{.up_to }\StringTok{:day}\NormalTok{).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 3
+##    year month   day
+##   <int> <int> <int>
+## 1  2013     1     1
+## 2  2013     1     1
+## 3  2013     1     1
+## 4  2013     1     1
+## 5  2013     1     1
+## 6  2013     1     1
+\end{verbatim}
+Select all columns that start with a given name sequence
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.select(E.starts_with(}\StringTok{'arr'}\NormalTok{)).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 2
+##   arr_time arr_delay
+##      <int>     <dbl>
+## 1      830        11
+## 2      850        20
+## 3      923        33
+## 4     1004       -18
+## 5      812       -25
+## 6      740        12
+\end{verbatim}
+Other functions that can be used:
+\begin{itemize}
+\item
+  ends\_with(``xyz''): matches names that end with ``xyz''.
+\item
+  contains(``ijk''): matches names that contain ``ijk''.
+\item
+  matches(``(.)\textbackslash{}1''): selects variables that match a
+  regular expression. This one matches any variables that contain
+  repeated characters.
+\item
+  num\_range(``x'', (1..3)): matches x1, x2 and x3
+\end{itemize}
+A helper function that comes in handy when we just want to rearrange
+column order is `everything':
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.select(}\StringTok{:year}\NormalTok{, }\StringTok{:month}\NormalTok{, }\StringTok{:day}\NormalTok{, E.everything).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 19
+##    year month   day dep_time sched_dep_time dep_delay arr_time
+##   <int> <int> <int>    <int>          <int>     <dbl>    <int>
+## 1  2013     1     1      517            515         2      830
+## 2  2013     1     1      533            529         4      850
+## 3  2013     1     1      542            540         2      923
+## 4  2013     1     1      544            545        -1     1004
+## 5  2013     1     1      554            600        -6      812
+## 6  2013     1     1      554            558        -4      740
+## # ... with 12 more variables: sched_arr_time <int>, arr_delay <dbl>,
+## #   carrier <chr>, flight <int>, tailnum <chr>, origin <chr>, dest <chr>,
+## #   air_time <dbl>, distance <dbl>, hour <dbl>, minute <dbl>,
+## #   time_hour <dttm>
+\end{verbatim}
+\subsection{\texorpdfstring{Add variables to a dataframe with
+`mutate'}{Add variables to a dataframe with mutate}}\label{add-variables-to-a-dataframe-with-mutate}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{flights_sm = flights.}
+\NormalTok{               select((}\StringTok{:year}\NormalTok{.up_to }\StringTok{:day}\NormalTok{),}
+\NormalTok{                      E.ends_with(}\StringTok{'delay'}\NormalTok{),}
+                      \StringTok{:distance}\NormalTok{,}
+                      \StringTok{:air_time}\NormalTok{)}
+\NormalTok{puts flights_sm.head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 7
+##    year month   day dep_delay arr_delay distance air_time
+##   <int> <int> <int>     <dbl>     <dbl>    <dbl>    <dbl>
+## 1  2013     1     1         2        11     1400      227
+## 2  2013     1     1         4        20     1416      227
+## 3  2013     1     1         2        33     1089      160
+## 4  2013     1     1        -1       -18     1576      183
+## 5  2013     1     1        -6       -25      762      116
+## 6  2013     1     1        -4        12      719      150
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{flights_sm = flights_sm.}
+\NormalTok{               mutate(}\StringTok{gain: :dep_delay}\NormalTok{ - }\StringTok{:arr_delay}\NormalTok{,}
+                      \StringTok{speed: :distance}\NormalTok{ / }\StringTok{:air_time}\NormalTok{ * }\DecValTok{60}\NormalTok{)}
+\NormalTok{puts flights_sm.head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 9
+##    year month   day dep_delay arr_delay distance air_time  gain speed
+##   <int> <int> <int>     <dbl>     <dbl>    <dbl>    <dbl> <dbl> <dbl>
+## 1  2013     1     1         2        11     1400      227    -9  370.
+## 2  2013     1     1         4        20     1416      227   -16  374.
+## 3  2013     1     1         2        33     1089      160   -31  408.
+## 4  2013     1     1        -1       -18     1576      183    17  517.
+## 5  2013     1     1        -6       -25      762      116    19  394.
+## 6  2013     1     1        -4        12      719      150   -16  288.
+\end{verbatim}
+\subsection{Summarising data}\label{summarising-data}
+Function `summarise' calculates summaries for the data frame. When no
+`group\_by' is used a single value is obtained from the data frame:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts flights.summarise(}\StringTok{delay: }\NormalTok{E.mean(}\StringTok{:dep_delay}\NormalTok{, }\StringTok{na__rm: }\DecValTok{true}\NormalTok{))}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 1 x 1
+##   delay
+##   <dbl>
+## 1  12.6
+\end{verbatim}
+When a data frame is grouped with `group\_by' summaries apply to the
+given group:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{by_day = flights.group_by(}\StringTok{:year}\NormalTok{, }\StringTok{:month}\NormalTok{, }\StringTok{:day}\NormalTok{)}
+\NormalTok{puts by_day.summarise(}\StringTok{delay: :dep_delay}\NormalTok{.mean(}\StringTok{na__rm: }\DecValTok{true}\NormalTok{)).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 4
+## # Groups:   year, month [1]
+##    year month   day delay
+## * <int> <int> <int> <dbl>
+## 1  2013     1     1 11.5
+## 2  2013     1     2 13.9
+## 3  2013     1     3 11.0
+## 4  2013     1     4  8.95
+## 5  2013     1     5  5.73
+## 6  2013     1     6  7.15
+\end{verbatim}
+Next we put many operations together by piping them one after the
+other:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{delays = flights.}
+\NormalTok{           group_by(}\StringTok{:dest}\NormalTok{).}
+\NormalTok{           summarise(}
+             \StringTok{count: }\NormalTok{E.n,}
+             \StringTok{dist: :distance}\NormalTok{.mean(}\StringTok{na__rm: }\DecValTok{true}\NormalTok{),}
+             \StringTok{delay: :arr_delay}\NormalTok{.mean(}\StringTok{na__rm: }\DecValTok{true}\NormalTok{)).}
+\NormalTok{           filter(}\StringTok{:count}\NormalTok{ > }\DecValTok{20}\NormalTok{, }\StringTok{:dest}\NormalTok{ != }\StringTok{"NHL"}\NormalTok{)}
+\NormalTok{puts delays.head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 4
+##   dest  count  dist delay
+##   <chr> <int> <dbl> <dbl>
+## 1 ABQ     254 1826   4.38
+## 2 ACK     265  199   4.85
+## 3 ALB     439  143  14.4
+## 4 ATL   17215  757. 11.3
+## 5 AUS    2439 1514.  6.02
+## 6 AVL     275  584.  8.00
+\end{verbatim}
+\section{Using Data Table}\label{using-data-table}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{R.library(}\StringTok{'data.table'}\NormalTok{)}
+\NormalTok{R.install_and_loads(}\StringTok{'curl'}\NormalTok{)}
+\NormalTok{input = }\StringTok{"https://raw.githubusercontent.com/Rdatatable/data.table/master/vignettes/flights14.csv"}
+\NormalTok{flights = R.fread(input)}
+\NormalTok{puts flights}
+\NormalTok{puts flights.dim}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##         year month day dep_delay arr_delay carrier origin dest air_time
+##      1: 2014     1   1        14        13      AA    JFK  LAX      359
+##      2: 2014     1   1        -3        13      AA    JFK  LAX      363
+##      3: 2014     1   1         2         9      AA    JFK  LAX      351
+##      4: 2014     1   1        -8       -26      AA    LGA  PBI      157
+##      5: 2014     1   1         2         1      AA    JFK  LAX      350
+##     ---
+## 253312: 2014    10  31         1       -30      UA    LGA  IAH      201
+## 253313: 2014    10  31        -5       -14      UA    EWR  IAH      189
+## 253314: 2014    10  31        -8        16      MQ    LGA  RDU       83
+## 253315: 2014    10  31        -4        15      MQ    LGA  DTW       75
+## 253316: 2014    10  31        -5         1      MQ    LGA  SDF      110
+##         distance hour
+##      1:     2475    9
+##      2:     2475   11
+##      3:     2475   19
+##      4:     1035    7
+##      5:     2475   13
+##     ---
+## 253312:     1416   14
+## 253313:     1400    8
+## 253314:      431   11
+## 253315:      502   11
+## 253316:      659    8
+## [1] 253316     11
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{data_table = R.data__table(}
+  \DataTypeTok{ID}\NormalTok{: R.c(}\StringTok{"b"}\NormalTok{,}\StringTok{"b"}\NormalTok{,}\StringTok{"b"}\NormalTok{,}\StringTok{"a"}\NormalTok{,}\StringTok{"a"}\NormalTok{,}\StringTok{"c"}\NormalTok{),}
+  \StringTok{a: }\NormalTok{(}\DecValTok{1}\NormalTok{..}\DecValTok{6}\NormalTok{),}
+  \StringTok{b: }\NormalTok{(}\DecValTok{7}\NormalTok{..}\DecValTok{12}\NormalTok{),}
+  \StringTok{c: }\NormalTok{(}\DecValTok{13}\NormalTok{..}\DecValTok{18}\NormalTok{)}
+\NormalTok{)}
+\NormalTok{puts data_table}
+\NormalTok{puts data_table.}\DataTypeTok{ID}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##    ID a  b  c
+## 1:  b 1  7 13
+## 2:  b 2  8 14
+## 3:  b 3  9 15
+## 4:  a 4 10 16
+## 5:  a 5 11 17
+## 6:  c 6 12 18
+## [1] "b" "b" "b" "a" "a" "c"
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\CommentTok{# subset rows in i}
+\NormalTok{ans = flights[(}\StringTok{:origin}\NormalTok{.eq }\StringTok{"JFK"}\NormalTok{) & (}\StringTok{:month}\NormalTok{.eq }\DecValTok{6}\NormalTok{)]}
+\NormalTok{puts ans.head}
+\CommentTok{# Get the first two rows from flights.}
+\NormalTok{ans = flights[(}\DecValTok{1}\NormalTok{..}\DecValTok{2}\NormalTok{)]}
+\NormalTok{puts ans}
+\CommentTok{# Sort flights first by column origin in ascending order, and then by dest in descending order:}
+\CommentTok{# ans = flights[E.order(:origin, -(:dest))]}
+\CommentTok{# puts ans.head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##    year month day dep_delay arr_delay carrier origin dest air_time
+## 1: 2014     6   1        -9        -5      AA    JFK  LAX      324
+## 2: 2014     6   1       -10       -13      AA    JFK  LAX      329
+## 3: 2014     6   1        18        -1      AA    JFK  LAX      326
+## 4: 2014     6   1        -6       -16      AA    JFK  LAX      320
+## 5: 2014     6   1        -4       -45      AA    JFK  LAX      326
+## 6: 2014     6   1        -6       -23      AA    JFK  LAX      329
+##    distance hour
+## 1:     2475    8
+## 2:     2475   12
+## 3:     2475    7
+## 4:     2475   10
+## 5:     2475   18
+## 6:     2475   14
+##    year month day dep_delay arr_delay carrier origin dest air_time
+## 1: 2014     1   1        14        13      AA    JFK  LAX      359
+## 2: 2014     1   1        -3        13      AA    JFK  LAX      363
+##    distance hour
+## 1:     2475    9
+## 2:     2475   11
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\CommentTok{# Select column(s) in j}
+\CommentTok{# select arr_delay column, but return it as a vector.}
+\NormalTok{ans = flights[}\StringTok{:all}\NormalTok{, }\StringTok{:arr_delay}\NormalTok{]}
+\NormalTok{puts ans.head}
+\CommentTok{# Select arr_delay column, but return as a data.table instead.}
+\NormalTok{ans = flights[}\StringTok{:all}\NormalTok{, }\StringTok{:arr_delay}\NormalTok{.list]}
+\NormalTok{puts ans.head}
+\NormalTok{ans = flights[}\StringTok{:all}\NormalTok{, E.list(}\StringTok{:arr_delay}\NormalTok{, }\StringTok{:dep_delay}\NormalTok{)]}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## [1]  13  13   9 -26   1   0
+##    arr_delay
+## 1:        13
+## 2:        13
+## 3:         9
+## 4:       -26
+## 5:         1
+## 6:         0
+\end{verbatim}
+\section{Graphics in Galaaz}\label{graphics-in-galaaz}
+Creating graphics in Galaaz is quite easy, as it can use all the power
+of ggplot2. There are many resources on the web that teach ggplot, so
+here we give a quick example of ggplot integration with Ruby. We
+continue to use the :mtcars dataset and we will plot a diverging bar
+plot, showing cars that have `above' or `below' average gas consumption. Let's
+first prepare the data frame with the necessary data:
+\begin{Shaded}
+\begin{Highlighting}[]
+\CommentTok{# copy the R variable :mtcars to the Ruby mtcars variable}
+\NormalTok{mtcars = ~}\StringTok{:mtcars}
+\CommentTok{# create a new column 'car_name' to store the car names so that it can be}
+\CommentTok{# used for plotting. The 'rownames' of the data frame cannot be used as}
+\CommentTok{# data for plotting}
+\NormalTok{mtcars.car_name = R.rownames(}\StringTok{:mtcars}\NormalTok{)}
+\CommentTok{# compute normalized mpg and add it to a new column called mpg_z}
+\CommentTok{# Note that the mean value for mpg can be obtained by calling the 'mean'}
+\CommentTok{# function on the vector 'mtcars.mpg'.  The same with the standard}
+\CommentTok{# deviation 'sd'.  The vector is then rounded to two digits with 'round 2'}
+\NormalTok{mtcars.mpg_z = ((mtcars.mpg - mtcars.mpg.mean)/mtcars.mpg.sd).round }\DecValTok{2}
+\CommentTok{# create a new column 'mpg_type'. Function 'ifelse' is a vectorized function}
+\CommentTok{# that looks at every element of the mpg_z vector and if the value is below}
+\CommentTok{# 0, returns 'below', otherwise returns 'above'}
+\NormalTok{mtcars.mpg_type = (mtcars.mpg_z < }\DecValTok{0}\NormalTok{).ifelse(}\StringTok{"below"}\NormalTok{, }\StringTok{"above"}\NormalTok{)}
+\CommentTok{# order the mtcars data set by the mpg_z vector from smaller to larger values}
+\NormalTok{mtcars = mtcars[mtcars.mpg_z.order, }\StringTok{:all}\NormalTok{]}
+\CommentTok{# convert the car_name column to a factor to retain sorted order in plot}
+\NormalTok{mtcars.car_name = mtcars.car_name.factor }\StringTok{levels: }\NormalTok{mtcars.car_name}
+\CommentTok{# let's look at the final data frame}
+\NormalTok{puts mtcars.head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##                      mpg cyl disp  hp drat    wt  qsec vs am gear carb
+## Cadillac Fleetwood  10.4   8  472 205 2.93 5.250 17.98  0  0    3    4
+## Lincoln Continental 10.4   8  460 215 3.00 5.424 17.82  0  0    3    4
+## Camaro Z28          13.3   8  350 245 3.73 3.840 15.41  0  0    3    4
+## Duster 360          14.3   8  360 245 3.21 3.570 15.84  0  0    3    4
+## Chrysler Imperial   14.7   8  440 230 3.23 5.345 17.42  0  0    3    4
+## Maserati Bora       15.0   8  301 335 3.54 3.570 14.60  0  1    5    8
+##                                car_name mpg_z mpg_type
+## Cadillac Fleetwood   Cadillac Fleetwood -1.61    below
+## Lincoln Continental Lincoln Continental -1.61    below
+## Camaro Z28                   Camaro Z28 -1.13    below
+## Duster 360                   Duster 360 -0.96    below
+## Chrysler Imperial     Chrysler Imperial -0.89    below
+## Maserati Bora             Maserati Bora -0.84    below
+\end{verbatim}
+Now, let's plot the diverging bar plot. When using gKnit, there is no
+need to call `R.awt' to create a plotting device, since gKnit takes
+care of it. Galaaz provides integration with ggplot. The interested
+reader should check online for more information on ggplot, since
+describing how ggplot works is outside the scope of this manual. We give
+here only a brief description of how this plot is generated.
+ggplot implements the `grammar of graphics'. In this approach, plots are
+built by adding layers to the plot. On the first layer we describe what
+we want on the `x' and `y' axis of the plot. In this case, we have
+`car\_name' on the `x' axis and `mpg\_z' on the `y' axis. Then the type
+of graph is specified by adding `geom\_bar' (for a bar graph). We
+specify that our bars should be filled using `mpg\_type', which is
+either `above' or `below', giving two colours for filling. On the
+next layer we specify the labels for the graph, then we add the title
+and subtitle. Finally, in a bar chart the bars usually run in the vertical
+direction, but in this graph we want the bars to be laid out horizontally,
+so we add `coord\_flip'.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{require }\StringTok{'ggplot'}
+\NormalTok{puts mtcars.ggplot(E.aes(}\StringTok{x: :car_name}\NormalTok{, }\StringTok{y: :mpg_z}\NormalTok{, }\StringTok{label: :mpg_z}\NormalTok{)) +}
+\NormalTok{     R.geom_bar(E.aes(}\StringTok{fill: :mpg_type}\NormalTok{), }\StringTok{stat: 'identity'}\NormalTok{, }\StringTok{width: }\FloatTok{0.5}\NormalTok{) +}
+\NormalTok{     R.scale_fill_manual(}\StringTok{name: 'Mileage'}\NormalTok{,}
+                         \StringTok{labels: }\NormalTok{R.c(}\StringTok{'Above Average'}\NormalTok{, }\StringTok{'Below Average'}\NormalTok{),}
+                         \StringTok{values: }\NormalTok{R.c(}\StringTok{'above'}\NormalTok{: }\StringTok{'#00ba38'}\NormalTok{, }\StringTok{'below'}\NormalTok{: }\StringTok{'#f8766d'}\NormalTok{)) +}
+\NormalTok{     R.labs(}\StringTok{subtitle: "Normalised mileage from 'mtcars'"}\NormalTok{,}
+            \StringTok{title: "Diverging Bars"}\NormalTok{) + }
+\NormalTok{     R.coord_flip}
+\end{Highlighting}
+\end{Shaded}
+\includegraphics{manual_files/figure-latex/diverging_bar.pdf}
+\section{Coding with Tidyverse}\label{coding-with-tidyverse}
+In R, and when coding with `tidyverse', arguments to a function are
+usually not \emph{referentially transparent}. That is, you can't replace
+a value with a seemingly equivalent object that you've defined
+elsewhere. To see the problem, let's first define a data frame:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{df = R.data__frame(}\StringTok{x: }\NormalTok{(}\DecValTok{1}\NormalTok{..}\DecValTok{3}\NormalTok{), }\StringTok{y: }\NormalTok{(}\DecValTok{3}\NormalTok{..}\DecValTok{1}\NormalTok{))}
+\NormalTok{puts df}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   x y
+## 1 1 3
+## 2 2 2
+## 3 3 1
+\end{verbatim}
+and now, let's look at this code:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{my_var <-}\StringTok{ }\NormalTok{x}
+\KeywordTok{filter}\NormalTok{(df, my_var }\OperatorTok{==}\StringTok{ }\DecValTok{1}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+It generates the following error: ``object `x' not found''.
+However, in Galaaz, arguments are referentially transparent, as can be
+seen in the code below. Note initially that `my\_var = :x' will not give
+the error ``object `x' not found'' since `:x' is treated as an
+expression and assigned to my\_var. Then when doing (my\_var.eq 1),
+my\_var is a variable that resolves to `:x' and it becomes equivalent to
+(:x.eq 1) which is what we want.
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{my_var = }\StringTok{:x}
+\NormalTok{puts df.filter(my_var.eq }\DecValTok{1}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   x y
+## 1 1 3
+\end{verbatim}
+As stated by Hadley:
+\begin{quote}
+dplyr code is ambiguous. Depending on what variables are defined where,
+filter(df, x == y) could be equivalent to any of:
+\end{quote}
+\begin{verbatim}
+df[df$x == df$y, ]
+df[df$x == y, ]
+df[x == df$y, ]
+df[x == y, ]
+\end{verbatim}
+In Galaaz this ambiguity does not exist: filter(df, x.eq y) is not a
+valid expression, as expressions are built with symbols. In doing
+filter(df, :x.eq y) we are looking for elements of the `x' column that
+are equal to a previously defined y variable. Finally, in filter(df,
+:x.eq :y) we are looking for elements in which the `x' column value is
+equal to the `y' column value. This can be seen in the following two
+chunks of code:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{y = }\DecValTok{1}
+\NormalTok{x = }\DecValTok{2}
+\CommentTok{# looking for values where the 'x' column is equal to the 'y' column}
+\NormalTok{puts df.filter(}\StringTok{:x}\NormalTok{.eq }\StringTok{:y}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   x y
+## 1 2 2
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\CommentTok{# looking for values where the 'x' column is equal to the 'y' variable}
+\CommentTok{# in this case, the number 1}
+\NormalTok{puts df.filter(}\StringTok{:x}\NormalTok{.eq y)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   x y
+## 1 1 3
+\end{verbatim}
+\subsection{Writing a function that applies to different data
+sets}\label{writing-a-function-that-applies-to-different-data-sets}
+Let's suppose that we want to write a function that receives as the
+first argument a data frame and as second argument an expression that
+adds a column to the data frame that is equal to the sum of elements in
+column `a' plus `x'.
+Here is the intended behaviour using the `mutate' function of `dplyr':
+\begin{verbatim}
+mutate(df1, y = a + x)
+mutate(df2, y = a + x)
+mutate(df3, y = a + x)
+mutate(df4, y = a + x)
+\end{verbatim}
+The naive approach to writing an R function to solve this problem is:
+\begin{verbatim}
+mutate_y <- function(df) {
+  mutate(df, y = a + x)
+}
+\end{verbatim}
+Unfortunately, in R, this function can fail silently if one of the
+variables isn't present in the data frame, but is present in the global
+environment. We will not go through here how to solve this problem in R.
+In Galaaz the method mutate\_y below will work fine and will never fail
+silently.
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{def}\NormalTok{ mutate_y(df)}
+\NormalTok{  df.mutate(}\StringTok{:y}\NormalTok{.assign }\StringTok{:a}\NormalTok{ + }\StringTok{:x}\NormalTok{)}
+\KeywordTok{end}
+\end{Highlighting}
+\end{Shaded}
+Here we create a data frame that has only one column named `x':
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{df1 = R.data__frame(}\StringTok{x: }\NormalTok{(}\DecValTok{1}\NormalTok{..}\DecValTok{3}\NormalTok{))}
+\NormalTok{puts df1}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   x
+## 1 1
+## 2 2
+## 3 3
+\end{verbatim}
+Note that method mutate\_y will fail independently of the fact that
+variable `a' is defined and in the scope of the method. Variable `a' has
+no relationship with the symbol `:a' used in the definition of
+`mutate\_y' above:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{a = }\DecValTok{10}
+\NormalTok{mutate_y(df1)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## Message:
+##  Error in mutate_impl(.data, dots) :
+##   Evaluation error: object 'a' not found.
+## In addition: Warning message:
+## In mutate_impl(.data, dots) :
+##   mismatched protect/unprotect (unprotect with empty protect stack) (RError)
+## Translated to internal error
+\end{verbatim}
+\subsection{Different expressions}\label{different-expressions}
+Let's move to the next problem as presented by Hadley, where trying to
+write a function in R that will receive two arguments, the first a
+variable and the second an expression, is not trivial. Below we create a
+data frame and we want to write a function that groups data by a
+variable and summarises it by an expression:
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{set.seed}\NormalTok{(}\DecValTok{123}\NormalTok{)}
+\NormalTok{df <-}\StringTok{ }\KeywordTok{data.frame}\NormalTok{(}
+  \DataTypeTok{g1 =} \KeywordTok{c}\NormalTok{(}\DecValTok{1}\NormalTok{, }\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{2}\NormalTok{),}
+  \DataTypeTok{g2 =} \KeywordTok{c}\NormalTok{(}\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{1}\NormalTok{, }\DecValTok{2}\NormalTok{, }\DecValTok{1}\NormalTok{),}
+  \DataTypeTok{a =} \KeywordTok{sample}\NormalTok{(}\DecValTok{5}\NormalTok{),}
+  \DataTypeTok{b =} \KeywordTok{sample}\NormalTok{(}\DecValTok{5}\NormalTok{)}
+\NormalTok{)}
+\KeywordTok{as.data.frame}\NormalTok{(df) }
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   g1 g2 a b
+## 1  1  1 3 3
+## 2  1  2 2 1
+## 3  2  1 5 2
+## 4  2  2 4 5
+## 5  2  1 1 4
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{d2 <-}\StringTok{ }\NormalTok{df }\OperatorTok{%>%}
+\StringTok{  }\KeywordTok{group_by}\NormalTok{(g1) }\OperatorTok{%>%}
+\StringTok{  }\KeywordTok{summarise}\NormalTok{(}\DataTypeTok{a =} \KeywordTok{mean}\NormalTok{(a))}
+\KeywordTok{as.data.frame}\NormalTok{(d2)          }
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   g1        a
+## 1  1 2.500000
+## 2  2 3.333333
+\end{verbatim}
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{d2 <-}\StringTok{ }\NormalTok{df }\OperatorTok{%>%}
+\StringTok{  }\KeywordTok{group_by}\NormalTok{(g2) }\OperatorTok{%>%}
+\StringTok{  }\KeywordTok{summarise}\NormalTok{(}\DataTypeTok{a =} \KeywordTok{mean}\NormalTok{(a))}
+\KeywordTok{as.data.frame}\NormalTok{(d2)          }
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   g2 a
+## 1  1 3
+## 2  2 3
+\end{verbatim}
+As shown by Hadley, one might expect this function to do the trick:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{my_summarise <-}\StringTok{ }\ControlFlowTok{function}\NormalTok{(df, group_var) \{}
+\NormalTok{  df }\OperatorTok{%>%}
+\StringTok{    }\KeywordTok{group_by}\NormalTok{(group_var) }\OperatorTok{%>%}
+\StringTok{    }\KeywordTok{summarise}\NormalTok{(}\DataTypeTok{a =} \KeywordTok{mean}\NormalTok{(a))}
+\NormalTok{\}}
+\CommentTok{# my_summarise(df, g1)}
+\CommentTok{#> Error: Column `group_var` is unknown}
+\end{Highlighting}
+\end{Shaded}
+In order to solve this problem, coding with dplyr requires the
+introduction of many new concepts and functions such as `quo', `quos',
+`enquo', `enquos', `!!' (bang bang), `!!!' (triple bang). Again, we'll
+leave to Hadley the explanation on how to use all those functions.
+Now, let's try to implement the same function in Galaaz. The next code
+block first prints the `df' data frame defined previously in R (to
+access an R variable from Galaaz, we use the tilde operator
+`\textasciitilde{}' applied to the R variable name as symbol, i.e.,
+`:df').
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts ~}\StringTok{:df}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   g1 g2 a b
+## 1  1  1 3 3
+## 2  1  2 2 1
+## 3  2  1 5 2
+## 4  2  2 4 5
+## 5  2  1 1 4
+\end{verbatim}
+We then create the `my\_summarize' method and call it passing the R data
+frame and the group by variable `:g1':
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{def}\NormalTok{ my_summarize(df, group_var)}
+\NormalTok{  df.group_by(group_var).}
+\NormalTok{    summarize(}\StringTok{a: :a}\NormalTok{.mean)}
+\KeywordTok{end}
+\NormalTok{puts my_summarize(}\StringTok{:df}\NormalTok{, }\StringTok{:g1}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 2 x 2
+##      g1     a
+##   <dbl> <dbl>
+## 1     1  2.5
+## 2     2  3.33
+\end{verbatim}
+It works!!! Well, let's make sure this was not just some coincidence:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts my_summarize(}\StringTok{:df}\NormalTok{, }\StringTok{:g2}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 2 x 2
+##      g2     a
+##   <dbl> <dbl>
+## 1     1     3
+## 2     2     3
+\end{verbatim}
+Great, everything is fine! No magic, no new functions, no complexities,
+just normal, standard Ruby code. If you've ever done NSE in R, this
+certainly feels much safer and easier to implement.
+\subsection{Different input variables}\label{different-input-variables}
+In the previous section we've managed to get rid of all NSE formulation
+for a simple example, but does this remain true for more complex
+examples, or will the Galaaz way prove impractical for more complex
+code?
+In the next example Hadley proposes that we write a function that, given
+an expression such as `a' or `a * b', calculates three summaries. What
+we want is a function that does the same as these R statements:
+\begin{verbatim}
+summarise(df, mean = mean(a), sum = sum(a), n = n())
+#> # A tibble: 1 x 3
+#>    mean   sum     n
+#>   <dbl> <int> <int>
+#> 1     3    15     5
+summarise(df, mean = mean(a * b), sum = sum(a * b), n = n())
+#> # A tibble: 1 x 3
+#>    mean   sum     n
+#>   <dbl> <int> <int>
+#> 1   9    45     5
+\end{verbatim}
+Let's try it in galaaz:
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{def}\NormalTok{ my_summarise2(df, expr)}
+\NormalTok{  df.summarize(}
+    \StringTok{mean: }\NormalTok{E.mean(expr),}
+    \StringTok{sum: }\NormalTok{E.sum(expr),}
+    \StringTok{n: }\NormalTok{E.n}
+\NormalTok{  )}
+\KeywordTok{end}
+\NormalTok{puts my_summarise2((~}\StringTok{:df}\NormalTok{), }\StringTok{:a}\NormalTok{)}
+\NormalTok{puts }\StringTok{"\textbackslash{}n"}
+\NormalTok{puts my_summarise2((~}\StringTok{:df}\NormalTok{), }\StringTok{:a}\NormalTok{ * }\StringTok{:b}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   mean sum n
+## 1    3  15 5
+##
+##   mean sum n
+## 1    9  45 5
+\end{verbatim}
+Once again, there is no need to use any special theory or functions. The
+only point to be careful about is the use of `E' to build expressions
+from functions `mean', `sum' and `n'.
+\subsection{Different input and output
+variable}\label{different-input-and-output-variable}
+Now the next challenge presented by Hadley is to vary the name of the
+output variables based on the received expression. So, if the input
+expression is `a', we want our data frame columns to be named `mean\_a'
+and `sum\_a'. Now, if the input expression is `b', columns should be
+named `mean\_b' and `sum\_b'.
+\begin{verbatim}
+mutate(df, mean_a = mean(a), sum_a = sum(a))
+#> # A tibble: 5 x 6
+#>      g1    g2     a     b mean_a sum_a
+#>   <dbl> <dbl> <int> <int>  <dbl> <int>
+#> 1     1     1     1     3      3    15
+#> 2     1     2     4     2      3    15
+#> 3     2     1     2     1      3    15
+#> 4     2     2     5     4      3    15
+#> # … with 1 more row
+mutate(df, mean_b = mean(b), sum_b = sum(b))
+#> # A tibble: 5 x 6
+#>      g1    g2     a     b mean_b sum_b
+#>   <dbl> <dbl> <int> <int>  <dbl> <int>
+#> 1     1     1     1     3      3    15
+#> 2     1     2     4     2      3    15
+#> 3     2     1     2     1      3    15
+#> 4     2     2     5     4      3    15
+#> # … with 1 more row
+\end{verbatim}
+In order to solve this problem in R, Hadley needs to introduce some
+more new functions and notations: `quo\_name' and the `:=' operator from
+package `rlang'.
+Here is our Ruby code:
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{def}\NormalTok{ my_mutate(df, expr)}
+\NormalTok{  mean_name = }\StringTok{"mean_}\OtherTok{#\{}\NormalTok{expr.to_s}\OtherTok{\}}\StringTok{"}
+\NormalTok{  sum_name = }\StringTok{"sum_}\OtherTok{#\{}\NormalTok{expr.to_s}\OtherTok{\}}\StringTok{"}
+\NormalTok{  df.mutate(mean_name => E.mean(expr),}
+\NormalTok{            sum_name => E.sum(expr))}
+\KeywordTok{end}
+\NormalTok{puts my_mutate((~}\StringTok{:df}\NormalTok{), }\StringTok{:a}\NormalTok{)}
+\NormalTok{puts }\StringTok{"\textbackslash{}n"}
+\NormalTok{puts my_mutate((~}\StringTok{:df}\NormalTok{), }\StringTok{:b}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##   g1 g2 a b mean_a sum_a
+## 1  1  1 3 3      3    15
+## 2  1  2 2 1      3    15
+## 3  2  1 5 2      3    15
+## 4  2  2 4 5      3    15
+## 5  2  1 1 4      3    15
+##
+##   g1 g2 a b mean_b sum_b
+## 1  1  1 3 3      3    15
+## 2  1  2 2 1      3    15
+## 3  2  1 5 2      3    15
+## 4  2  2 4 5      3    15
+## 5  2  1 1 4      3    15
+\end{verbatim}
+It really seems that ``Non Standard Evaluation'' is actually quite
+standard in Galaaz! But, you might have noticed a small change in the
+way the arguments to the mutate method were called. In a previous
+example we used df.summarise(mean: E.mean(:a), \ldots{}) where the
+column name was followed by a colon (`:'). In this example, we have
+df.mutate(mean\_name =\textgreater{} E.mean(expr), \ldots{}) and
+variable mean\_name is not followed by `:' but by `=\textgreater{}'.
+This is standard Ruby notation.
+{[}explain\ldots{}.{]}
+\subsection{Capturing multiple
+variables}\label{capturing-multiple-variables}
+Moving on with new complexities, Hadley proposes that we solve the
+problem in which the summarise function will receive any number of
+grouping variables.
+This again is quite standard Ruby. In order to receive an undefined
+number of parameters, the parameter is preceded by `*':
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{def}\NormalTok{ my_summarise3(df, *group_vars)}
+\NormalTok{  df.group_by(*group_vars).}
+\NormalTok{    summarise(}\StringTok{a: }\NormalTok{E.mean(}\StringTok{:a}\NormalTok{))}
+\KeywordTok{end}
+\NormalTok{puts my_summarise3((~}\StringTok{:df}\NormalTok{), }\StringTok{:g1}\NormalTok{, }\StringTok{:g2}\NormalTok{)}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 4 x 3
+## # Groups:   g1 [?]
+##      g1    g2     a
+##   <dbl> <dbl> <dbl>
+## 1     1     1     3
+## 2     1     2     2
+## 3     2     1     3
+## 4     2     2     4
+\end{verbatim}
+\subsection{Why does R require NSE and Galaaz does
+not?}\label{why-does-r-require-nse-and-galaaz-does-not}
+NSE introduces a number of new concepts, such as `quoting',
+`quasiquotation', `unquoting' and `unquote-splicing', while in Galaaz
+none of those concepts are needed. What gives?
+R is an extremely flexible language and it has lazy evaluation of
+parameters. When in R a function is called as `summarise(df, a = b)',
+the summarise function receives the literal `a = b' parameter and can
+work with this as if it were a string. In R, it is not clear what a and
+b are: they can be expressions or they can be variables; it is up to the
+function to decide what `a = b' means.
+In Ruby, there is no lazy evaluation of parameters and `a' is always a
+variable and so is `b'. Variables assume their value as soon as they are
+used, so `x = a' is immediately evaluated and variable `x' will receive
+the value of variable `a' as soon as the Ruby statement is executed.
+Ruby also provides the notion of a symbol; `:a' is a symbol and does not
+evaluate to anything. Galaaz uses Ruby symbols to build expressions that
+are not bound to anything: `:a.eq :b' is clearly an expression and has
+no relationship whatsoever with the statement `a = b'. By using symbols,
+variables and expressions, all the possible ambiguities that are found in
+R are eliminated in Galaaz.
+The main problem that remains is that, in R, functions are not clearly
+documented as to what type of input they are expecting: they might be
+expecting regular variables or they might be expecting expressions, and
+the R function will know how to deal with an input of the form `a = b'.
+For the Ruby developer, however, it might not be immediately clear if it
+should call the function passing the value `true' if variable `a' is
+equal to variable `b' or if it should call the function passing the
+expression `:a.eq :b'.
+\subsection{Advanced dplyr features}\label{advanced-dplyr-features}
+In the blog: Programming with dplyr by using dplyr
+(\url{https://www.r-bloggers.com/programming-with-dplyr-by-using-dplyr/})
+Iñaki Úcar shows surprise that some R users are trying to code in dplyr
+avoiding the use of NSE. For instance he says:
+\begin{quote}
+Take the example of seplyr. It stands for standard evaluation dplyr, and
+enables us to program over dplyr without having ``to bring in (or study)
+any deep-theory or heavy-weight tools such as rlang/tidyeval''.
+\end{quote}
+For me, there isn't really any surprise that users are trying to avoid
+dplyr deep-theory. R users frequently are not programmers and learning
+to code is already hard business; on top of that, having to learn how to
+`quote' or `enquo' or `quos' or `enquos' is not necessarily a `piece of
+cake'. So much so, that `tidyeval' has some more advanced functions that,
+instead of using quoted expressions, use strings as arguments.
+In the following examples, we show the use of functions `group\_by\_at',
+`summarise\_at' and `rename\_at' that receive strings as arguments. The
+data frame used is `starwars', which describes features of characters in
+the Star Wars movies:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{puts (~}\StringTok{:starwars}\NormalTok{).head}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 6 x 13
+##   name  height  mass hair_color skin_color eye_color birth_year gender
+##   <chr>  <int> <dbl> <chr>      <chr>      <chr>          <dbl> <chr>
+## 1 Luke~    172    77 blond      fair       blue            19   male
+## 2 C-3PO    167    75 <NA>       gold       yellow         112   <NA>
+## 3 R2-D2     96    32 <NA>       white, bl~ red             33   <NA>
+## 4 Dart~    202   136 none       white      yellow          41.9 male
+## 5 Leia~    150    49 brown      light      brown           19   female
+## 6 Owen~    178   120 brown, gr~ light      blue            52   male
+## # ... with 5 more variables: homeworld <chr>, species <chr>, films <list>,
+## #   vehicles <list>, starships <list>
+\end{verbatim}
+The grouped\_mean function below will receive a grouping variable and
+calculate summaries for the value\_variables given:
+\begin{Shaded}
+\begin{Highlighting}[]
+\NormalTok{grouped_mean <-}\StringTok{ }\ControlFlowTok{function}\NormalTok{(data, grouping_variables, value_variables) \{}
+\NormalTok{  data }\OperatorTok{%>%}
+\StringTok{    }\KeywordTok{group_by_at}\NormalTok{(grouping_variables) }\OperatorTok{%>%}
+\StringTok{    }\KeywordTok{mutate}\NormalTok{(}\DataTypeTok{count =} \KeywordTok{n}\NormalTok{()) }\OperatorTok{%>%}
+\StringTok{    }\KeywordTok{summarise_at}\NormalTok{(}\KeywordTok{c}\NormalTok{(value_variables, }\StringTok{"count"}\NormalTok{), mean, }\DataTypeTok{na.rm =} \OtherTok{TRUE}\NormalTok{) }\OperatorTok{%>%}
+\StringTok{    }\KeywordTok{rename_at}\NormalTok{(value_variables, }\KeywordTok{funs}\NormalTok{(}\KeywordTok{paste0}\NormalTok{(}\StringTok{"mean_"}\NormalTok{, .)))}
+\NormalTok{    \}}
+\NormalTok{gm =}\StringTok{ }\NormalTok{starwars }\OperatorTok{%>%}\StringTok{ }
+\StringTok{   }\KeywordTok{grouped_mean}\NormalTok{(}\StringTok{"eye_color"}\NormalTok{, }\KeywordTok{c}\NormalTok{(}\StringTok{"mass"}\NormalTok{, }\StringTok{"birth_year"}\NormalTok{))}
+\KeywordTok{as.data.frame}\NormalTok{(gm)   }
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+##        eye_color mean_mass mean_birth_year count
+## 1          black  76.28571        33.00000    10
+## 2           blue  86.51667        67.06923    19
+## 3      blue-gray  77.00000        57.00000     1
+## 4          brown  66.09231       108.96429    21
+## 5           dark       NaN             NaN     1
+## 6           gold       NaN             NaN     1
+## 7  green, yellow 159.00000             NaN     1
+## 8          hazel  66.00000        34.50000     3
+## 9         orange 282.33333       231.00000     8
+## 10          pink       NaN             NaN     1
+## 11           red  81.40000        33.66667     5
+## 12     red, blue       NaN             NaN     1
+## 13       unknown  31.50000             NaN     3
+## 14         white  48.00000             NaN     1
+## 15        yellow  81.11111        76.38000    11
+\end{verbatim}
+The same code with Galaaz becomes:
+\begin{Shaded}
+\begin{Highlighting}[]
+\KeywordTok{def}\NormalTok{ grouped_mean(data, grouping_variables, value_variables)}
+\NormalTok{  data.}
+\NormalTok{    group_by_at(grouping_variables).}
+\NormalTok{    mutate(}\StringTok{count: }\NormalTok{E.n).}
+\NormalTok{    summarise_at(E.c(value_variables, }\StringTok{"count"}\NormalTok{), ~}\StringTok{:mean}\NormalTok{, }\StringTok{na__rm: }\DecValTok{true}\NormalTok{).}
+\NormalTok{    rename_at(value_variables, E.funs(E.paste0(}\StringTok{"mean_"}\NormalTok{, value_variables)))}
+\KeywordTok{end}
+\NormalTok{puts grouped_mean((~}\StringTok{:starwars}\NormalTok{), }\StringTok{"eye_color"}\NormalTok{, E.c(}\StringTok{"mass"}\NormalTok{, }\StringTok{"birth_year"}\NormalTok{))}
+\end{Highlighting}
+\end{Shaded}
+\begin{verbatim}
+## # A tibble: 15 x 4
+##    eye_color     mean_mass mean_birth_year count
+##    <chr>             <dbl>           <dbl> <dbl>
+##  1 black              76.3            33      10
+##  2 blue               86.5            67.1    19
+##  3 blue-gray          77              57       1
+##  4 brown              66.1           109.     21
+##  5 dark              NaN             NaN       1
+##  6 gold              NaN             NaN       1
+##  7 green, yellow     159             NaN       1
+##  8 hazel              66              34.5     3
+##  9 orange            282.            231       8
+## 10 pink              NaN             NaN       1
+## 11 red                81.4            33.7     5
+## 12 red, blue         NaN             NaN       1
+## 13 unknown            31.5           NaN       3
+## 14 white              48             NaN       1
+## 15 yellow             81.1            76.4    11
+\end{verbatim}
+{[}TO BE CONTINUED\ldots{}{]}
+\section{Contributing}\label{contributing}
+\begin{itemize}
+\tightlist
+\item
+  Fork it
+\item
+  Create your feature branch (git checkout -b my-new-feature)
+\item
+  Write Tests!
+\item
+  Commit your changes (git commit -am `Add some feature')
+\item
+  Push to the branch (git push origin my-new-feature)
+\item
+  Create new Pull Request
+\end{itemize}
+\section*{References}\label{references}
+\addcontentsline{toc}{section}{References}
+\hypertarget{refs}{}
+\hypertarget{ref-Knuth:literate_programming}{}
+Knuth, Donald E. 1984. ``Literate Programming.'' \emph{Comput. J.} 27
+(2). Oxford, UK: Oxford University Press: 97--111.
+doi:\href{https://doi.org/10.1093/comjnl/27.2.97}{10.1093/comjnl/27.2.97}.
+\hypertarget{ref-Wilkinson:grammar_of_graphics}{}
+Wilkinson, Leland. 2005. \emph{The Grammar of Graphics (Statistics and
+Computing)}. Berlin, Heidelberg: Springer-Verlag.
+\end{document}