alexeid
diff --git a/‎R/ascent-plotting.R
+1-1 b/‎R/ascent-plotting.R
+1-1
diff --git a/‎R/bayesian-climbing-analysis.Rmd
+16-6 b/‎R/bayesian-climbing-analysis.Rmd
+16-6
diff --git a/‎R/produce-analysis-data.R
+1-1 b/‎R/produce-analysis-data.R
+1-1
diff --git a/‎bibliography/1-s2.0-S1364661315000509.pdf
828 KB b/‎bibliography/1-s2.0-S1364661315000509.pdf
828 KB
diff --git a/‎bibliography/2001.05388.pdf
477 KB b/‎bibliography/2001.05388.pdf
477 KB
diff --git a/‎bibliography/2021.03.15.435555v4.full.pdf
275 KB b/‎bibliography/2021.03.15.435555v4.full.pdf
275 KB
diff --git a/‎bibliography/3292500.3330831.pdf
775 KB b/‎bibliography/3292500.3330831.pdf
775 KB
diff --git a/‎bibliography/Draper_2016_Comparative_grading scales_accepted_manuscript.pdf
565 KB b/‎bibliography/Draper_2016_Comparative_grading scales_accepted_manuscript.pdf
565 KB
diff --git a/‎bibliography/InternationalJournalofSportPsychology-1993.pdf
306 KB b/‎bibliography/InternationalJournalofSportPsychology-1993.pdf
306 KB
diff --git a/‎bibliography/PhysicalDeterminants.pdf
1.42 MB b/‎bibliography/PhysicalDeterminants.pdf
1.42 MB
diff --git a/‎bibliography/WHR.pdf
324 KB b/‎bibliography/WHR.pdf
324 KB
diff --git a/‎manuscript/ClimbingGrades.tex
+6-2 b/‎manuscript/ClimbingGrades.tex
+6-2
diff --git a/‎manuscript/SupplementaryInformation-ClimbingGrades.tex
+22 b/‎manuscript/SupplementaryInformation-ClimbingGrades.tex
+22
diff --git a/‎results/aus/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-posterior.png
241 KB b/‎results/aus/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-posterior.png
241 KB
diff --git a/‎results/aus/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-processing-table.tex
+29 b/‎results/aus/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-processing-table.tex
+29
diff --git a/‎results/aus/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-regression.png
302 KB b/‎results/aus/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-regression.png
302 KB
diff --git a/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-posterior.png
99.2 KB b/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-posterior.png
99.2 KB
diff --git a/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-processing-table.tex
+29 b/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-processing-table.tex
+29
diff --git a/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-regression.png
131 KB b/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-regression.png
131 KB
diff --git a/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-session-posterior.png
-18 Bytes b/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-session-posterior.png
-18 Bytes
diff --git a/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-session-processing-table.tex
+1-1 b/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-session-processing-table.tex
+1-1
diff --git a/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-session-regression.png
214 Bytes b/‎results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-session-regression.png
214 Bytes
@@ -31,7 +31,7 @@ ascent.summary <- function(lb.routes, gradeColName="grade", successColName="succ
 ##########################################################################################
 plot.all.attempts <- function(lb) {
 
-  climbers <- unique(lb$account.id)
+  climbers <- sort(unique(lb$account.id))
 
   legend = c();
 
 
@@ -9,7 +9,7 @@ params:
   startDate: "2016-08-01"
   endDate: "2021-08-01"
   filter.by.tickprop.lrp: FALSE
-  per.session: TRUE
+  per.session: FALSE
   min.ascents: 400
   min.failures: 1
   in.path: "~/Git/climbing-grades/data/processed/"
@@ -194,16 +194,26 @@ mean.grade <- unlist(mean.grade)
 
 hist(mean.grade)
 
+hist(data$m)
+
+
 ```
 
-```{r}
-summary  <- table(data$df$account.id, data$df$ascent_factor)
-quantile(summary[,"dog"]+summary[,"attempt"]+summary[,"working"], c(0, 0.025, 0.05, 0.1, 0.5, 0.9, 0.95, 0.975, 1))
 
-quantile((summary[,"dog"]+summary[,"attempt"]+summary[,"working"])/rowSums(summary), c(0, 0.025, 0.05, 0.5, 0.95, 0.975,1))
+```{r}
+summary  <- table(data$df$account.id, data$df$ascent.type)
 
 summary(summary[,"dog"]+summary[,"attempt"]+summary[,"working"]+summary[,"retreat"])
 
-summary((summary[,"dog"]+summary[,"attempt"]+summary[,"working"]+summary[,"retreat"])/rowSums(summary))
+fail.fraction <- (summary[,"dog"]+summary[,"attempt"]+summary[,"working"]+summary[,"retreat"])/rowSums(summary)
+
+summary(fail.fraction)
+
+```
+
+```{r}
+
+
 
+plot(data$m, fail.fraction)
 ```
@@ -55,7 +55,7 @@ produce.analysis.data <- function(params, res, routes) {
   df.top <- res3$df
   df.top$ascent.type <- as.character(df.top$ascent.type)
 
-  climbers <- unique(df.top$account.id);
+  climbers <- sort(unique(df.top$account.id));
   df.final = df.top
   final.filter.results = res3$filter.results
 
 
@@ -295,11 +295,15 @@ \section*{Discussion and Conclusion}
 
 The most questionable detail of the model presented is the idea that the probability of a successful ascent remains the same after each previous attempt of the route, i.e. practising a particular route does not improve the climber's chance of success. This is clearly a bad assumption, so at best the probability of success implied by the Bradley-Terry model should be considered as some sort of ``effective'' probability, averaged over different levels of practice. The real underlying probability is probably increasing with practice. The problems with developing a model that admits learning are at least two-fold: (i) we expect some routes are more amenable to practice than others, and (ii) it is unclear what functional form the expected improvement in probability per attempt should take.
 
-Suffice to say, there is still much work to do. Besides considerations above, foremost in our mind is the need to adapt recently developed whole-history inference methods to account for ascertainment biases in public repository data in a much more rigorous way than pursued here. This will require a better understanding of the differing ways that climbers approach self-reporting of climbing ascents. It seems likely that climber that logs their own ascent and attempts are likely to be susceptible to various biases and to follow differing conventions, depending on their purpose for making a public log book of their ascents. Data-driven approaches to learning about these differing conventions and biases in order to classifying climbers by their logging approach is an obvious next step.
+Selective logging of failures is a major concern. It is clear that most climbers don't log all failures. It seems likely that failures on easy routes would be more embarrassing than failures on harder routes. So if this motivation is in action, then harder routes will appear relatively harder than easy routes, since the failures are underreported for easier routes. This would lead to an overestimation of the slope of the grade scale.
+
+Selection bias is another concern. This is the propensity of climbers to choose routes that are at the easier end of the grade, or at least routes that suit their climbing style (rather than choosing a random climb at the grade). There are two reasons why we think that selection bias shouldn't have a large impact on the estimate of the climbing grade slope parameter. Firstly, climbers are probably less selective at low to middle grades, and the slope is derived from the full range of grades that a climber attempts. Secondly, if a climber is selective at all grades, such a bias doesn't change the slope, but instead changes the intercept, because in each grade the result will be to select from the lower end of the grade, which will still result in the same slope. The main result of such selection bias will be an overestimate of the grade of the climber by up to 1 grade. So selection bias will overestimate a climber's ability a bit, but it won't have a big effect on the fundamental grade scale parameter estimate. The worst case scenario will be if all climbers only climb relatively hard routes from the choices in their lowest grade and relatively easy routes from the choices in their hardest grade. This would mean the true range in the x-axis of the regression is actually up to a grade less than what is used to compute the slope. So the estimated slope will be flatter than the true slope. This extreme scenario would flatten the slope by a factor of about $(k-1)/k$, where $k$ is the difference between the highest grade and the lowest grade. In our data set the interquartile range for $k$ is 8-10. So the worst case scenario if everybody is maximally biased in this way is an underestimate of the slope of about 10\%.  
+
+Suffice to say, there is still much work to do. Foremost in our mind is the need to adapt recently developed whole-history inference methods to account for biases in public repository data in a much more rigorous way than pursued here. This will require a better understanding of the differing ways that climbers approach self-reporting of climbing ascents. It seems likely that climbers who log their own ascents and attempts are susceptible to various biases and follow differing conventions, depending on their purpose for making a public log book of their ascents. Data-driven approaches to learning about these differing conventions and biases in order to classify climbers by their logging approach are an obvious next step.
 
 \section*{Acknowledgement}
 
-The authors would like to thank Simon Dale and Ulf Fuchslueger from \url{thecrag.com}, for providing access to the theCrag API (\url{https://www.thecrag.com/en/article/api}) so that the public ascent data could be downloaded programmatically for the analyses produced in this work. In addition we thank Dr Joseph Heled, Daniel Krippner, Dr Michael Matschiner, and Dr Tim Vaughan for helpful discussions on earlier versions of this manuscript.
+The authors would like to thank Simon Dale and Ulf Fuchslueger from \url{thecrag.com}, for providing access to the theCrag API (\url{https://www.thecrag.com/en/article/api}) so that the public ascent data could be downloaded programmatically for the analyses produced in this work. In addition we thank Simon Dale, Dr Joseph Heled, Daniel Krippner, Dr Michael Matschiner, and Dr Tim Vaughan for helpful discussions on earlier versions of this manuscript.
 
 \printglossaries
 
 
@@ -115,6 +115,28 @@ \section{Assessing the suitability of the logistic model for climbing grade scal
 \label{fig2}
 \end{figure}
 
+\section{Estimates of flash grade and grade scale slope assuming whole-history data available}
+
+Figure \ref{aus_ascents_by_attempt} shows the estimated ``flash grade'' through time plot between August 2016 and July 2021 inclusive for 105 climbers that fulfilled our selection criteria and who climbed predominantly in Australia. The second panel reports the posterior distribution of $e^m$, which was jointly estimated. The posterior estimate was 2.14 (95\% HPD:  $[2.11, 2.17]$).
+
+\begin{figure}
+\centering
+\includegraphics[width=\textwidth]{../results/aus/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-posterior.png}
+\caption{\small The posterior estimate of each Australian climber's grade ($n=105$) through time and the posterior distribution of the proportional increase in difficulty per grade increment $d = e^m$.}
+\label{aus_ascents_by_attempt}
+\end{figure}
+
+Figure \ref{nz_ascents_by_attempt} shows the estimated ``flash grade'' through time plot between August 2016 and July 2021 inclusive for 5 climbers that fulfilled our selection criteria and who climbed predominantly in New Zealand. The second panel reports the posterior distribution of the $m$ parameter which was jointly estimated.
+
+
+\begin{figure}
+\centering
+\includegraphics[width=\textwidth]{../results/nz/ascents-from-2016-08-01-to-2021-08-01-minAscents400-minFails1-posterior.png}
+\caption{\small The posterior estimate of each New Zealand climber's grade through time and the posterior distribution of the proportional increase in difficulty per grade increment $d = e^m$. Because there were only 5 climbers in this analysis we were able to depict the 95\% credible interval around the grade estimate through time as well.}
+\label{nz_ascents_by_attempt}
+\end{figure}
+
+
 
 \section{Interpreting whole-community ascent success data}
 
 
@@ -0,0 +1,29 @@
+% latex table generated in R 3.6.2 by xtable 1.8-4 package
+% Mon Sep  6 19:22:48 2021
+\begin{table}[ht]
+\centering
+\begingroup\fontsize{9pt}{10pt}\selectfont
+\begin{tabular}{rrl}
+  \hline
+{\bf rows.in} & {\bf rows.out} & {\bf filter} \\ 
+  \hline
+1627548 & 1465494 & Exclude ascents with no date or no grade information. \\ 
+  1465494 & 1429967 & Exclude artificial ascents \\ 
+  1429967 & 1310458 & Exclude gear styles: Boulder, Alpine, DWS, Traverse, Aid, Ice, Via ferrata \\ 
+  1310458 & 1309854 & Exclude trad ascent types: greenpoint, greenpointonsight \\ 
+  1309854 & 1275445 & Exclude boulder ascent types: send, dab, repeat \\ 
+  1275445 & 1272836 & Exclude non-ascent types: hit, target, mark \\ 
+  1272836 & 691090 & Keep only Ewbank grades \\ 
+  691090 & 691079 & Remove grades with value '--' \\ 
+  691079 & 403210 & Remove ascents before 2016-08-01 \\ 
+  403210 & 397991 & Remove ascents on or after 2021-08-01 \\ 
+  397991 & 373234 & Remove ascents with no month information. \\ 
+  373234 & 293566 & Remove ascents with grade less than 16 \\ 
+  293566 & 230274 & Exclude ambiguous ascent types: tick, lead, leadsolo, second, toprope, aidsolo, ropedsolo \\ 
+  230274 & 67986 & Keep climbers with at least 400 ascents, and at least 1 failed ascents. \\ 
+   \hline
+\end{tabular}
+\endgroup
+\caption{Summary of data processing for analysis of Australia ascent data.} 
+\label{table-data-processing-aus}
+\end{table}
@@ -0,0 +1,29 @@
+% latex table generated in R 3.6.2 by xtable 1.8-4 package
+% Mon Sep  6 19:02:03 2021
+\begin{table}[ht]
+\centering
+\begingroup\fontsize{9pt}{10pt}\selectfont
+\begin{tabular}{rrl}
+  \hline
+{\bf rows.in} & {\bf rows.out} & {\bf filter} \\ 
+  \hline
+41546 & 38147 & Exclude ascents with no date or no grade information. \\ 
+  38147 & 37928 & Exclude artificial ascents \\ 
+  37928 & 37928 & Exclude gear styles:  \\ 
+  37928 & 37871 & Exclude trad ascent types: greenpoint, greenpointonsight \\ 
+  37871 & 36197 & Exclude boulder ascent types: send, dab, repeat \\ 
+  36197 & 36160 & Exclude non-ascent types: hit, target, mark \\ 
+  36160 & 33167 & Keep only Ewbank grades \\ 
+  33167 & 33167 & Remove grades with value '--' \\ 
+  33167 & 26462 & Remove ascents before 2016-08-01 \\ 
+  26462 & 26343 & Remove ascents on or after 2021-08-01 \\ 
+  26343 & 25208 & Remove ascents with no month information. \\ 
+  25208 & 21488 & Remove ascents with grade less than 16 \\ 
+  21488 & 15626 & Exclude ambiguous ascent types: tick, lead, leadsolo, second, toprope, aidsolo, ropedsolo \\ 
+  15626 & 2707 & Keep climbers with at least 400 ascents, and at least 1 failed ascents. \\ 
+   \hline
+\end{tabular}
+\endgroup
+\caption{Summary of data processing for analysis of New Zealand ascent data.} 
+\label{table-data-processing-nz}
+\end{table}
@@ -1,5 +1,5 @@
 % latex table generated in R 3.6.2 by xtable 1.8-4 package
-% Mon Sep  6 12:00:45 2021
+% Mon Sep  6 19:17:05 2021
 \begin{table}[ht]
 \centering
 \begingroup\fontsize{9pt}{10pt}\selectfont