manuscript.tex

% Options for packages loaded elsewhere
\PassOptionsToPackage{unicode}{hyperref}
\PassOptionsToPackage{hyphens}{url}
\PassOptionsToPackage{dvipsnames,svgnames,x11names}{xcolor}
%
\documentclass[
  man,floatsintext]{apa6}
\usepackage{amsmath,amssymb}
\usepackage{iftex}
\ifPDFTeX
  \usepackage[T1]{fontenc}
  \usepackage[utf8]{inputenc}
  \usepackage{textcomp} % provide euro and other symbols
\else % if luatex or xetex
  \usepackage{unicode-math} % this also loads fontspec
  \defaultfontfeatures{Scale=MatchLowercase}
  \defaultfontfeatures[\rmfamily]{Ligatures=TeX,Scale=1}
\fi
\usepackage{lmodern}
\ifPDFTeX\else
  % xetex/luatex font selection
\fi
% Use upquote if available, for straight quotes in verbatim environments
\IfFileExists{upquote.sty}{\usepackage{upquote}}{}
\IfFileExists{microtype.sty}{% use microtype if available
  \usepackage[]{microtype}
  \UseMicrotypeSet[protrusion]{basicmath} % disable protrusion for tt fonts
}{}
\makeatletter
\@ifundefined{KOMAClassName}{% if non-KOMA class
  \IfFileExists{parskip.sty}{%
    \usepackage{parskip}
  }{% else
    \setlength{\parindent}{0pt}
    \setlength{\parskip}{6pt plus 2pt minus 1pt}}
}{% if KOMA class
  \KOMAoptions{parskip=half}}
\makeatother
\usepackage{xcolor}
\usepackage{graphicx}
\makeatletter
\def\maxwidth{\ifdim\Gin@nat@width>\linewidth\linewidth\else\Gin@nat@width\fi}
\def\maxheight{\ifdim\Gin@nat@height>\textheight\textheight\else\Gin@nat@height\fi}
\makeatother
% Scale images if necessary, so that they will not overflow the page
% margins by default, and it is still possible to overwrite the defaults
% using explicit options in \includegraphics[width, height, ...]{}
\setkeys{Gin}{width=\maxwidth,height=\maxheight,keepaspectratio}
% Set default figure placement to htbp
\makeatletter
\def\fps@figure{htbp}
\makeatother
\setlength{\emergencystretch}{3em} % prevent overfull lines
\providecommand{\tightlist}{%
  \setlength{\itemsep}{0pt}\setlength{\parskip}{0pt}}
\setcounter{secnumdepth}{-\maxdimen} % remove section numbering
% Make \paragraph and \subparagraph free-standing
\ifx\paragraph\undefined\else
  \let\oldparagraph\paragraph
  \renewcommand{\paragraph}[1]{\oldparagraph{#1}\mbox{}}
\fi
\ifx\subparagraph\undefined\else
  \let\oldsubparagraph\subparagraph
  \renewcommand{\subparagraph}[1]{\oldsubparagraph{#1}\mbox{}}
\fi
\newlength{\cslhangindent}
\setlength{\cslhangindent}{1.5em}
\newlength{\csllabelwidth}
\setlength{\csllabelwidth}{3em}
\newlength{\cslentryspacingunit} % times entry-spacing
\setlength{\cslentryspacingunit}{\parskip}
\newenvironment{CSLReferences}[2] % #1 hanging-ident, #2 entry spacing
 {% don't indent paragraphs
  \setlength{\parindent}{0pt}
  % turn on hanging indent if param 1 is 1
  \ifodd #1
  \let\oldpar\par
  \def\par{\hangindent=\cslhangindent\oldpar}
  \fi
  % set entry spacing
  \setlength{\parskip}{#2\cslentryspacingunit}
 }%
 {}
\usepackage{calc}
\newcommand{\CSLBlock}[1]{#1\hfill\break}
\newcommand{\CSLLeftMargin}[1]{\parbox[t]{\csllabelwidth}{#1}}
\newcommand{\CSLRightInline}[1]{\parbox[t]{\linewidth - \csllabelwidth}{#1}\break}
\newcommand{\CSLIndent}[1]{\hspace{\cslhangindent}#1}
\ifLuaTeX
\usepackage[bidi=basic]{babel}
\else
\usepackage[bidi=default]{babel}
\fi
\babelprovide[main,import]{english}
% get rid of language-specific shorthands (see #6817):
\let\LanguageShortHands\languageshorthands
\def\languageshorthands#1{}
% Manuscript styling
\usepackage{upgreek}
\captionsetup{font=singlespacing,justification=justified}

% Table formatting
\usepackage{longtable}
\usepackage{lscape}
% \usepackage[counterclockwise]{rotating}   % Landscape page setup for large tables
\usepackage{multirow}		% Table styling
\usepackage{tabularx}		% Control Column width
\usepackage[flushleft]{threeparttable}	% Allows for three part tables with a specified notes section
\usepackage{threeparttablex}            % Lets threeparttable work with longtable

% Create new environments so endfloat can handle them
% \newenvironment{ltable}
%   {\begin{landscape}\centering\begin{threeparttable}}
%   {\end{threeparttable}\end{landscape}}
\newenvironment{lltable}{\begin{landscape}\centering\begin{ThreePartTable}}{\end{ThreePartTable}\end{landscape}}

% Enables adjusting longtable caption width to table width
% Solution found at http://golatex.de/longtable-mit-caption-so-breit-wie-die-tabelle-t15767.html
\makeatletter
\newcommand\LastLTentrywidth{1em}
\newlength\longtablewidth
\setlength{\longtablewidth}{1in}
\newcommand{\getlongtablewidth}{\begingroup \ifcsname LT@\roman{LT@tables}\endcsname \global\longtablewidth=0pt \renewcommand{\LT@entry}[2]{\global\advance\longtablewidth by ##2\relax\gdef\LastLTentrywidth{##2}}\@nameuse{LT@\roman{LT@tables}} \fi \endgroup}

% \setlength{\parindent}{0.5in}
% \setlength{\parskip}{0pt plus 0pt minus 0pt}

% Overwrite redefinition of paragraph and subparagraph by the default LaTeX template
% See https://github.com/crsh/papaja/issues/292
\makeatletter
\renewcommand{\paragraph}{\@startsection{paragraph}{4}{\parindent}%
  {0\baselineskip \@plus 0.2ex \@minus 0.2ex}%
  {-1em}%
  {\normalfont\normalsize\bfseries\itshape\typesectitle}}

\renewcommand{\subparagraph}[1]{\@startsection{subparagraph}{5}{1em}%
  {0\baselineskip \@plus 0.2ex \@minus 0.2ex}%
  {-\z@\relax}%
  {\normalfont\normalsize\itshape\hspace{\parindent}{#1}\textit{\addperi}}{\relax}}
\makeatother

% \usepackage{etoolbox}
\makeatletter
\patchcmd{\HyOrg@maketitle}
  {\section{\normalfont\normalsize\abstractname}}
  {\section*{\normalfont\normalsize\abstractname}}
  {}{\typeout{Failed to patch abstract.}}
\patchcmd{\HyOrg@maketitle}
  {\section{\protect\normalfont{\@title}}}
  {\section*{\protect\normalfont{\@title}}}
  {}{\typeout{Failed to patch title.}}
\makeatother

\usepackage{xpatch}
\makeatletter
\xapptocmd\appendix
  {\xapptocmd\section
    {\addcontentsline{toc}{section}{\appendixname\ifoneappendix\else~\theappendix\fi\\: #1}}
    {}{\InnerPatchFailed}%
  }
{}{\PatchFailed}
\keywords{spatial non-independence; cultural non-independence; cross-national analyses; simulations; replications; reanalyses\newline\indent Word count: 5102 words excl. Methods (Methods: 2163 words)}
\usepackage{lineno}

\linenumbers
\usepackage{csquotes}
\raggedbottom
\usepackage{setspace}
\AtBeginEnvironment{tabular}{\singlespacing}
\AtBeginEnvironment{lltable}{\singlespacing}
\AtBeginEnvironment{tablenotes}{\doublespacing}
\captionsetup[table]{font={stretch=1.5}}
\captionsetup[figure]{font={stretch=1,small}}
\nolinenumbers
\ifLuaTeX
  \usepackage{selnolig}  % disable illegal ligatures
\fi
\IfFileExists{bookmark.sty}{\usepackage{bookmark}}{\usepackage{hyperref}}
\IfFileExists{xurl.sty}{\usepackage{xurl}}{} % add URL line breaks if available
\urlstyle{same}
\hypersetup{
  pdftitle={Cross-national analyses require additional controls to account for the non-independence of nations},
  pdfauthor={Scott Claessens1*, Thanos Kyritsis1, \& Quentin D. Atkinson1,2*},
  pdflang={en-EN},
  pdfkeywords={spatial non-independence; cultural non-independence; cross-national analyses; simulations; replications; reanalyses},
  colorlinks=true,
  linkcolor={Maroon},
  filecolor={Maroon},
  citecolor={Blue},
  urlcolor={blue},
  pdfcreator={LaTeX via pandoc}}

\title{Cross-national analyses require additional controls to account for the non-independence of nations}
\author{Scott Claessens\textsuperscript{1*}, Thanos Kyritsis\textsuperscript{1}, \& Quentin D. Atkinson\textsuperscript{1,2*}}
\date{}


\shorttitle{Non-independence of nations}

\affiliation{\vspace{0.5cm}\textsuperscript{1} \footnotesize School of Psychology, University of Auckland, Auckland, New Zealand\\\textsuperscript{2} \footnotesize School of Anthropology and Museum Ethnography, University of Oxford, Oxford, United Kingdom \newline *email: \href{mailto:scott.claessens@gmail.com}{\nolinkurl{scott.claessens@gmail.com}}; \href{mailto:q.atkinson@auckland.ac.nz}{\nolinkurl{q.atkinson@auckland.ac.nz}}}

\abstract{%
Cross-national analyses test hypotheses about the drivers of variation in national outcomes. However, since nations are connected in various ways, such as via spatial proximity and shared cultural ancestry, cross-national analyses often violate assumptions of non-independence, inflating false positive rates. Here, we show that, despite being recognised as an important statistical pitfall for over 200 years, cross-national research in economics and psychology still does not sufficiently account for non-independence. In a review of the 100 highest-cited cross-national studies of economic development and values, we find that controls for non-independence are rare. When studies do control for non-independence, our simulations suggest that most commonly used methods are insufficient for reducing false positives in non-independent data. In reanalyses of twelve previous cross-national correlations, half of the estimates are compatible with no association after controlling for non-independence using global proximity matrices. We urge social scientists to sufficiently control for non-independence in cross-national research.
}


\begin{document}
\maketitle

\linenumbers

\hypertarget{introduction}{%
\section{Introduction}\label{introduction}}

Nations are an important population unit structuring modern human life. The nation in which someone is born has a large effect on what they can expect out of life, including their income level\textsuperscript{1}, life expectancy\textsuperscript{2}, mental health\textsuperscript{3}, subjective well-being\textsuperscript{4}, and educational attainment\textsuperscript{5}. Nations are also among the most important determinants of human cultural variation, with greater cultural similarity within than outside national borders\textsuperscript{6}.

Given the importance of nations for structuring human behaviour, there is justifiably huge interest in statistical analyses that attempt to predict variation in national outcomes of all kinds. At the time of writing, a search in Web of Science for the term ``cross-national'' in titles or abstracts returned over 13,000 unique hits. The standard practice for cross-national analyses is to conduct bivariate correlations or multiple regressions with individual data points representing different nations. Such analyses widen the scope of social science beyond Western populations\textsuperscript{7,8} and have been used to study, among other topics, the causes of variation in the economic wealth of nations\textsuperscript{9--12}, global patternings of cultural norms and values\textsuperscript{13--16}, and the universality and diversity of human behaviour and psychology around the world\textsuperscript{17--20}.

However, cross-national analyses are complicated by the fact that nations are not statistically independent data points. Unlike independent random samples from a population, nations are related to one another in a number of ways. First, nations that are closer to one another tend to be more similar than distant nations. This phenomenon is known as spatial non-independence\textsuperscript{21}, and it occurs because nations in close spatial proximity share characteristics due to local cultural diffusion of ideas\textsuperscript{22} and regional variation in climate and environment\textsuperscript{21}. For example, the neighbouring African nations Zambia and Tanzania have similar levels of terrain ruggedness, which has been used to partially explain their similar levels of economic development\textsuperscript{23}. This pattern conforms to Tobler's first law of geography: ``everything is related to everything else, but near things are more related than distant things''\textsuperscript{24} (p.~236).

Second, nations with shared cultural ancestry tend to be more similar than culturally unrelated nations. This is known as cultural phylogenetic non-independence\textsuperscript{25--27}, and occurs because related nations share cultural traits inherited via descent from a common ancestor. Shared cultural ancestry can result in a form of pseudoreplication, whereby multiple instances of the same trait across nations are merely duplicates of the ancestral original\textsuperscript{25,28}. For example, the related island nations Tonga and Tuvalu share similar languages and customs due to cultural inheritance from a common Polynesian population dating back more than 1,000 years\textsuperscript{29,30}. More recently, shared ancestry explains similarities in institutions, norms, technologies, and values between colonial settlements and their colonisers (e.g.~English, French, Spanish, and Portuguese settlements of the Americas). Importantly, these deep cultural connections between nations often span large geographic distances around the world. Tonga and Tuvalu share cultural traits despite being separated by over 1,500 kilometres of ocean, and South American and European nations remain culturally similar today despite their locations on two separate continents. Shared cultural ancestry must therefore be considered independently of spatial proximity in the study of nations.

Spatial and cultural phylogenetic non-independence between nations make cross-national inference challenging. A fundamental assumption of regression analysis is that model residuals should be independently and identically distributed\textsuperscript{31}. But without accounting for spatial or cultural non-independence between nations, model residuals can show structure that remains unaccounted for, violating this assumption. Treating nations as independent can thus inflate false positive rates\textsuperscript{32}, producing spurious relationships between variables that in fact only indirectly covary due to spatial or cultural connections\textsuperscript{33} (see Supplementary Figure \ref{fig:dag} for an example causal model).

Non-independence is widely acknowledged in fields that routinely deal with spatially or culturally structured data. In ecology and sociology, studies with regional-level data use a variety of autoregressive models designed to account for spatial patternings\textsuperscript{34,35}. In anthropology, researchers have recognised cultural non-independence as an important statistical pitfall for over 200 years, with issues of cultural pseudoreplication being identified in early comparative studies of marriage practices across societies\textsuperscript{25}. In the twentieth century, anthropologists began to emphasise that human societies do not develop independently, but rather exist in a globally interconnected world system linked by shared history and cultural ancestry\textsuperscript{36}. In order to minimise the confounding effects of this non-independence in comparisons of human societies, researchers compiled the Standard Cross-Cultural Sample of 186 cultures which deliberately avoids sampling closely related cultures\textsuperscript{28}, though it is difficult to completely remove spatial and cultural dependencies\textsuperscript{37,38} and the smaller sample of cultures reduces statistical power. Today, anthropologists borrow phylogenetic comparative methods from evolutionary biology, such as phylogenetic least squares regression\textsuperscript{39}, when comparing societies, treating culturally related societies in the same way as biologists treat genetically related species (e.g.\textsuperscript{40,41}).

At the national level, recent reanalyses have revealed that several cross-national relationships reported in economics and psychology do not hold when controlling for non-independence between nations. One working paper replicated 25 analyses of persistence in economics, in which modern national outcomes are regressed against historical characteristics of those nations, and found that over half of the relationships were attenuated when controlling for spatial non-independence\textsuperscript{42}. Another replication study found that many of the widely publicised relationships between national-level pathogen prevalence and political institutions and attitudes fail to hold when controlling for various kinds of non-independence\textsuperscript{43}. These reanalyses, and others\textsuperscript{44--46}, raise the question: how widespread a concern is non-independence in studies of national-level outcomes?

To address this question, we consider national-level variables of general interest across the social sciences: economic development and cultural values. These variables are frequently included as both outcomes and predictors in cross-national studies in economics and psychology\textsuperscript{9--16}. First, we demonstrate that economic development and cultural values are spatially and culturally non-independent across nations, emphasising the need to control for non-independence. Second, we review the 100 highest-cited cross-national studies of economic development and cultural values and determine baseline rates of controlling for non-independence in the literature. Third, we run simulations to determine whether common methods of dealing with non-independence in the literature sufficiently reduce false positive rates. Fourth, we reanalyse twelve previous cross-national analyses of economic development and cultural values from our literature review, incorporating global geographic and linguistic proximity matrices as controls for spatial and cultural non-independence.

\hypertarget{results}{%
\section{Results}\label{results}}

\hypertarget{national-level-economic-development-and-cultural-values-are-spatially-and-culturally-non-independent}{%
\subsection{National-level economic development and cultural values are spatially and culturally non-independent}\label{national-level-economic-development-and-cultural-values-are-spatially-and-culturally-non-independent}}

In order to motivate our research question, it is important to first quantify the degree of spatial and cultural non-independence for economic development and cultural values around the world. If these variables are independent or only weakly non-independent, then the issue might be safe to ignore. However, if they are more strongly non-independent, then there is a possibility that non-independence could be confounding cross-national inferences.

To this end, we used Bayesian multilevel models to simultaneously estimate geographic and cultural phylogenetic signal for a range of economic development and cultural values variables. For economic development, we focused on the Human Development Index\textsuperscript{47}, gross domestic product per capita, annual gross domestic product per capita growth, and the Gini index of income inequality. For cultural values, we focused on two primary dimensions of cultural values from the World Values Survey, traditional vs.~secular values and survival vs.~self-expression values\textsuperscript{16}, as well as cultural tightness\textsuperscript{14} and individualism\textsuperscript{15}. These variables are not intended to be a comprehensive list of all national-level variables included in cross-national research, but rather an illustrative set of variables that are widely used in the literature.

For all of these variables, we found that a substantial proportion of national-level variation was explained by spatial proximity and/or shared cultural ancestry between nations (Figure \ref{fig:plotSignal}; see Supplementary Table \ref{tab:tableSignal} for numerical results). Signal estimates were often strong, with spatial proximity and shared cultural ancestry frequently explaining over half of the national-level variation. For spatial proximity, Bayes Factors indicated strong evidence that the geographic signal estimates differed from zero for all economic development variables and traditional values. However, the evidence was only equivocal for survival values and individualism, and strong evidence was found that the geographic signal estimate for tightness was equal to zero. For shared cultural ancestry, Bayes Factors indicated strong evidence that the cultural phylogenetic signal estimates differed from zero for all economic development and cultural values variables except for gross domestic product per capita growth, for which the evidence was equivocal. These findings emphasise the need to account for spatial and cultural phylogenetic non-independence in cross-national analyses of economic development and cultural values.


\begin{figure}
\centering
\includegraphics{manuscript_files/figure-latex/plotSignal-1.pdf}
\caption{\label{fig:plotSignal}Posterior estimates of geographic and cultural phylogenetic signal for a range of economic development and cultural values variables. Geographic and cultural phylogenetic signal are operationalised as the proportion of national-level variance explained by geographic and linguistic proximity matrices. Grey ridges are full posterior distributions, points are posterior median values, and black lines are equal-tailed 50\% and 95\% credible intervals. Number of observations from these models are as follows: HDI (n = 1449), GDP per capita (n = 10289), GDP per capita growth (n = 9755), Gini index (n = 1826), traditional values (n = 277676), survival values (n = 277676), tightness (n = 57), and individualism (n = 67). HDI = Human Development Index; GDP = gross domestic product.}
\end{figure}

\hypertarget{previous-cross-national-analyses-have-not-sufficiently-accounted-for-non-independence}{%
\subsection{Previous cross-national analyses have not sufficiently accounted for non-independence}\label{previous-cross-national-analyses-have-not-sufficiently-accounted-for-non-independence}}

Given that economic development and cultural values show evidence of geographic and cultural phylogenetic signal, have cross-national analyses sufficiently accounted for this non-independence? To assess this, we searched the published literature for articles that combined the search terms ``economic development'' or ``values'' with the search terms ``cross-national'', ``cross-cultural'', or ``cross-country''. We removed articles that did not report original research, were not relevant to economic development or cultural values, or did not report at least one cross-national analysis. We then retained the 100 articles (50 for economic development, 50 for cultural values) with the highest annual rate of citations (see Supplementary Data 1). For each of these highly-cited articles, we exhaustively recorded every cross-national analysis reported in the main text (n = 4,308), identifying in each case whether or not the analysis attempted to control for spatial, cultural, or any other form of non-independence between nations (see Methods for detailed search criteria and coding decisions).

The results of our literature review show that most published articles containing cross-national analyses make no attempt to account for statistical non-independence. Figure \ref{fig:plotReview1}a plots the proportion of articles that contain at least one cross-national analysis accounting for non-independence. We find that 42\% of economic development articles contain at least one attempt to control for non-independence (two-tailed 95\% bootstrap confidence interval {[}0.30 0.54{]}), while this proportion decreases to only 8\% for cultural values articles (two-tailed 95\% bCI {[}0.02 0.16{]}). Both kinds of article are most likely to use regional fixed effects (e.g.~continent fixed effects) to account for non-independence, but some articles also include controls for spatial distance (e.g.~latitude) and shared cultural history (e.g.~colony status). These proportions are even lower when focusing on the full sample of 4,308 analyses: only 5\% (equal-tailed 95\% credible interval {[}0.02 0.13{]}) of individual economic development analyses and 1\% (equal-tailed 95\% CI {[}0.00 0.02{]}) of individual cultural values analyses are estimated to control for non-independence (Supplementary Figure \ref{fig:plotReview2}).


\begin{figure}
\centering
\includegraphics{manuscript_files/figure-latex/plotReview1-1.pdf}
\caption{\label{fig:plotReview1}Results from literature review of 100 highly-cited cross-national studies of economic development (red) and cultural values (blue). (a) Proportion of articles containing at least one analysis accounting for non-independence, overall and split by common methods of controlling for non-independence. Points represent raw proportions of articles and ranges represent two-tailed 95\% bootstrap confidence intervals (n = 1000 bootstrap samples). (b) The association between journal impact factor and the probability that an article contains at least one analysis accounting for non-independence. (c) Estimated trend over time for the probability that an article contains at least one analysis accounting for non-independence. Lines and shaded areas are posterior median regression lines and equal-tailed 50\% credible intervals from Bayesian logistic regression models (n = 100 observations). Dots represent raw counts of individual articles that did (top) or did not (bottom) account for non-independence. Region FEs = region fixed effects.}
\end{figure}

While our review contains articles from journals with a range of impact factors, our estimates could be biased downwards by analyses published in lower impact outlets with more relaxed standards for issues like non-independence. It is also possible that, since our literature review goes back as far as 1993, our estimates are being biased downwards by earlier studies, and that controls for non-independence have increased over time with methodological advancements and greater awareness of the issue. To test these possible explanations for our low estimates, we fitted logistic regression models to the data from the review, including log journal impact factor and publication year as separate predictors. Interestingly, we found that, if anything, studies from higher impact journals were less likely to include at least one control for non-independence than studies from lower impact journals, both for studies of economic development (b = -0.38, equal-tailed 95\% CI {[}-0.87 0.09{]}) and for studies of cultural values (b = -0.56, equal-tailed 95\% CI {[}-1.10 -0.05{]}; Figure \ref{fig:plotReview1}b). Moreover, splines revealed no relationship between publication year and the probability of including at least one control for non-independence, both for studies of economic development (b = -0.13, equal-tailed 95\% CI {[}-1.10 0.82{]}) and for studies of cultural values (b = -0.02, equal-tailed 95\% CI {[}-1.00 0.96{]}; Figure \ref{fig:plotReview1}c).

\hypertarget{common-methods-of-controlling-for-non-independence-are-insufficient-for-reducing-false-positive-rates-in-non-independent-data}{%
\subsection{Common methods of controlling for non-independence are insufficient for reducing false positive rates in non-independent data}\label{common-methods-of-controlling-for-non-independence-are-insufficient-for-reducing-false-positive-rates-in-non-independent-data}}

Our literature review revealed that most cross-national analyses in the literature do not control for spatial or cultural phylogenetic non-independence. When they do, they tend to include controls like latitude and regional fixed effects. Do these methods sufficiently account for statistical non-independence?

To compare the efficacy of different methods in the literature, we conducted a simulation study. We simulated national-level datasets (n = 236 nations) with varying degrees of spatial or cultural phylogenetic autocorrelation (i.e.~non-independence) for outcome and predictor variables, but with no direct causal relationship between the variables. We then fitted naive regressions without controls to these datasets, as well as regression models with controls for latitude, longitude, and continent fixed effects. Despite not being identified in our literature review, we also included other methods that are often used in the literature to account for non-independence. Additional spatial controls included the mean of the predictor variable within a surrounding 2000km radius (e.g.\textsuperscript{48}) and Conley standard errors\textsuperscript{49,50} based on geographic distances between nations (e.g.\textsuperscript{19,48}). Additional cultural controls included fixed effects for the language families of the majority-spoken languages in each nation (e.g.\textsuperscript{51}) and Conley standard errors based on genetic distances between nations (e.g.\textsuperscript{19,48}). These fixed effect approaches attempt to account for non-independence by holding geographic location constant (latitude, longitude), discarding between-region variation and exploiting only local variation (continent fixed effects, mean of surrounding 2000km), or correcting standard errors for autocorrelation post-hoc while leaving model coefficients unchanged (Conley standard errors).

Beyond fixed effect approaches, we also fitted Bayesian random effects regressions that explicitly model spatial and/or cultural phylogenetic non-independence by allowing nations to covary according to geographic and/or linguistic proximity matrices. Geographic proximity between nations is calculated from inverse distances between longitude and latitude coordinates. Linguistic proximity between nations is calculated from a global phylogenetic tree that represents hierarchical relationships of genealogical descent for all languages in the world. For each pair of nations, we calculated inverse phylogenetic distances (i.e.~number of branches separating two taxa) between all languages spoken in that nation pair and produced an average linguistic proximity score weighted by the percentages of speakers within those nations. To include the resulting geographic and linguistic proximity matrices in our models, we included a Gaussian process\textsuperscript{52,53} over latitude and longitude values and/or assumed that nation random intercepts were correlated in proportion to their linguistic proximity\textsuperscript{54}. These random effects approaches attempt to account for non-independence by modelling the covariance between nations that is induced by their geographic or linguistic connections.

Figures \ref{fig:plotSim3} and \ref{fig:plotSim4} plot the estimated false positive rates from our simulation study, split by different methods and different degrees of spatial or cultural phylogenetic autocorrelation (see Supplementary Tables \ref{tab:tableSim1} and \ref{tab:tableSim2} for numerical results and Supplementary Figures \ref{fig:plotSim1} and \ref{fig:plotSim2} for full distributions of effect sizes under strong autocorrelation). Across all model types, false positive rates were measured as the proportion of models that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero, falsely inferring a relationship when none is present. For reference, weak autocorrelation in our simulation is comparable to the geographic signal for survival values in Figure \ref{fig:plotSignal} (i.e.~20\% of the national-level variance is explained by non-independence), while moderate and strong levels of autocorrelation are comparable to the cultural phylogenetic signal for traditional and survival values, respectively (i.e.~50\% and 80\% of the national-level variance is explained by non-independence).

Our simulation study revealed that with at least moderate degrees of spatial or cultural phylogenetic autocorrelation for both outcome and predictor variables, naive regression models produce false positive rates above chance levels. This false positive rate increases as the degree of autocorrelation increases. With strong spatial autocorrelation for both outcomes and predictors, false positive rates reach as high as 77\%. We find a slightly lower false positive rate under strong cultural phylogenetic autocorrelation, though this false positive rate is still greater than expected by chance (36\%).


\begin{figure}
\centering
\includegraphics{manuscript_files/figure-latex/plotSim3-1.pdf}
\caption{\label{fig:plotSim3}False positive rates for different methods of controlling for spatial non-independence in our simulation study. For simulated outcome and predictor variables, we systematically varied the strength of spatial autocorrelation, from weak (0.2) to moderate (0.5) to strong (0.8). We simulated 100 datasets per parameter combination and fitted different models to each dataset. False positive rates were operationalised as the proportion of models that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero. Points represent raw proportions of false positive models, ranges represent two-tailed 95\% bootstrap confidence intervals (n = 1000 bootstrap samples), and dashed lines indicate the 5\% false positive rate that is expected due to chance. Colours indicate whether the strength of autocorrelation for the predictor variable is 0.2 (red), 0.5, (green) or 0.8 (blue). SEs = standard errors.}
\end{figure}


\begin{figure}
\centering
\includegraphics{manuscript_files/figure-latex/plotSim4-1.pdf}
\caption{\label{fig:plotSim4}False positive rates for different methods of controlling for cultural phylogenetic non-independence in our simulation study. For simulated outcome and predictor variables, we systematically varied the strength of cultural phylogenetic autocorrelation, from weak (0.2) to moderate (0.5) to strong (0.8). We simulated 100 datasets per parameter combination and fitted different models to each dataset. False positive rates were operationalised as the proportion of models that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero. Points represent raw proportions of false positive models, ranges represent two-tailed 95\% bootstrap confidence intervals (n = 1000 bootstrap samples), and dashed lines indicate the 5\% false positive rate that is expected due to chance. Colours indicate whether the strength of autocorrelation for the predictor variable is 0.2 (red), 0.5, (green) or 0.8 (blue). SEs = standard errors.}
\end{figure}

Most methods common in the literature do not reduce these high false positive rates. With strong spatial autocorrelation for both outcome and predictor variables, false positive rates remain above 50\% when controlling for latitude, longitude, and language family fixed effects (Figure \ref{fig:plotSim3}). Similarly, Conley standard error corrections based on spatial and genetic distances do not reduce false positive rates below 40\% under strong spatial autocorrelation. The most effective fixed effects methods are continent fixed effects, which continue to produce a false positive rate of 35\% under strong spatial autocorrelation, and controlling for the mean of the predictor variable within a 2000km radius, which eliminates false positives under even strong spatial autocorrelation (6\%). However, additional simulations revealed that these reductions in false positive rates come at the cost of lower statistical power (see Supplementary Figures \ref{fig:plotPowerGeo01} - \ref{fig:plotPowerGeo05}). In additional simulations where the true relationship between the predictor and outcome variable was known, power analyses showed that both continent fixed effects and the 2000km radius control had less than 80\% power to detect moderate true correlations (r = 0.3) under strong spatial autocorrelation.

By contrast, Bayesian spatial Gaussian process regression with longitude and latitude strikes a balance between reducing false positives and retaining high statistical power to detect true effects. This approach reduces false positives to 15\% under moderate spatial autocorrelation and 23\% under strong spatial autocorrelation. Random effects models that additionally account for linguistic proximity between nations perform equally well, though models with only linguistic covariance continue to produce false positives. False positives are not completely eliminated with these random effects models. Nevertheless, these methods have at least 80\% power to detect moderate (r = 0.3) and large (r = 0.5) true correlations between variables under all levels of spatial autocorrelation (see Supplementary Figures \ref{fig:plotPowerGeo01} - \ref{fig:plotPowerGeo05}).

In our simulation of cultural phylogenetic non-independence, we find that none of the fixed effects methods reduce false positive rates (Figure \ref{fig:plotSim4}). Controls for latitude, longitude, continent fixed effects, the mean of the predictor variable in a 2000km radius, and Conley standard error corrections based on spatial and genetic distances do little to change false positive rates. Even language family fixed effects continue to produce a false positive rate of 32\% under strong cultural phylogenetic autocorrelation. By contrast, models with random effects covarying according to linguistic proximity completely eliminate false positives across all degrees of cultural phylogenetic autocorrelation. This approach is also the only method that is able to detect large true correlations (r = 0.5) with at least 80\% power (see Supplementary Figures \ref{fig:plotPowerLin01} - \ref{fig:plotPowerLin05}). Random effects models that additionally account for geographic proximity between nations perform equally well, though models with only a spatial Gaussian process continue to produce false positives.

\hypertarget{key-findings-in-the-literature-are-not-robust-to-reanalysis-with-more-rigorous-methods}{%
\subsection{Key findings in the literature are not robust to reanalysis with more rigorous methods}\label{key-findings-in-the-literature-are-not-robust-to-reanalysis-with-more-rigorous-methods}}

Our literature review and simulation study have shown that controls for non-independence are rare in cross-national studies of economic development and cultural values, and when studies do attempt to control for non-independence, the methods typically used are unable to sufficiently reduce false positive rates. This raises the worrying possibility that the cross-national literature in economics and psychology is populated with spurious relationships.

To determine how widespread this issue of spurious cross-national relationships might be, we reanalysed a subset of twelve previous cross-national analyses from our literature review, controlling for spatial and cultural phylogenetic non-independence using global geographic and linguistic proximity matrices. Out of the 100 papers included in our literature review, primary or secondary data were publicly available for 47 papers. We attempted to replicate key statistically significant cross-national correlations from these papers --- mostly initial bivariate regression specifications without covariates (see Methods) --- and stopped when we had sampled a set of twelve analyses for which we were able to replicate the original result. The final set included six analyses from our economic development review\textsuperscript{55--60} and six from our cultural values review\textsuperscript{13,14,16,61--63} that had available data and were able to be replicated. We pre-registered this set before running any control models (\url{https://osf.io/uywx8/}). We controlled for non-independence by including (1) a Gaussian process allowing nation random intercepts to covary according to a geographic proximity matrix, and/or (2) nation random intercepts that covaried according to a linguistic proximity matrix (see Supplementary Methods for full models).

Figure \ref{fig:plotReplications1} visualises the results of our reanalysis (see Supplementary Table \ref{tab:tableReplications} for numerical results). Cross-national correlation effect sizes tended to reduce when controlling for statistical non-independence between nations, sometimes by as much as half of the original effect size. Overall, after controlling for non-independence, six out of twelve cross-national associations had 95\% credible intervals that included zero. For the economic development analyses, four out of six cross-national relationships had 95\% credible intervals including zero when controlling for spatial non-independence. For the cultural values analyses, two out of six cross-national relationships had 95\% credible intervals including zero when controlling for cultural phylogenetic non-independence. Supplementary Figure \ref{fig:plotReplications2} shows these cross-national correlations plotted against the raw data.


\begin{figure}
\centering
\includegraphics{manuscript_files/figure-latex/plotReplications1-1.pdf}
\caption{\label{fig:plotReplications1}Posterior correlations from our reanalysis of twelve previous cross-national analyses. For each previous cross-national relationship, we plot the posterior slopes from a naive regression (red), a regression controlling for spatial non-independence (green), a regression controlling for cultural phylogenetic non-independence (blue), and a regression controlling for both spatial and cultural phylogenetic non-independence simultaneously (purple). All outcome and predictor variables are standardised. Most analyses are simple bivariate cross-national correlations, but Gelfand et al.~(2011) is a partial correlation controlling for log gross national income and Adamczyk and Pitt (2009) is a multilevel model including several covariates. Coloured ridges are full posterior distributions, and points and black lines represent posterior medians and equal-tailed 95\% credible intervals. Numbers of observations from the models are as follows, from top to bottom: n = 69, n = 45, n = 103, n = 98, n = 63, n = 89, n = 33, n = 75, n = 67, n = 28, n = 38, and n = 28. GDP = gross domestic product. FLFP = female labour force participation.}
\end{figure}

To understand why some cross-national correlations were attenuated by controls for non-independence while others were robust, we further explored our fitted models for evidence of spatial and cultural autocorrelation. For each outcome variable, our Gaussian process models provided varying estimates of how quickly spatial autocorrelation declined with distance (Supplementary Figure \ref{fig:plotReplications3}). For example, in Skidmore and Toya\textsuperscript{60} gross domestic product growth was only moderately spatially autocorrelated at 1,000 km distance (posterior median spatial autocorrelation at 1,000 km = 0.42, equal-tailed 95\% CI {[}0.07 0.90{]}), whereas in Inglehart and Baker\textsuperscript{16} traditional values were strongly spatially autocorrelated at the same distance (posterior median spatial autocorrelation at 1,000 km = 0.96, 95\% CI {[}0.81 0.99{]}). We also found varying estimates of cultural phylogenetic signal (Supplementary Figure \ref{fig:plotReplications4}), with some outcome variables expressing low signal (e.g.~confidence in institutions\textsuperscript{63}; posterior median = 0.07, 95\% CI {[}0.00 0.53{]}) and others expressing high signal (e.g.~female labour force participation\textsuperscript{62}; posterior median = 0.89, 95\% CI {[}0.63 0.98{]}). Exploratory regressions provided suggestive evidence that stronger estimates of spatial autocorrelation or cultural phylogenetic signal resulted in a more pronounced reduction in the effect size when controlling for non-independence between nations (Supplementary Figure \ref{fig:plotReplications5}). However, these negative slopes for spatial autocorrelation (b = -0.19, 95\% CI {[}-1.33 1.04{]}) and cultural phylogenetic signal (b = -0.28, 95\% CI {[}-1.26 0.70{]}) were both very uncertain, due to the small number of analyses and the posterior uncertainty in effect sizes and estimates of non-independence.

\hypertarget{discussion}{%
\section{Discussion}\label{discussion}}

In a literature review and simulation, we found that cross-national studies in economics and psychology rarely account for non-independence between nations, and, when they do, the methods they use are insufficient to reduce false positives in non-independent data. In a reanalysis of twelve cross-national correlations, we further showed that neglecting to account for non-independence has resulted in potentially spurious relationships in the published literature, with half of the correlations failing to replicate when controlling for spatial or cultural non-independence with more rigorous methods. These findings suggest that cross-national analyses in economics and psychology should be interpreted with caution until non-independence is sufficiently accounted for.

Our initial analyses add to and clarify existing evidence regarding the degree of non-independence for national-level economic and cultural variables. One previous study suggested that geographic proximity is more important than deep cultural ancestry in explaining the distribution of human development across Eurasian nations, though the authors noted that their small sample of 44 nations and regional focus limited their statistical power\textsuperscript{64}. By contrast, our global samples of over 160 nations revealed strong cultural phylogenetic signal, as well as geographic signal, for the Human Development Index, GDP per capita, and the Gini index of inequality. Another previous study found that similarities in the cultural values of nations are predicted by linguistic, but not geographic, distances between those nations\textsuperscript{6}. We find this same result for survival vs.~self-expression values, cultural tightness, and individualism, but for traditional vs.~secular values we find that both linguistic and geographic proximity are important independent predictors of global variation. These findings emphasise the need to account for both spatial and cultural phylogenetic non-independence in cross-national studies of economic development and cultural values.

Crucially, our literature review and simulation study revealed that the most commonly used controls for non-independence do not sufficiently deal with the issue. In our simulations, controlling for either latitude or longitude did not reduce false positive rates. This result calls into question the use of controls like distance to the equator to account for non-independence in cross-national regression models, though these controls may still be suitable to account for regional or latitudinal variation in climate, ecology, and natural threats (e.g.~pathogens), which we did not simulate. High false positive rates persisted with Conley standard errors, despite recent claims that these standard error corrections are sufficient to deal with spatial non-independence\textsuperscript{65}. The simulation also confirmed the assertion that fixed effects for spatial or cultural groupings (e.g.~continent or language family fixed effects) are insufficient because non-independence still remains within groupings\textsuperscript{43}. This logic further applies to analyses that control for non-independence by separately analysing different regions (e.g.\textsuperscript{66}). Controlling for the mean of the predictor variable within a 2000km radius\textsuperscript{48} eliminated false positive rates in spatially autocorrelated data, but had reduced statistical power to detect true associations. Across all model types in our simulation, the only methods that reduced false positive rates while retaining high statistical power were the random effects models with covariance matrices. The important advantage of these models is not that they are Bayesian per se (any of the approaches used here could be implemented in a Bayesian framework), but rather that they explicitly model covariance as a function of spatial or cultural distance.

There are other approaches to controlling for non-independence that we did not include in our simulation. For example, conditional autoregressive models\textsuperscript{34} and generalised additive models\textsuperscript{67} are approaches that can be applied in both frequentist and Bayesian frameworks. There are also alternative ways to operationalise cultural distances between nations beyond linguistic distances, including metrics like cultural fixation indices (e.g.~cultural \(F_{ST}\)\textsuperscript{6,68}), covariance based on genetic distances\textsuperscript{69}, and phylogenetic distances between religious traditions. We see merit in each of these approaches and the use of one over another will depend on the specific question at hand. We decided to focus on linguistic distances in this study since language is a tangible socially-learned trait that has previously been used to successfully track the effects of deep cultural ancestry on modern national outcomes\textsuperscript{64,70,71}. Future work should explore whether other approaches are sufficient to reduce false positive rates in spatially and culturally non-independent data. In addition to spatial proximity and shared cultural ancestry, we did not simulate other sources of non-independence that potentially exist in real cross-national datasets, such as modern connections between nations due to flows of people and information (e.g.~flight networks, social media networks) and shared histories of colonialism and capitalist modes of production that have shaped today's global landscape\textsuperscript{72,73}. Additional controls will be required to ensure that these sources of non-independence do not confound cross-national inferences.

Ours is not the first review to show that studies are misapplying statistical methods in ways that inflate false positive rates. For example, other literature reviews have shown that studies in the social sciences tend to use small samples of participants\textsuperscript{74}, treat ordinal data as metric\textsuperscript{75}, incorrectly handle missing values\textsuperscript{76}, and ignore best practices in meta-analyses\textsuperscript{77}. Why do cross-national studies also rarely account for non-independence? At the institutional level, one possibility is that such practices are incentivised because they generate statistically significant relationships, which increase the probability that a study is published\textsuperscript{74}. Indeed, we found that controls for non-independence were less common among articles published in high impact journals, suggesting that researchers are rewarded for such practices. At the individual level, another possibility is that researchers outside of anthropology and ecology are less aware of the problem, or believe that the problem does not apply to analyses of nations. Even if researchers appreciate the problem, they might not know of suitable controls or perceive the methods to be too complex.

These institutional- and individual-level barriers can be combatted. First, cross-national replication studies like ours and others\textsuperscript{42--46}, combined with the methodological reviews included in Registered Reports\textsuperscript{78}, might change incentive structures and encourage researchers to analyse the world's nations with more rigorous methods. Second, more explicit descriptions of causal models could promote controls for non-independence by clearly outlining the nature of confounding and the sources of autocorrelation in cross-national data\textsuperscript{79}. The causal model outlined in Supplementary Figure \ref{fig:dag} is a useful example, but individual studies must outline their own particular causal assumptions, which may include further sources of non-independence and confounding variables to control for (e.g.~post-communist status, colony status). These causal models can then be used to design tailored statistical estimation strategies. Indeed, in our review, economists studying economic development dealt with national-level non-independence more than psychologists studying cultural values, likely because economics studies tend to be lengthy statistical exercises that systematically incorporate or exclude numerous variables in an attempt to infer causation. Third, the recent widespread accessibility of open source statistical software, such as the programming language Stan\textsuperscript{80} and the R package brms\textsuperscript{81}, should promote the use of more rigorous methods to control for non-independence. Using brms, for example, Bayesian Gaussian process regression is straightforward to conduct, requiring only longitude and latitude values for nations. We have provided an online tutorial to help researchers apply these methods to their own cross-cultural datasets (\url{https://scottclaessens.github.io/blog/2022/crossnational/}).

Until such changes are implemented and sufficient controls for non-independence are the norm, existing cross-national correlations should be interpreted with caution. In our reanalyses, we found that half of the cross-national correlations had equal-tailed 95\% credible intervals that included zero when controlling for spatial and/or cultural phylogenetic non-independence. While these results are in line with previous reanalyses\textsuperscript{42}, we note that we are unable to outright reject the claims from these studies, since we only reanalysed the first bivariate regression specifications presented in the papers\textsuperscript{65}. More detailed sets of reanalyses would be required to comprehensively challenge the claims from these specific papers. Nevertheless, these reanalyses do show, more broadly, that the problem of statistical non-independence applies to a wider range of national-level variables than those identified by previous work, such as parasite stress and democratic outcomes\textsuperscript{43}. Moreover, given our finding that most studies in the current cross-national literature do not deal with non-independence at all, our reanalyses raise the worrying possibility that this literature is populated with spurious relationships. Future work should expand our set of reanalyses to determine the extent of this problem in the literature.

We do not wish to dissuade researchers from conducting cross-national studies. On the contrary, such work promises to deepen understanding of our world, including the causes and consequences of economic development and cultural values. Moreover, cross-national studies allow social scientists to broaden their scope of study beyond Western populations\textsuperscript{7}, providing the representative samples necessary to test evolutionary and socio-ecological theories of human behaviour\textsuperscript{8,82}. But in order to minimise spurious relationships in global datasets, we urge researchers to control for spatial and cultural phylogenetic non-independence when reporting cross-national correlations. Nations are not independent, and our statistical models must reflect this.

\hypertarget{methods}{%
\section{Methods}\label{methods}}

\hypertarget{geographic-and-cultural-phylogenetic-signal-for-measures-of-economic-development-and-cultural-values}{%
\subsection{Geographic and cultural phylogenetic signal for measures of economic development and cultural values}\label{geographic-and-cultural-phylogenetic-signal-for-measures-of-economic-development-and-cultural-values}}

To estimate the degree of spatial and cultural phylogenetic non-independence in economic development and cultural values, we calculated geographic and cultural phylogenetic signal for global measures of development and values. For economic development variables, we retrieved longitudinal data on the Human Development Index\textsuperscript{47} (1990 - 2019; n = 189 nations), gross domestic product per capita (1960 - 2021; n = 209 nations), annual percentage growth in gross domestic product per capita (1961 - 2021; n = 208 nations), and the Gini coefficient of income inequality (1967 - 2021; n = 167 nations). Human development data were retrieved from the United Nations Development Programme (\url{https://hdr.undp.org/en/content/download-data}) and data for all other economic development variables were retrieved from the World Bank (\url{https://data.worldbank.org/}). For cultural values variables, we retrieved longitudinal data on traditional vs.~secular values and survival vs.~self-expression values from the World Values Survey\textsuperscript{16} (1981 - 2019; n = 116 nations). We downloaded the full Integrated Values Survey, which included all waves from the World Values Survey and the European Values Survey, and computed the two dimensions of cultural values following procedures from previous research\textsuperscript{16}. Additionally, we retrieved cross-sectional data on cultural tightness (n = 57 nations) and individualism (n = 97 nations) from previous work\textsuperscript{13,83}.

To calculate geographic and cultural phylogenetic signal, we created two proximity matrices for 269 of the world's nations: a geographic proximity matrix and a linguistic proximity matrix. Geographic distance between two nations was calculated as the logged geodesic distance between nation capital cities (data from the maps R package\textsuperscript{84}) using the geosphere R package\textsuperscript{85}. The geographic proximity matrix was computed as one minus the log geographic distance matrix scaled between 0 and 1. Linguistic proximity between two nations was calculated as the cultural proximity between all languages spoken within those nations, weighted by speaker percentages. We acquired cultural proximity data by combining the language family trees provided by Glottolog v3.0\textsuperscript{86} into one global language tree (undated and unresolved). We calculated cultural proximity \(s\) between two languages \(j\) and \(k\) as the distance (in number of nodes traversed) of their most recent common ancestor \(i\) to the root of the tree, through the formula:

\begin{gather}
s_{jk} = \frac{n_{r}-n_{i}}{n_{r}}
\end{gather}

where \(n_{r}\) is the maximum path length (in number of nodes traversed) leading to the pan-human root \(r\), and \(n_{i}\) is the maximum path length leading to node \(i\). We then combined these proximities with speaker data from Ethnologue 21\textsuperscript{87} and compared every language spoken within those nations by at least 1 permille of the population, weighted by speaker percentages, through the formula:

\begin{gather}
w_{lm} = {\Sigma}{\Sigma}p_{lj}p_{mk}s_{jk}
\end{gather}

where \(p_{lj}\) is the percentage of the population in nation \(l\) speaking language \(j\), \(p_{mk}\) is the percentage of the population in nation \(m\) speaking language \(k\), and \(s_{jk}\) is the proximity measure between languages \(j\) and \(k\)\textsuperscript{88}. This calculation resulted in a linguistic proximity matrix with values between 0 and 1.

We included these matrices in Bayesian multilevel models, allowing nation random intercepts to covary according to both geographic and linguistic proximity simultaneously. These models were fitted with the R package brms\textsuperscript{81} and converged normally (\(\hat{R}\) \textless{} 1.1). The assumptions of these models were met: residuals were approximately normally distributed, though this was not formally tested. Estimates of geographic and cultural phylogenetic signal were computed as the proportion of national-level variance in these models explained by geographic and linguistic proximity matrices.

\hypertarget{literature-review}{%
\subsection{Literature review}\label{literature-review}}

We exported two searches from Web of Science (\url{https://www.webofknowledge.com/}) on 27\textsuperscript{th} September 2021, restricting our searches to articles published between 1900 and 2018. The first search was for the terms ``economic development'' AND (``cross-national'' OR ``cross-cultural'' OR ``cross-country''), which returned 965 articles. The second search was for the terms ``values'' AND (``cross-national'' OR ``cross-cultural'' OR ``cross-country''), which returned 6806 articles. As this was not a formal systematic literature review, we did not follow PRISMA\textsuperscript{89} guidelines for systematic literature reviews.

Once exported, we ordered the articles by descending number of citations per year since initial publication, using citation counts reported by Web of Science. We then coded each article, in order, for inclusion in our review. Articles were only included if: (1) they were judged to be relevant to economic development or cultural values; (2) they were an original empirical research article; and (3) they contained at least one analysis with national-level outcome or predictor variables. We stopped when we had included 50 articles for the economic development review and 50 articles for the cultural values review.

Within each included article, we exhaustively coded every individual cross-national analysis reported in the main text. We coded mainly correlation or regression analyses, and explicitly excluded meta-analyses, factor analyses, measurement invariance analyses, multidimensional scaling analyses, hierarchical clustering analyses, multiverse analyses, and scale development / validation analyses. We also excluded analyses that compared only two, three, four, five, or six nations. For each included analysis, we recorded the year, impact factor of the journal (retrieved from \url{https://jcr.clarivate.com/jcr/home}), outcome variable, all predictor variables, test statistic, p-value, number of nations, number of data points, model type, if the data were available, and whether and how the analysis attempted to control for non-independence.

We coded common attempts to control for non-independence between nations. These included: (1) any higher-level control variables for spatial regional groupings (e.g.~continent fixed effects); (2) any geographic distance control variables (e.g.~distance between capital cities, distance from equator, latitude); (3) any control variables capturing shared cultural history (e.g.~former colony, legal origin fixed effects, linguistic history, cultural influence); and (4) any other control variables, tests, or approaches that were deemed as attempts to control for non-independence (e.g.~eigenvector filtering\textsuperscript{90}, controls for trade-weightings between nations, cross-sectional dependence tests\textsuperscript{91}, separate analyses for subsets of nations). These were coded by the first author.

Once we had compiled our review database, we calculated the proportion of articles attempting to control for non-independence at least once. We also calculated the proportion of articles employing the different types of control listed above at least once: regional fixed effects, distance, shared cultural history, or other. For these proportions, we calculated two-tailed 95\% bootstrap confidence intervals with 1,000 bootstrap iterations. Additionally, we predicted the probability of an article attempting to control for non-independence at least once using Bayesian logistic regression, including in separate models log journal impact factor and year of publication as linear and spline predictors, respectively.

For individual analyses, we dealt with the nested nature of the data (analyses nested within articles) by fitting Bayesian multilevel logistic regression models with review type (economic development vs.~cultural values) as the sole fixed effect and random intercepts for articles. We fitted these models separately for overall attempts to control for non-independence and split by method type. We report the adjusted proportions with equal-tailed 95\% credible intervals (see Results and Supplementary Figure \ref{fig:plotReview2}). Additionally, we predicted the probability of an analysis attempting to control for non-independence using Bayesian multilevel logistic regression with random intercepts for articles. In separate models, we included log journal impact factor and year of publication as linear and spline predictors, respectively. All Bayesian models were fitted with the brms R package\textsuperscript{81}. Our priors were informed by prior predictive checks, and all models converged normally (\(\hat{R}\) \textless{} 1.1). The assumptions of these models (i.e., binary nested data) were met.

\hypertarget{simulations}{%
\subsection{Simulations}\label{simulations}}

We simulated data for 236 nations \(i\) with varying degrees of spatial or cultural phylogenetic signal for outcome \(y\) and predictor \(x\) using the following generative model:

\begin{gather}
\begin{bmatrix}y_i\\x_i \end{bmatrix} \sim \text{MVNormal}
\begin{pmatrix}\begin{bmatrix}\alpha_y\\\alpha_x \end{bmatrix},\textbf{S}\end{pmatrix}\\
\alpha_y \sim \text{Normal}(0, \sqrt{\lambda} \cdot \Sigma) \nonumber \\
\alpha_x \sim \text{Normal}(0, \sqrt{\rho} \cdot \Sigma) \nonumber \\
\textbf{S} = 
\begin{pmatrix}\sqrt{1 - \lambda} & 0 \\ 0 & \sqrt{1 - \rho} \end{pmatrix}
\begin{pmatrix}1 & r \\ r & 1\end{pmatrix}
\begin{pmatrix}\sqrt{1 - \lambda} & 0 \\ 0 & \sqrt{1 - \rho} \end{pmatrix} \nonumber
\end{gather}

where \(\Sigma\) is a correlation matrix proportional to either geographic or linguistic proximities between nations, \(\lambda\) and \(\rho\) are autocorrelation parameters that represent the expected spatial or cultural phylogenetic signal for outcome and predictor variables, respectively, and \(r\) is the true cross-national correlation between the variables after accounting for autocorrelation. Importantly, when \(r = 0\) in this simulation, we know that there is no direct causal relationship between \(y\) and \(x\). Instead, any relationship between the two variables is merely the result of autocorrelation.

We set the autocorrelation parameters \(\lambda\) and \(\rho\) to either 0.2 (weak), 0.5 (moderate), or 0.8 (strong). We also initially set the true cross-national correlation to 0 in order to determine false positive rates, and then additionally set \(r\) to 0.1 (small effect), 0.3 (medium effect), and 0.5 (large effect) in order to determine statistical power to detect true effects. For each parameter combination, we simulated 100 datasets, resulting in 3600 datasets. Each dataset had 236 rows representing different nations, with the following associated data for each nation: latitude, longitude, continent (Africa, Asia, Europe, North America, Oceania, or South America), language family of the nation's majority spoken language (Afro-Asiatic, Atlantic-Congo, Austroasiatic, Austronesian, Eskimo-Aleut, Indo-European, Japonic, Kartvelian, Koreanic, Mande, Mongolic-Khitan, Nilotic, Nuclear Trans New Guinea, Sino-Tibetan, Tai-Kadai, Tupian, Turkic, or Uralic), the mean of the predictor variable within a 2000km radius, and coordinates for genetic distances from a previous study\textsuperscript{19} (only available for 177 nations).

With the resulting simulated datasets, we standardised outcome and predictor variables and fitted eleven different models: (1) naive regression without controls, (2) regression with latitude control, (3) regression with longitude control, (4) regression with continent fixed effects, (5) regression with language family fixed effects, (6) regression controlling for the mean of the predictor variable in a 2000km radius, (7) regression employing Conley standard errors based on geographic distances, (8) regression employing Conley standard errors based on genetic distances, (9) Bayesian regression including a Gaussian process over latitudes and longitudes, (10) Bayesian regression including random intercepts covarying according to linguistic proximity, and (11) Bayesian regression including both a Gaussian process over latitudes and longitudes and random intercepts covarying according to linguistic proximity.

Models employing Conley standard errors either required latitude and longitude values or coordinates for genetic distances. To determine distance cutoffs, we employed an approach recommended in previous work\textsuperscript{92}: we fitted models with a range of feasible distance cutoffs and retained the model with the largest standard error for the slope parameter. These models were fitted using the conleyreg R package\textsuperscript{93}. Bayesian models were fitted using the brms R package\textsuperscript{81}. Our choice of priors was based on prior predictive simulation. All models converged normally (\(\hat{R}\) \textless{} 1.1). Across all model types and parameter combinations, we calculated the false positive rate as the proportion of models that estimated slopes with a two-tailed 95\% confidence / credible interval excluding zero when \(r = 0\). We calculated statistical power as the proportion of models that estimated slopes with a 95\% confidence / credible interval excluding zero when \(r > 0\). We calculated two-tailed 95\% bootstrap confidence intervals for these false positive rates and statistical power estimates with 1,000 bootstrap iterations.

\hypertarget{reanalyses}{%
\subsection{Reanalyses}\label{reanalyses}}

We searched the individual analyses from our literature review for statistically significant cross-national correlations with available primary or secondary data. We restricted our search to one analysis per paper, and searched until we had a set of twelve analyses, six from economic development papers and six from cultural values papers, for which we were able to replicate the original result (i.e.~find a cross-national correlation with the same sign and roughly the same effect size). We also ensured that at least one analysis was a multilevel model, with multiple observations per nation.

The twelve analyses that we settled on\textsuperscript{13,14,16,55--63} were mostly bivariate cross-national correlations, except for two. One analysis\textsuperscript{14} additionally controlled for log gross national income, and another analysis\textsuperscript{60} is a multilevel model including random intercepts for nations and several individual-level and national-level covariates (see Model 5 in original paper). Before running any additional models, we pre-registered these twelve analyses on the Open Science Framework on 25\textsuperscript{th} January 2022 (\url{https://osf.io/u8tbf}). We endeavoured to keep the sample sizes of our reanalyses as close to the original analyses as possible, though there were some deviations (see Supplementary Table \ref{tab:tableDeviations}). Despite these slight deviations from the original analyses, all models reported in Figure \ref{fig:plotReplications1} are fitted to the same number of data points, meaning that any changes in effect sizes are solely due to controlling for non-independence.

For each individual analysis, we ran four models: (1) a naive regression replicating the original finding, (2) a regression including a Gaussian process allowing nation random intercepts to covary according to a geographic proximity matrix from latitude and longitude values, (3) a regression including nation random intercepts that covaried according to a linguistic proximity matrix, and (4) a regression including both a geographic Gaussian process and nation random intercepts with linguistic covariance. See Supplementary Methods for full models.

We fitted these models using the brms R package\textsuperscript{81}. Our choice of priors was based on prior predictive simulation. All models converged normally (\(\hat{R}\) \textless{} 1.1), though for some models we resorted to using approximate Gaussian processes\textsuperscript{94} to reach convergence. The assumptions of these models were met: residuals were approximately normally distributed, though this was not formally tested.

\hypertarget{reproducibility}{%
\subsection{Reproducibility}\label{reproducibility}}

All data and code are accessible on GitHub\textsuperscript{95}. We used the targets R package\textsuperscript{96} to create a reproducible data analysis pipeline and the papaja R package\textsuperscript{97} to reproducibly generate the manuscript.

\hypertarget{ethics}{%
\subsection{Ethics}\label{ethics}}

We did not apply for ethical approval through an ethics board as we analysed only publicly available and simulated data in this study.

\newpage
\nolinenumbers

\hypertarget{data-availability}{%
\section{Data Availability}\label{data-availability}}

All data to reproduce the statistical analyses in this manuscript can be found on GitHub\textsuperscript{95}. Data on human development were retrieved from the United Nations Development Programme (\url{https://hdr.undp.org/en/content/download-data}). Data on GDP per capita, annual GDP per capita growth, and the Gini coefficient were retrieved from the World Bank (\url{https://data.worldbank.org/}). Data on traditional vs.~secular values and survival vs.~self-expression values were retrieved from the World Values Survey (\url{https://www.worldvaluessurvey.org/wvs.jsp}). Data on cultural tightness were retrieved from the OSF repository for ref\textsuperscript{83} (\url{https://osf.io/47pe8/}). The review data generated in this study are provided in Supplementary Data 1. All other datasets (e.g., for replications) were retrieved from tables and supplementary tables directly from papers cited in the main text\textsuperscript{13,14,16,55--63} - these datasets can be found in our GitHub repository\textsuperscript{95}.

\hypertarget{code-availability}{%
\section{Code Availability}\label{code-availability}}

All code to reproduce the statistical analyses in this manuscript can be found on GitHub\textsuperscript{95}.

\newpage

\hypertarget{references}{%
\section{References}\label{references}}

\begingroup

\hypertarget{refs}{}
\begin{CSLReferences}{0}{0}
\leavevmode\vadjust pre{\hypertarget{ref-Caselli2005}{}}%
\CSLLeftMargin{1. }%
\CSLRightInline{Caselli, F. \href{https://doi.org/10.1016/S1574-0684(05)01009-9}{Accounting for cross-country income differences}. in (eds. Aghion, P. \& Durlauf, S. N.) vol. 1 679--741 (Elsevier, 2005).}

\leavevmode\vadjust pre{\hypertarget{ref-Austin2012}{}}%
\CSLLeftMargin{2. }%
\CSLRightInline{Austin, K. F. \& McKinney, L. A. \href{https://doi.org/10.1525/sop.2012.55.3.421}{Disease, war, hunger, and deprivation: A cross-national investigation of the determinants of life expectancy in less-developed and sub-{S}aharan {A}frican nations}. \emph{Sociological Perspectives} \textbf{55}, 421--447 (2012).}

\leavevmode\vadjust pre{\hypertarget{ref-Rai2013}{}}%
\CSLLeftMargin{3. }%
\CSLRightInline{Rai, D., Zitko, P., Jones, K., Lynch, J. \& Araya, R. \href{https://doi.org/10.1192/bjp.bp.112.112482}{Country- and individual-level socioeconomic determinants of depression: Multilevel cross-national comparison}. \emph{British Journal of Psychiatry} \textbf{202}, 195--203 (2013).}

\leavevmode\vadjust pre{\hypertarget{ref-Diener2009}{}}%
\CSLLeftMargin{4. }%
\CSLRightInline{Diener, E., Diener, M. \& Diener, C. Factors predicting the subjective well-being of nations. in \emph{Culture and well-being: The collected works of {E}d {D}iener} (ed. Diener, E.) 43--70 (Springer Netherlands, 2009). doi:\href{https://doi.org/10.1007/978-90-481-2352-0_3}{10.1007/978-90-481-2352-0\_3}.}

\leavevmode\vadjust pre{\hypertarget{ref-Kirkcaldy2004}{}}%
\CSLLeftMargin{5. }%
\CSLRightInline{Kirkcaldy, B., Furnham, A. \& Siefen, G. \href{https://doi.org/10.1027/1016-9040.9.2.107}{The relationship between health efficacy, educational attainment, and well-being among 30 nations}. \emph{European Psychologist} \textbf{9}, 107--119 (2004).}

\leavevmode\vadjust pre{\hypertarget{ref-White2021}{}}%
\CSLLeftMargin{6. }%
\CSLRightInline{White, C. J. M., Muthukrishna, M. \& Norenzayan, A. \href{https://doi.org/10.1073/pnas.2109650118}{Cultural similarity among coreligionists within and between countries}. \emph{Proceedings of the National Academy of Sciences} \textbf{118}, e2109650118 (2021).}

\leavevmode\vadjust pre{\hypertarget{ref-Henrich2010}{}}%
\CSLLeftMargin{7. }%
\CSLRightInline{Henrich, J., Heine, S. J. \& Norenzayan, A. \href{https://doi.org/10.1017/S0140525X0999152X}{The weirdest people in the world?} \emph{Behavioral and Brain Sciences} \textbf{33}, 61--83 (2010).}

\leavevmode\vadjust pre{\hypertarget{ref-Pollet2014}{}}%
\CSLLeftMargin{8. }%
\CSLRightInline{Pollet, T. V., Tybur, J. M., Frankenhuis, W. E. \& Rickard, I. J. \href{https://doi.org/10.1007/s12110-014-9206-3}{What can cross-cultural correlations teach us about human nature?} \emph{Human Nature} \textbf{25}, 410--429 (2014).}

\leavevmode\vadjust pre{\hypertarget{ref-Benhabib1994}{}}%
\CSLLeftMargin{9. }%
\CSLRightInline{Benhabib, J. \& Spiegel, M. M. \href{https://doi.org/10.1016/0304-3932(94)90047-7}{The role of human capital in economic development: Evidence from aggregate cross-country data}. \emph{Journal of Monetary Economics} \textbf{34}, 143--173 (1994).}

\leavevmode\vadjust pre{\hypertarget{ref-Comin2010}{}}%
\CSLLeftMargin{10. }%
\CSLRightInline{Comin, D., Easterly, W. \& Gong, E. \href{http://www.jstor.org/stable/25760309}{Was the wealth of nations determined in 1000 {BC}?} \emph{American Economic Journal: Macroeconomics} \textbf{2}, 65--97 (2010).}

\leavevmode\vadjust pre{\hypertarget{ref-LaPorta1997}{}}%
\CSLLeftMargin{11. }%
\CSLRightInline{La Porta, R., Lopez-De-Silanes, F., Shleifer, A. \& Vishny, R. W. \href{https://doi.org/10.1111/j.1540-6261.1997.tb02727.x}{Legal determinants of external finance}. \emph{The Journal of Finance} \textbf{52}, 1131--1150 (1997).}

\leavevmode\vadjust pre{\hypertarget{ref-Sachs2001}{}}%
\CSLLeftMargin{12. }%
\CSLRightInline{Sachs, J. D. \& Warner, A. M. \href{https://doi.org/10.1016/S0014-2921(01)00125-8}{The curse of natural resources}. \emph{European Economic Review} \textbf{45}, 827--838 (2001).}

\leavevmode\vadjust pre{\hypertarget{ref-Fincher2008}{}}%
\CSLLeftMargin{13. }%
\CSLRightInline{Fincher, C. L., Thornhill, R., Murray, D. R. \& Schaller, M. \href{https://doi.org/10.1098/rspb.2008.0094}{Pathogen prevalence predicts human cross-cultural variability in individualism/collectivism}. \emph{Proceedings of the Royal Society B: Biological Sciences} \textbf{275}, 1279--1285 (2008).}

\leavevmode\vadjust pre{\hypertarget{ref-Gelfand2011}{}}%
\CSLLeftMargin{14. }%
\CSLRightInline{Gelfand, M. J. \emph{et al.} \href{https://doi.org/10.1126/science.1197754}{Differences between tight and loose cultures: A 33-nation study}. \emph{Science} \textbf{332}, 1100--1104 (2011).}

\leavevmode\vadjust pre{\hypertarget{ref-Hofstede2001}{}}%
\CSLLeftMargin{15. }%
\CSLRightInline{Hofstede, G. \emph{Culture's consequences: Comparing values, behaviors, institutions and organizations across nations}. (Sage Publications, 2001).}

\leavevmode\vadjust pre{\hypertarget{ref-Inglehart2000}{}}%
\CSLLeftMargin{16. }%
\CSLRightInline{Inglehart, R. \& Baker, W. E. \href{https://doi.org/10.2307/2657288}{Modernization, cultural change, and the persistence of traditional values}. \emph{American Sociological Review} \textbf{65}, 19--51 (2000).}

\leavevmode\vadjust pre{\hypertarget{ref-Awad2018}{}}%
\CSLLeftMargin{17. }%
\CSLRightInline{Awad, E. \emph{et al.} \href{https://doi.org/10.1038/s41586-018-0637-6}{The moral machine experiment}. \emph{Nature} \textbf{563}, 59--64 (2018).}

\leavevmode\vadjust pre{\hypertarget{ref-Rhoads2021}{}}%
\CSLLeftMargin{18. }%
\CSLRightInline{Rhoads, S. A., Gunter, D., Ryan, R. M. \& Marsh, A. A. \href{https://doi.org/10.1177/0956797621994767}{Global variation in subjective well-being predicts seven forms of altruism}. \emph{Psychological Science} \textbf{32}, 1247--1261 (2021).}

\leavevmode\vadjust pre{\hypertarget{ref-Schulz2019}{}}%
\CSLLeftMargin{19. }%
\CSLRightInline{Schulz, J. F., Bahrami-Rad, D., Beauchamp, J. P. \& Henrich, J. \href{https://doi.org/10.1126/science.aau5141}{The {C}hurch, intensive kinship, and global psychological variation}. \emph{Science} \textbf{366}, eaau5141 (2019).}

\leavevmode\vadjust pre{\hypertarget{ref-Thomson2018}{}}%
\CSLLeftMargin{20. }%
\CSLRightInline{Thomson, R. \emph{et al.} \href{https://doi.org/10.1073/pnas.1713191115}{Relational mobility predicts social behaviors in 39 countries and is tied to historical farming and threat}. \emph{Proceedings of the National Academy of Sciences} \textbf{115}, 7521--7526 (2018).}

\leavevmode\vadjust pre{\hypertarget{ref-Kissling2008}{}}%
\CSLLeftMargin{21. }%
\CSLRightInline{Kissling, W. D. \& Carl, G. \href{https://doi.org/10.1111/j.1466-8238.2007.00334.x}{Spatial autocorrelation and the selection of simultaneous autoregressive models}. \emph{Global Ecology and Biogeography} \textbf{17}, 59--71 (2008).}

\leavevmode\vadjust pre{\hypertarget{ref-Hewlett2002}{}}%
\CSLLeftMargin{22. }%
\CSLRightInline{Hewlett, B. S., DeSilvestri, A. \& Guglielmino, C. R. \href{https://doi.org/10.1086/339379}{Semes and genes in {Africa}}. \emph{Current Anthropology} \textbf{43}, 313--321 (2002).}

\leavevmode\vadjust pre{\hypertarget{ref-Nunn2012}{}}%
\CSLLeftMargin{23. }%
\CSLRightInline{Nunn, N. \& Puga, D. \href{https://doi.org/10.1162/REST_a_00161}{Ruggedness: The blessing of bad geography in {A}frica}. \emph{The Review of Economics and Statistics} \textbf{94}, 20--36 (2012).}

\leavevmode\vadjust pre{\hypertarget{ref-Tobler1970}{}}%
\CSLLeftMargin{24. }%
\CSLRightInline{Tobler, W. R. \href{https://doi.org/10.2307/143141}{A computer movie simulating urban growth in the {D}etroit region}. \emph{Economic Geography} \textbf{46}, 234--240 (1970).}

\leavevmode\vadjust pre{\hypertarget{ref-Tylor1889}{}}%
\CSLLeftMargin{25. }%
\CSLRightInline{Tylor, E. B. \href{https://doi.org/10.2307/2842423}{On a method of investigating the development of institutions; applied to laws of marriage and descent}. \emph{The Journal of the Anthropological Institute of Great Britain and Ireland} \textbf{18}, 245--272 (1889).}

\leavevmode\vadjust pre{\hypertarget{ref-Naroll1961}{}}%
\CSLLeftMargin{26. }%
\CSLRightInline{Naroll, R. \href{https://doi.org/10.1086/287778}{Two solutions to {G}alton's {P}roblem}. \emph{Philosophy of Science} \textbf{28}, 15--39 (1961).}

\leavevmode\vadjust pre{\hypertarget{ref-Naroll1965}{}}%
\CSLLeftMargin{27. }%
\CSLRightInline{Naroll, R. \href{http://www.jstor.org/stable/40969817}{Galton's {P}roblem: The logic of cross-cultural analysis}. \emph{Social Research} \textbf{32}, 428--451 (1965).}

\leavevmode\vadjust pre{\hypertarget{ref-Murdock1969}{}}%
\CSLLeftMargin{28. }%
\CSLRightInline{Murdock, G. P. \& White, D. R. \href{https://doi.org/10.2307/3772907}{Standard cross-cultural sample}. \emph{Ethnology} \textbf{8}, 329--369 (1969).}

\leavevmode\vadjust pre{\hypertarget{ref-Gray2009}{}}%
\CSLLeftMargin{29. }%
\CSLRightInline{Gray, R. D., Drummond, A. J. \& Greenhill, S. J. \href{https://doi.org/10.1126/science.1166858}{Language phylogenies reveal expansion pulses and pauses in {Pacific} settlement}. \emph{Science} \textbf{323}, 479--483 (2009).}

\leavevmode\vadjust pre{\hypertarget{ref-Green1999}{}}%
\CSLLeftMargin{30. }%
\CSLRightInline{Green, R. \& Pawley, A. Early {Oceanic} architectural forms and settlement patterns: Linguistic, archaeological and ethnological perspectives. in \emph{Archaeology and language {III}: Artefacts, languages and texts} (eds. Blench, R. \& Spriggs, M.) 31--89 (Routledge, 1999).}

\leavevmode\vadjust pre{\hypertarget{ref-Jarque1987}{}}%
\CSLLeftMargin{31. }%
\CSLRightInline{Jarque, C. M. \& Bera, A. K. \href{https://doi.org/10.2307/1403192}{A test for normality of observations and regression residuals}. \emph{International Statistical Review / Revue Internationale de Statistique} \textbf{55}, 163--172 (1987).}

\leavevmode\vadjust pre{\hypertarget{ref-Legendre1993}{}}%
\CSLLeftMargin{32. }%
\CSLRightInline{Legendre, P. \href{https://doi.org/10.2307/1939924}{Spatial autocorrelation: Trouble or new paradigm?} \emph{Ecology} \textbf{74}, 1659--1673 (1993).}

\leavevmode\vadjust pre{\hypertarget{ref-Roberts2013}{}}%
\CSLLeftMargin{33. }%
\CSLRightInline{Roberts, J., Seán AND Winters. \href{https://doi.org/10.1371/journal.pone.0070902}{Linguistic diversity and traffic accidents: Lessons from statistical studies of cultural traits}. \emph{PLOS ONE} \textbf{8}, 1--13 (2013).}

\leavevmode\vadjust pre{\hypertarget{ref-Lichstein2002}{}}%
\CSLLeftMargin{34. }%
\CSLRightInline{Lichstein, J. W., Simons, T. R., Shriner, S. A. \& Franzreb, K. E. \href{https://doi.org/10.1890/0012-9615(2002)072\%5B0445:SAAAMI\%5D2.0.CO;2}{Spatial autocorrelation and autoregressive models in ecology}. \emph{Ecological Monographs} \textbf{72}, 445--463 (2002).}

\leavevmode\vadjust pre{\hypertarget{ref-Loftin1983}{}}%
\CSLLeftMargin{35. }%
\CSLRightInline{Loftin, C. \& Ward, S. K. \href{https://doi.org/10.2307/2095150}{A spatial autocorrelation model of the effects of population density on fertility}. \emph{American Sociological Review} \textbf{48}, 121--128 (1983).}

\leavevmode\vadjust pre{\hypertarget{ref-Ferguson1997}{}}%
\CSLLeftMargin{36. }%
\CSLRightInline{Ferguson, J. Anthropology and its evil twin. in (eds. Cooper, F. \& Packard, R.) 150--175 (University of California Press Berkeley, 1997).}

\leavevmode\vadjust pre{\hypertarget{ref-Dow2008}{}}%
\CSLLeftMargin{37. }%
\CSLRightInline{Dow, M. M. \& Eff, E. A. \href{https://doi.org/10.1177/1069397107311186}{Global, regional, and local network autocorrelation in the standard cross-cultural sample}. \emph{Cross-Cultural Research} \textbf{42}, 148--171 (2008).}

\leavevmode\vadjust pre{\hypertarget{ref-Eff2004}{}}%
\CSLLeftMargin{38. }%
\CSLRightInline{Eff, E. A. Does {M}r. {G}alton still have a problem? Autocorrelation in the standard cross-cultural sample. \emph{World Cultures} \textbf{15}, 153--170 (2004).}

\leavevmode\vadjust pre{\hypertarget{ref-Symonds2014}{}}%
\CSLLeftMargin{39. }%
\CSLRightInline{Symonds, M. R. E. \& Blomberg, S. P. A primer on phylogenetic generalised least squares. in \emph{Modern phylogenetic comparative methods and their application in evolutionary biology: Concepts and practice} (ed. Garamszegi, L. Z.) 105--130 (Springer Berlin Heidelberg, 2014). doi:\href{https://doi.org/10.1007/978-3-662-43550-2_5}{10.1007/978-3-662-43550-2\_5}.}

\leavevmode\vadjust pre{\hypertarget{ref-Watts2018}{}}%
\CSLLeftMargin{40. }%
\CSLRightInline{Watts, J., Sheehan, O., Bulbulia, J., Gray, R. D. \& Atkinson, Q. D. \href{https://doi.org/10.1038/s41562-018-0379-3}{Christianity spread faster in small, politically structured societies}. \emph{Nature Human Behaviour} \textbf{2}, 559--564 (2018).}

\leavevmode\vadjust pre{\hypertarget{ref-Atkinson2016}{}}%
\CSLLeftMargin{41. }%
\CSLRightInline{Atkinson, Q. D., Coomber, T., Passmore, S., Greenhill, S. J. \& Kushnick, G. \href{https://doi.org/10.1371/journal.pone.0156340}{Cultural and environmental predictors of pre-{European} deforestation on {Pacific} islands}. \emph{PLOS ONE} \textbf{11}, 1--15 (2016).}

\leavevmode\vadjust pre{\hypertarget{ref-Kelly2020}{}}%
\CSLLeftMargin{42. }%
\CSLRightInline{Kelly, M. \href{http://ssrn.com/abstract=3688200}{Understanding persistence}. \emph{CEPR Discussion Paper No. DP15246} (2020).}

\leavevmode\vadjust pre{\hypertarget{ref-Bromham2018}{}}%
\CSLLeftMargin{43. }%
\CSLRightInline{Bromham, L., Hua, X., Cardillo, M., Schneemann, H. \& Greenhill, S. J. \href{https://doi.org/10.1098/rsos.181100}{Parasites and politics: Why cross-cultural studies must control for relatedness, proximity and covariation}. \emph{Royal Society Open Science} \textbf{5}, 181100 (2018).}

\leavevmode\vadjust pre{\hypertarget{ref-Bromham2021}{}}%
\CSLLeftMargin{44. }%
\CSLRightInline{Bromham, L., Skeels, A., Schneemann, H., Dinnage, R. \& Hua, X. \href{https://doi.org/10.1038/s41562-020-01039-8}{There is little evidence that spicy food in hot countries is an adaptation to reducing infection risk}. \emph{Nature Human Behaviour} \textbf{5}, 878--891 (2021).}

\leavevmode\vadjust pre{\hypertarget{ref-Currie2012}{}}%
\CSLLeftMargin{45. }%
\CSLRightInline{Currie, T. E. \& Mace, R. \href{https://doi.org/10.1017/S0140525X11000963}{Analyses do not support the parasite-stress theory of human sociality}. \emph{Behavioral and Brain Sciences} \textbf{35}, 83--85 (2012).}

\leavevmode\vadjust pre{\hypertarget{ref-Passmore2022}{}}%
\CSLLeftMargin{46. }%
\CSLRightInline{Passmore, S. \& Watts, J. {WEIRD} people and the {W}estern {C}hurch: Who made whom? \emph{Religion, Brain \& Behavior} 1--58 (2022) doi:\href{https://doi.org/10.1080/2153599X.2021.1991459}{10.1080/2153599X.2021.1991459}.}

\leavevmode\vadjust pre{\hypertarget{ref-hdi}{}}%
\CSLLeftMargin{47. }%
\CSLRightInline{United Nations Development Programme. \emph{Human development report}. \url{http://hdr.undp.org/en/composite/HDI} (2021).}

\leavevmode\vadjust pre{\hypertarget{ref-Schulz2022}{}}%
\CSLLeftMargin{48. }%
\CSLRightInline{Schulz, J. F. \href{https://doi.org/10.1093/ej/ueac027}{Kin networks and institutional development}. \emph{The Economic Journal} \textbf{132}, 2578--2613 (2022).}

\leavevmode\vadjust pre{\hypertarget{ref-Conley1999}{}}%
\CSLLeftMargin{49. }%
\CSLRightInline{Conley, T. G. \href{https://doi.org/10.1016/S0304-4076(98)00084-0}{{GMM} estimation with cross sectional dependence}. \emph{Journal of Econometrics} \textbf{92}, 1--45 (1999).}

\leavevmode\vadjust pre{\hypertarget{ref-Conley2010}{}}%
\CSLLeftMargin{50. }%
\CSLRightInline{Conley, T. G. Spatial econometrics. in \emph{Microeconometrics} (eds. Durlauf, S. N. \& Blume, L. E.) 303--313 (Palgrave Macmillan, 2010).}

\leavevmode\vadjust pre{\hypertarget{ref-Currie2009}{}}%
\CSLLeftMargin{51. }%
\CSLRightInline{Currie, T. E. \& Mace, R. \href{https://doi.org/10.1073/pnas.0804698106}{Political complexity predicts the spread of ethnolinguistic groups}. \emph{Proceedings of the National Academy of Sciences} \textbf{106}, 7339--7344 (2009).}

\leavevmode\vadjust pre{\hypertarget{ref-McElreath2020}{}}%
\CSLLeftMargin{52. }%
\CSLRightInline{McElreath, R. \emph{Statistical rethinking: A {B}ayesian course with examples in {R} and {Stan}}. (CRC Press, 2020).}

\leavevmode\vadjust pre{\hypertarget{ref-Neal1998}{}}%
\CSLLeftMargin{53. }%
\CSLRightInline{Neal, R. M. Regression and classification using {Gaussian} process priors. in \emph{Bayesian statistics} (eds. Bernardo, J. M., Berger, J. O., Dawid, A. P. \& Smith, A. F. M.) vol. 6 475--501 (Oxford University Press).}

\leavevmode\vadjust pre{\hypertarget{ref-deVillemereuil2014}{}}%
\CSLLeftMargin{54. }%
\CSLRightInline{Villemereuil, P. de \& Nakagawa, S. General quantitative genetic methods for comparative biology. in \emph{Modern phylogenetic comparative methods and their application in evolutionary biology: Concepts and practice} (ed. Garamszegi, L. Z.) 287--303 (Springer Berlin Heidelberg, 2014). doi:\href{https://doi.org/10.1007/978-3-662-43550-2_11}{10.1007/978-3-662-43550-2\_11}.}

\leavevmode\vadjust pre{\hypertarget{ref-Beck2003}{}}%
\CSLLeftMargin{55. }%
\CSLRightInline{Beck, T., Demirgäç-Kunt, A. \& Levine, R. \href{https://doi.org/10.1016/S0304-405X(03)00144-2}{Law, endowments, and finance}. \emph{Journal of Financial Economics} \textbf{70}, 137--181 (2003).}

\leavevmode\vadjust pre{\hypertarget{ref-Beck2005}{}}%
\CSLLeftMargin{56. }%
\CSLRightInline{Beck, T., Demirgäç-Kunt, A. \& Levine, R. {SME}s, growth, and poverty: Cross-country evidence. \emph{Journal of Economic Growth} \textbf{10}, 199--229 (2005).}

\leavevmode\vadjust pre{\hypertarget{ref-Bockstette2002}{}}%
\CSLLeftMargin{57. }%
\CSLRightInline{Bockstette, V., Chanda, A. \& Putterman, L. States and markets: The advantage of an early start. \emph{Journal of Economic growth} \textbf{7}, 347--369 (2002).}

\leavevmode\vadjust pre{\hypertarget{ref-Easterly2003}{}}%
\CSLLeftMargin{58. }%
\CSLRightInline{Easterly, W. \& Levine, R. \href{https://doi.org/10.1016/S0304-3932(02)00200-3}{Tropics, germs, and crops: How endowments influence economic development}. \emph{Journal of Monetary Economics} \textbf{50}, 3--39 (2003).}

\leavevmode\vadjust pre{\hypertarget{ref-Easterly2007}{}}%
\CSLLeftMargin{59. }%
\CSLRightInline{Easterly, W. \href{https://doi.org/10.1016/j.jdeveco.2006.11.002}{Inequality does cause underdevelopment: Insights from a new instrument}. \emph{Journal of Development Economics} \textbf{84}, 755--776 (2007).}

\leavevmode\vadjust pre{\hypertarget{ref-Skidmore2002}{}}%
\CSLLeftMargin{60. }%
\CSLRightInline{Skidmore, M. \& Toya, H. \href{https://doi.org/10.1093/ei/40.4.664}{Do natural disasters promote long-run growth?} \emph{Economic Inquiry} \textbf{40}, 664--687 (2002).}

\leavevmode\vadjust pre{\hypertarget{ref-Adamczyk2009}{}}%
\CSLLeftMargin{61. }%
\CSLRightInline{Adamczyk, A. \& Pitt, C. \href{https://doi.org/10.1016/j.ssresearch.2009.01.002}{Shaping attitudes about homosexuality: The role of religion and cultural context}. \emph{Social Science Research} \textbf{38}, 338--351 (2009).}

\leavevmode\vadjust pre{\hypertarget{ref-Alesina2013}{}}%
\CSLLeftMargin{62. }%
\CSLRightInline{Alesina, A., Giuliano, P. \& Nunn, N. On the origins of gender roles: Women and the plough. \emph{Quarterly Journal of Economics} \textbf{128}, 469--530 (2013).}

\leavevmode\vadjust pre{\hypertarget{ref-Knack1997}{}}%
\CSLLeftMargin{63. }%
\CSLRightInline{Knack, S. \& Keefer, P. \href{https://doi.org/10.1162/003355300555475}{Does social capital have an economic payoff? A cross-country investigation}. \emph{The Quarterly Journal of Economics} \textbf{112}, 1251--1288 (1997).}

\leavevmode\vadjust pre{\hypertarget{ref-Sookias2018}{}}%
\CSLLeftMargin{64. }%
\CSLRightInline{Sookias, R. B., Passmore, S. \& Atkinson, Q. D. \href{https://doi.org/10.1098/rsos.171411}{Deep cultural ancestry and human development indicators across nation states}. \emph{Royal Society Open Science} \textbf{5}, 171411 (2018).}

\leavevmode\vadjust pre{\hypertarget{ref-Voth2021}{}}%
\CSLLeftMargin{65. }%
\CSLRightInline{Voth, H.-J. Persistence -- myth and mystery. in \emph{The handbook of historical economics} (eds. Bisin, A. \& Federico, G.) 243--267 (Academic Press, 2021). doi:\href{https://doi.org/10.1016/B978-0-12-815874-6.00015-0}{10.1016/B978-0-12-815874-6.00015-0}.}

\leavevmode\vadjust pre{\hypertarget{ref-Smith2017}{}}%
\CSLLeftMargin{66. }%
\CSLRightInline{Smith, M. D., Rabbitt, M. P. \& Coleman- Jensen, A. \href{https://doi.org/10.1016/j.worlddev.2017.01.006}{Who are the world's food insecure? New evidence from the {F}ood and {A}griculture {O}rganization's {F}ood {I}nsecurity {E}xperience {S}cale}. \emph{World Development} \textbf{93}, 402--412 (2017).}

\leavevmode\vadjust pre{\hypertarget{ref-Hastie2017}{}}%
\CSLLeftMargin{67. }%
\CSLRightInline{Hastie, T. J. \& Tibshirani, R. J. \emph{Generalized additive models}. (Routledge, 2017).}

\leavevmode\vadjust pre{\hypertarget{ref-Muthukrishna2020}{}}%
\CSLLeftMargin{68. }%
\CSLRightInline{Muthukrishna, M. \emph{et al.} \href{https://doi.org/10.1177/0956797620916782}{Beyond western, educated, industrial, rich, and democratic (WEIRD) psychology: Measuring and mapping scales of cultural and psychological distance}. \emph{Psychological Science} \textbf{31}, 678--701 (2020).}

\leavevmode\vadjust pre{\hypertarget{ref-Spolaore2009}{}}%
\CSLLeftMargin{69. }%
\CSLRightInline{Spolaore, E. \& Wacziarg, R. The diffusion of development. \emph{The Quarterly Journal of Economics} \textbf{124}, 469--529 (2009).}

\leavevmode\vadjust pre{\hypertarget{ref-Kyritsis2022}{}}%
\CSLLeftMargin{70. }%
\CSLRightInline{Kyritsis, T., Matthews, L. J., Welch, D. \& Atkinson, Q. D. \href{https://doi.org/10.1017/ehs.2022.40}{Shared cultural ancestry predicts the global diffusion of democracy}. \emph{Evolutionary Human Sciences} \textbf{4}, e42 (2022).}

\leavevmode\vadjust pre{\hypertarget{ref-Matthews2016}{}}%
\CSLLeftMargin{71. }%
\CSLRightInline{Matthews, L. J., Passmore, S., Richard, P. M., Gray, R. D. \& Atkinson, Q. D. \href{https://doi.org/10.1371/journal.pone.0152979}{Shared cultural history as a predictor of political and economic changes among nation states}. \emph{PLOS ONE} \textbf{11}, 1--18 (2016).}

\leavevmode\vadjust pre{\hypertarget{ref-Trouillot2016}{}}%
\CSLLeftMargin{72. }%
\CSLRightInline{Trouillot, M. \emph{Global transformations: Anthropology and the modern world}. (Springer, 2016).}

\leavevmode\vadjust pre{\hypertarget{ref-Wolf2010}{}}%
\CSLLeftMargin{73. }%
\CSLRightInline{Wolf, E. R. Europe and the people without history. \emph{University of California Press} (2010).}

\leavevmode\vadjust pre{\hypertarget{ref-Smaldino2016}{}}%
\CSLLeftMargin{74. }%
\CSLRightInline{Smaldino, P. E. \& McElreath, R. \href{https://doi.org/10.1098/rsos.160384}{The natural selection of bad science}. \emph{Royal Society Open Science} \textbf{3}, 160384 (2016).}

\leavevmode\vadjust pre{\hypertarget{ref-Liddell2018}{}}%
\CSLLeftMargin{75. }%
\CSLRightInline{Liddell, T. M. \& Kruschke, J. K. \href{https://doi.org/10.1016/j.jesp.2018.08.009}{Analyzing ordinal data with metric models: What could possibly go wrong?} \emph{Journal of Experimental Social Psychology} \textbf{79}, 328--348 (2018).}

\leavevmode\vadjust pre{\hypertarget{ref-Nicholson2017}{}}%
\CSLLeftMargin{76. }%
\CSLRightInline{Nicholson, J. S., Deboeck, P. R. \& Howard, W. \href{https://doi.org/10.1177/0165025415618275}{Attrition in developmental psychology: A review of modern missing data reporting and practices}. \emph{International Journal of Behavioral Development} \textbf{41}, 143--153 (2017).}

\leavevmode\vadjust pre{\hypertarget{ref-Tipton2019}{}}%
\CSLLeftMargin{77. }%
\CSLRightInline{Tipton, E., Pustejovsky, J. E. \& Ahmadi, H. \href{https://doi.org/10.1002/jrsm.1339}{Current practices in meta-regression in psychology, education, and medicine}. \emph{Research Synthesis Methods} \textbf{10}, 180--194 (2019).}

\leavevmode\vadjust pre{\hypertarget{ref-Chambers2021}{}}%
\CSLLeftMargin{78. }%
\CSLRightInline{Chambers, C. D. \& Tzavella, L. The past, present and future of {Registered Reports}. \emph{Nature Human Behaviour} \textbf{6}, 29--42 (2021).}

\leavevmode\vadjust pre{\hypertarget{ref-Deffner2022}{}}%
\CSLLeftMargin{79. }%
\CSLRightInline{Deffner, D., Rohrer, J. M. \& McElreath, R. \href{https://doi.org/10.1177/25152459221106366}{A causal framework for cross-cultural generalizability}. \emph{Advances in Methods and Practices in Psychological Science} \textbf{5}, 25152459221106366 (2022).}

\leavevmode\vadjust pre{\hypertarget{ref-rstan}{}}%
\CSLLeftMargin{80. }%
\CSLRightInline{Stan Development Team. \href{http://mc-stan.org/}{{RStan}: The {R} interface to {Stan}}. (2020).}

\leavevmode\vadjust pre{\hypertarget{ref-Burkner2017}{}}%
\CSLLeftMargin{81. }%
\CSLRightInline{Bürkner, P.-C. \href{https://doi.org/10.18637/jss.v080.i01}{{brms}: An {R} package for {Bayesian} multilevel models using {Stan}}. \emph{Journal of Statistical Software} \textbf{80}, 1--28 (2017).}

\leavevmode\vadjust pre{\hypertarget{ref-Oishi2013}{}}%
\CSLLeftMargin{82. }%
\CSLRightInline{Oishi, S. \href{https://doi.org/10.1146/annurev-psych-030413-152156}{Socioecological psychology}. \emph{Annual Review of Psychology} \textbf{65}, 581--609 (2014).}

\leavevmode\vadjust pre{\hypertarget{ref-Gelfand2021}{}}%
\CSLLeftMargin{83. }%
\CSLRightInline{Gelfand, M. J. \emph{et al.} \href{https://doi.org/10.1016/S2542-5196(20)30301-6}{The relationship between cultural tightness--looseness and {COVID-19} cases and deaths: A global analysis}. \emph{The Lancet Planetary Health} \textbf{5}, e135--e144 (2021).}

\leavevmode\vadjust pre{\hypertarget{ref-Brownrigg2018}{}}%
\CSLLeftMargin{84. }%
\CSLRightInline{Brownrigg, R. \emph{\href{https://CRAN.R-project.org/package=maps}{{maps}: Draw geographical maps}}. (2018).}

\leavevmode\vadjust pre{\hypertarget{ref-Hijmans2019}{}}%
\CSLLeftMargin{85. }%
\CSLRightInline{Hijmans, R. J. \emph{\href{https://CRAN.R-project.org/package=geosphere}{{geosphere}: Spherical trigonometry}}. (2019).}

\leavevmode\vadjust pre{\hypertarget{ref-Glottolog}{}}%
\CSLLeftMargin{86. }%
\CSLRightInline{Hammarström, H., Forkel, R., Haspelmath, M. \& Bank, S. \emph{Glottolog 3.0}. (Max Planck Institute for the Science of Human History, 2017). doi:\href{https://doi.org/10.5281/zenodo.4061162}{10.5281/zenodo.4061162}.}

\leavevmode\vadjust pre{\hypertarget{ref-Ethnologue}{}}%
\CSLLeftMargin{87. }%
\CSLRightInline{Eberhard, D. M., Simons, G. F. \& Fennig, C. D. \emph{\href{https://www.ethnologue.com/}{Ethnologue: Languages of the world}}. (SIL International, 2018).}

\leavevmode\vadjust pre{\hypertarget{ref-Eff2008}{}}%
\CSLLeftMargin{88. }%
\CSLRightInline{Eff, E. A. Weight matrices for cultural proximity: Deriving weights from a language phylogeny. \emph{Structure and Dynamics} \textbf{3}, (2008).}

\leavevmode\vadjust pre{\hypertarget{ref-Page2021}{}}%
\CSLLeftMargin{89. }%
\CSLRightInline{Page, M. J. \emph{et al.} \href{https://doi.org/10.1136/bmj.n71}{The {PRISMA} 2020 statement: An updated guideline for reporting systematic reviews}. \emph{BMJ} \textbf{372}, (2021).}

\leavevmode\vadjust pre{\hypertarget{ref-Tiefelsdorf2007}{}}%
\CSLLeftMargin{90. }%
\CSLRightInline{Tiefelsdorf, M. \& Griffith, D. A. \href{https://doi.org/10.1068/a37378}{Semiparametric filtering of spatial autocorrelation: The eigenvector approach}. \emph{Environment and Planning A: Economy and Space} \textbf{39}, 1193--1221 (2007).}

\leavevmode\vadjust pre{\hypertarget{ref-DeHoyos2006}{}}%
\CSLLeftMargin{91. }%
\CSLRightInline{De Hoyos, R. E. \& Sarafidis, V. \href{https://doi.org/10.1177/1536867X0600600403}{Testing for cross-sectional dependence in panel-data models}. \emph{The Stata Journal} \textbf{6}, 482--496 (2006).}

\leavevmode\vadjust pre{\hypertarget{ref-Colella2019}{}}%
\CSLLeftMargin{92. }%
\CSLRightInline{Colella, F., Lalive, R., Sakalli, S. O. \& Thoenig, M. Inference with arbitrary clustering. \emph{IZA Discussion Paper No. 12584} (2019) doi:\href{https://doi.org/10.2139/ssrn.3449578}{10.2139/ssrn.3449578}.}

\leavevmode\vadjust pre{\hypertarget{ref-Duben2021}{}}%
\CSLLeftMargin{93. }%
\CSLRightInline{Düben, C. \emph{\href{https://CRAN.R-project.org/package=conleyreg}{{conleyreg}: Estimations using {C}onley standard errors}}. (2021).}

\leavevmode\vadjust pre{\hypertarget{ref-Solin2020}{}}%
\CSLLeftMargin{94. }%
\CSLRightInline{Solin, A. \& Särkkä, S. Hilbert space methods for reduced-rank {G}aussian process regression. \emph{Statistics and Computing} \textbf{30}, 419--446 (2020).}

\leavevmode\vadjust pre{\hypertarget{ref-github}{}}%
\CSLLeftMargin{95. }%
\CSLRightInline{Claessens, S., Kyritsis, T. \& Atkinson, Q. D. Cross-national analyses require additional controls to account for the non-independence of nations - ScottClaessens/crossNationalCorrelations: v1.0.0. (2023) doi:\href{https://doi.org/10.5281/zenodo.8128702}{10.5281/zenodo.8128702}.}

\leavevmode\vadjust pre{\hypertarget{ref-Landau2021}{}}%
\CSLLeftMargin{96. }%
\CSLRightInline{Landau, W. M. \href{https://doi.org/10.21105/joss.02959}{The targets {R} package: A dynamic {M}ake-like function-oriented pipeline toolkit for reproducibility and high-performance computing}. \emph{Journal of Open Source Software} \textbf{6}, 2959 (2021).}

\leavevmode\vadjust pre{\hypertarget{ref-Aust2020}{}}%
\CSLLeftMargin{97. }%
\CSLRightInline{Aust, F. \& Barth, M. \emph{\href{https://github.com/crsh/papaja}{{papaja}: {Create} {APA} manuscripts with {R Markdown}}}. (2020).}

\end{CSLReferences}

\endgroup

\newpage

\hypertarget{acknowledgements}{%
\section{Acknowledgements}\label{acknowledgements}}

This work was supported by a Royal Society of New Zealand Marsden grant (20-UOA123) to QDA.

\hypertarget{author-contributions-statement}{%
\section{Author Contributions Statement}\label{author-contributions-statement}}

SC and QDA conceived of and designed the study. SC curated the data, produced all code for analysis and visualisation, and wrote the original draft of the manuscript. TK and QDA developed and compiled the geographic and linguistic distance matrices. QDA provided funding and input on manuscript preparation and revision. All authors reviewed and edited the final draft of the manuscript.

\hypertarget{competing-interests-statement}{%
\section{Competing Interests Statement}\label{competing-interests-statement}}

The authors declare no competing interests.

\newpage
\vspace*{60mm}

\renewcommand{\figurename}{Supplementary Figure}
\renewcommand{\tablename}{Supplementary Table}
\renewcommand{\thefigure}{\arabic{figure}} \setcounter{figure}{0}
\renewcommand{\thetable}{\arabic{table}} \setcounter{table}{0}
\renewcommand{\theequation}{S\arabic{equation}} \setcounter{equation}{0}

\hypertarget{supplementary-information}{%
\section{\texorpdfstring{\textbf{Supplementary Information}}{Supplementary Information}}\label{supplementary-information}}

\setcounter{page}{1}
\centering

\noindent \small Cross-national analyses require additional controls to account for the non-independence of nations \newline
\hspace*{1cm} \small Scott Claessens\textsuperscript{1}, Thanos Kyritsis\textsuperscript{1}, \& Quentin D. Atkinson\textsuperscript{1,2} \newline

\raggedright

\noindent \footnotesize \textsuperscript{1} School of Psychology, University of Auckland, New Zealand \newline
\noindent \footnotesize \textsuperscript{2} School of Anthropology and Museum Ethnography, University of Oxford, United Kingdom
\normalsize
\newpage

\hypertarget{supplementary-methods}{%
\subsection{Supplementary Methods}\label{supplementary-methods}}

\hypertarget{bayesian-models-for-reanalysis}{%
\subsubsection{Bayesian models for reanalysis}\label{bayesian-models-for-reanalysis}}

We provide model formulae for our reanalyses of cross-national correlations, for a general bivariate case with standardised outcome \(Y\) and predictor \(X\) variables. In the naive regression model without controls for non-independence:

\begin{align}
Y_{i} &\sim \text{Normal}(\mu_{i},\sigma) \\
\mu_{i} &= \alpha + \beta X_{i} \nonumber \\
\alpha &\sim \text{Normal}(0, 0.4) \nonumber \\
\beta &\sim \text{Normal}(0, 0.4) \nonumber \\
\sigma &\sim \text{Exponential}(5) \nonumber
\end{align}

The priors in this model were arrived at by prior predictive checks, with wider priors making predictions beyond the scale of standardised outcome variables and narrower priors being too informative.

To control for spatial non-independence, we add a Gaussian process to this model and feed it a scaled geographic distance matrix \(D\) based on Euclidean distances between latitude and longitude coordinates. This distance matrix is computed internally by the \emph{brms} R package\textsuperscript{1}. The Gaussian process uses an exponentiated quadratic covariance kernel, the only covariance kernel currently supported by \emph{brms}. The model formula is:

\begin{align}
Y_{i} &\sim \text{Normal}(\mu_{i},\sigma) \\
\mu_{i} &= \alpha + \kappa_{\text{NATION}[i]} + \beta X_{i} \nonumber \\
\begin{pmatrix}
\kappa_{1} \\ \kappa_{2} \\  ... \\ \kappa_{n}
\end{pmatrix} &\sim \text{MVNormal}
\begin{pmatrix}
\begin{pmatrix}
0 \\ 0 \\ ... \\ 0
\end{pmatrix},\textbf{K}
\end{pmatrix} \nonumber \\
\textbf{K}_{ij} &= sdgp^2 \text{exp} \big (-D_{ij}^2 / (2 lscale^2) \big ) \nonumber \\
\alpha &\sim \text{Normal}(0, 0.4) \nonumber \\
\beta &\sim \text{Normal}(0, 0.4) \nonumber \\
\sigma &\sim \text{Exponential}(5) \nonumber \\
sdgp &\sim \text{Exponential}(5) \nonumber \\
lscale &\sim \text{InverseGamma}(?,?) \nonumber 
\end{align}

where \(n\) is the number of nations, and \(D^2_{ij}\) reflects the squared Euclidean distances between latitude and longitude coordinates for the \(i\)-th and \(j\)-th nations. Notice that the inverse gamma prior on \(lscale\) is left undetermined. This is because the \emph{brms} package intelligently tunes the prior for this parameter based on the covariates of the Gaussian process (see \url{https://betanalpha.github.io/assets/case_studies/gp_part3/part3.html}).

To control for cultural phylogenetic non-independence, we manually specify the covariance structure for nation random intercepts using a pre-computed linguistic proximity matrix \(L\) (see previous section). The covariance between two nations is assumed to be linearly proportional to the linguistic proximity between those nations. This assumption is justified if we assume that cultural traits evolve neutrally via Brownian motion along a language phylogeny. Although this is a conservative assumption, we follow this approach here rather than another Gaussian Process for several reasons: (1) to avoid model non-convergence when later including a spatial Gaussian Process in the same model, (2) to work around the lack of a coordinate system for linguistic distances, as opposed to latitude and longitude values for geographic distance, and (3) to showcase different ways that researchers can allow nations to covary to control for non-independence.

The non-centered parameterisation of this model is:

\begin{align}
Y_{i} &\sim \text{Normal}(\mu_{i},\sigma) \\
\mu_{i} &= \alpha + z_{\text{NATION}[i]}\sigma_{\alpha}L + \beta X_{i} \nonumber \\
\alpha &\sim \text{Normal}(0, 0.4) \nonumber \\
\beta &\sim \text{Normal}(0, 0.4) \nonumber \\
z_{j} &\sim \text{Normal}(0, 1) \nonumber \\
\sigma_{\alpha} &\sim \text{Exponential}(5) \nonumber \\
\sigma &\sim \text{Exponential}(5) \nonumber 
\end{align}

Finally, we can control for spatial and cultural phylogenetic non-independence simultaneously by including both a Gaussian process over latitude and longitude coordinates \emph{and} nation random intercepts that covary according to linguistic proximity. The resulting model is as follows:

\begin{align}
Y_{i} &\sim \text{Normal}(\mu_{i},\sigma) \\
\mu_{i} &= \alpha + \kappa_{\text{NATION}[i]} + z_{\text{NATION}[i]}\sigma_{\alpha}L + \beta X_{i} \nonumber \\
\begin{pmatrix}
\kappa_{1} \\ \kappa_{2} \\ ... \\ \kappa_{n}
\end{pmatrix} &\sim \text{MVNormal}
\begin{pmatrix}
\begin{pmatrix}
0 \\ 0 \\ ... \\ 0
\end{pmatrix},\textbf{K}
\end{pmatrix} \nonumber \\
\textbf{K}_{ij} &= sdgp^2 \text{exp} \big (-D_{ij}^2 / (2 lscale^2) \big ) \nonumber \\
\alpha &\sim \text{Normal}(0, 0.4) \nonumber \\
\beta &\sim \text{Normal}(0, 0.4) \nonumber \\
z_{j} &\sim \text{Normal}(0, 1) \nonumber \\
\sigma_{\alpha} &\sim \text{Exponential}(5) \nonumber \\
\sigma &\sim \text{Exponential}(5) \nonumber \\
sdgp &\sim \text{Exponential}(5) \nonumber \\
lscale &\sim \text{InverseGamma}(?,?) \nonumber 
\end{align}

\newpage

\hypertarget{supplementary-figures}{%
\subsection{Supplementary Figures}\label{supplementary-figures}}


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/dag-1} \caption{\emph{A causal directed acyclic graph of spatial and cultural phylogenetic non-independence in cross-national studies.} We are interested in estimating the direct effect of national-level exposure \(X\) on national-level outcome \(Y\). But these variables are confounded by their common unobserved cause \(U\). \(U\) is a stand-in for shared environmental, ecological, and geographic causes (e.g.~climate, biodiversity, physical topography) and cultural and institutional causes (e.g.~cultural norms, technologies, and institutions). In this causal model, we need to condition on \(U\) to estimate the direct path from \(X\) to \(Y\), but we cannot since it is unobserved. However, geographic \(G\) and linguistic \(L\) relationships between societies influence \(U\), since changing a nation's spatial distance to or shared cultural ancestry with other nations will change its environmental and cultural traits. We can thus use \(G\) and \(L\) to model the covariation between \(X\) and \(Y\) induced by \(U\). Failing to do this and simply estimating the bivariate correlation between \(X\) and \(Y\) will produce spurious relationships and residuals that are spatially and culturally non-independent around the world.}\label{fig:dag}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotReview2-1} \caption{\emph{Analysis-level results from literature review of 100 highly-cited cross-national studies of economic development (red) and cultural values (blue).} (a) Proportion of analyses accounting for non-independence, overall and split by common methods of controlling for non-independence. Points represent posterior median proportions and ranges represent equal-tailed 95\% credible intervals (n = 4308 observations). (b) The association between journal impact factor and the probability that an analysis accounts for non-independence. (c) Estimated trend over time for the probability that an analysis accounts for non-independence. Lines and shaded areas are posterior median regression lines and equal-tailed 50\% credible intervals from Bayesian multilevel models (n = 4308 observations). Histograms represent relative counts for individual analyses that did (top) or did not (bottom) account for non-independence. Region FEs = region fixed effects.}\label{fig:plotReview2}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotSim1-1} \caption{\emph{Distribution of cross-national correlations from simulation study under strong spatial autocorrelation.} In these simulations, the strength of spatial autocorrelation is set to 0.8 for both outcome and predictor variables, and the true correlation is set to 0. For frequentist regression models, points represent correlation estimates and ranges represent two-tailed 95\% confidence intervals (n = 236 observations). For Bayesian regression models, points represent posterior means and ranges represent equal-tailed 95\% credible intervals (n = 236 observations). Correlations are ordered by effect size independently in each panel. Red point ranges indicate that the 95\% confidence / credible interval excludes zero. Black point ranges indicate that the 95\% confidence / credible interval includes zero. SEs = standard errors.}\label{fig:plotSim1}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotSim2-1} \caption{\emph{Distribution of cross-national correlations from simulation study under strong cultural phylogenetic autocorrelation.} In these simulations, the strength of cultural phylogenetic autocorrelation is set to 0.8 for both outcome and predictor variables, and the true correlation is set to 0. For frequentist regression models, points represent correlation estimates and ranges represent two-tailed 95\% confidence intervals (n = 236 observations). For Bayesian regression models, points represent posterior means and ranges represent equal-tailed 95\% credible intervals (n = 236 observations). Correlations are ordered by effect size independently in each panel. Red point ranges indicate that the 95\% confidence / credible interval excludes zero. Black point ranges indicate that the 95\% confidence / credible interval includes zero. SEs = standard errors.}\label{fig:plotSim2}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotPowerGeo01-1} \caption{\emph{Statistical power estimates for different methods of controlling for spatial non-independence in our simulation study, assuming a small true effect size (r = 0.1).} For simulated outcome and predictor variables, we systematically varied the strength of spatial autocorrelation, from weak (0.2) to moderate (0.5) to strong (0.8). We simulated 100 datasets per parameter combination assuming a small true correlation between variables (\emph{r} = 0.1) and fitted different models to each dataset. Statistical power was operationalised as the proportion of models that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero. Points represent raw proportions of models with slope 95\% confidence / credible intervals excluding zero, ranges represent two-tailed 95\% bootstrap confidence intervals (n = 1000 bootstrap samples), and dashed lines indicate 80\% power. Colours indicate whether the strength of autocorrelation for the predictor variable is 0.2 (red), 0.5, (green) or 0.8 (blue). SEs = standard errors.}\label{fig:plotPowerGeo01}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotPowerGeo03-1} \caption{\emph{Statistical power estimates for different methods of controlling for spatial non-independence in our simulation study, assuming a medium true effect size (r = 0.3).} For simulated outcome and predictor variables, we systematically varied the strength of spatial autocorrelation, from weak (0.2) to moderate (0.5) to strong (0.8). We simulated 100 datasets per parameter combination assuming a medium true correlation between variables (\emph{r} = 0.3) and fitted different models to each dataset. Statistical power was operationalised as the proportion of models that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero. Points represent raw proportions of models with slope 95\% confidence / credible intervals excluding zero, ranges represent two-tailed 95\% bootstrap confidence intervals (n = 1000 bootstrap samples), and dashed lines indicate 80\% power. Colours indicate whether the strength of autocorrelation for the predictor variable is 0.2 (red), 0.5, (green) or 0.8 (blue). SEs = standard errors.}\label{fig:plotPowerGeo03}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotPowerGeo05-1} \caption{\emph{Statistical power estimates for different methods of controlling for spatial non-independence in our simulation study, assuming a large true effect size (r = 0.5).} For simulated outcome and predictor variables, we systematically varied the strength of spatial autocorrelation, from weak (0.2) to moderate (0.5) to strong (0.8). We simulated 100 datasets per parameter combination assuming a large true correlation between variables (\emph{r} = 0.5) and fitted different models to each dataset. Statistical power was operationalised as the proportion of models that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero. Points represent raw proportions of models with slope 95\% confidence / credible intervals excluding zero, ranges represent two-tailed 95\% bootstrap confidence intervals (n = 1000 bootstrap samples), and dashed lines indicate 80\% power. Colours indicate whether the strength of autocorrelation for the predictor variable is 0.2 (red), 0.5, (green) or 0.8 (blue). SEs = standard errors.}\label{fig:plotPowerGeo05}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotPowerLin01-1} \caption{\emph{Statistical power estimates for different methods of controlling for cultural phylogenetic non-independence in our simulation study, assuming a small true effect size (r = 0.1).} For simulated outcome and predictor variables, we systematically varied the strength of cultural phylogenetic autocorrelation, from weak (0.2) to moderate (0.5) to strong (0.8). We simulated 100 datasets per parameter combination assuming a small true correlation between variables (\emph{r} = 0.1) and fitted different models to each dataset. Statistical power was operationalised as the proportion of models that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero. Points represent raw proportions of models with slope 95\% confidence / credible intervals excluding zero, ranges represent two-tailed 95\% bootstrap confidence intervals (n = 1000 bootstrap samples), and dashed lines indicate 80\% power. Colours indicate whether the strength of autocorrelation for the predictor variable is 0.2 (red), 0.5, (green) or 0.8 (blue). SEs = standard errors.}\label{fig:plotPowerLin01}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotPowerLin03-1} \caption{\emph{Statistical power estimates for different methods of controlling for cultural phylogenetic non-independence in our simulation study, assuming a medium true effect size (r = 0.3).} For simulated outcome and predictor variables, we systematically varied the strength of cultural phylogenetic autocorrelation, from weak (0.2) to moderate (0.5) to strong (0.8). We simulated 100 datasets per parameter combination assuming a medium true correlation between variables (\emph{r} = 0.3) and fitted different models to each dataset. Statistical power was operationalised as the proportion of models that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero. Points represent raw proportions of models with slope 95\% confidence / credible intervals excluding zero, ranges represent two-tailed 95\% bootstrap confidence intervals (n = 1000 bootstrap samples), and dashed lines indicate 80\% power. Colours indicate whether the strength of autocorrelation for the predictor variable is 0.2 (red), 0.5, (green) or 0.8 (blue). SEs = standard errors.}\label{fig:plotPowerLin03}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotPowerLin05-1} \caption{\emph{Statistical power estimates for different methods of controlling for cultural phylogenetic non-independence in our simulation study, assuming a large true effect size (r = 0.5).} For simulated outcome and predictor variables, we systematically varied the strength of cultural phylogenetic autocorrelation, from weak (0.2) to moderate (0.5) to strong (0.8). We simulated 100 datasets per parameter combination assuming a large true correlation between variables (\emph{r} = 0.5) and fitted different models to each dataset. Statistical power was operationalised as the proportion of models that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero. Points represent raw proportions of models with slope 95\% confidence / credible intervals excluding zero, ranges represent two-tailed 95\% bootstrap confidence intervals (n = 1000 bootstrap samples), and dashed lines indicate 80\% power. Colours indicate whether the strength of autocorrelation for the predictor variable is 0.2 (red), 0.5, (green) or 0.8 (blue). SEs = standard errors.}\label{fig:plotPowerLin05}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotReplications2-1} \caption{\emph{Reanalysis models fitted to raw data, for economic development (a) and cultural values (b) studies.} Data points are labelled using ISO 3166-1 alpha-2 letter country codes. In all reanalyses, outcome and predictor variables are standardised, making regression slopes comparable to Pearson's correlation coefficients. Lines and shaded areas represent posterior median regression lines and equal-tailed 95\% credible intervals. Colours indicate predictions from models with no control (red), spatial control only (green), cultural control only (blue), or both spatial and cultural control (purple). For models with covariates (Adamzyck and Pitt 2009; Gelfand et al.~2011), marginal effects are presented holding all covariates at zero or their reference categories. GDP = gross domestic product; SME = small and medium-sized enterprise.}\label{fig:plotReplications2}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotReplications3-1} \caption{\emph{Posterior estimates of Gaussian process functions mapping spatial autocorrelation onto geographic distance from our reanalyses of economic development (a) and cultural values (b) studies.} The y-axis represents the amount of spatial autocorrelation between data points with increasing distance between those points on the x-axis (logged distance in kilometres). Lines and shaded areas represent median posterior spatial autocorrelation functions and equal-tailed 50\% and 95\% credible intervals.}\label{fig:plotReplications3}
\end{figure}

\newpage


\begin{figure}[H]
\includegraphics[width=\textwidth]{manuscript_files/figure-latex/plotReplications4-1} \caption{\emph{Posterior estimates of cultural phylogenetic signal from our reanalyses.} Cultural phylogenetic signal is operationalised as the proportion of national-level variance explained by linguistic proximity between nations. Ridges are full posterior distributions, points are posterior medians, and lines represent equal-tailed 50\% and 95\% credible intervals. Numbers of observations from the models are as follows, from top to bottom: n = 69, n = 45, n = 103, n = 98, n = 63, n = 89, n = 33, n = 75, n = 67, n = 28, n = 38, and n = 28.}\label{fig:plotReplications4}
\end{figure}

\newpage


\begin{figure}
\centering
\includegraphics{manuscript_files/figure-latex/plotReplications5-1.pdf}
\caption{\label{fig:plotReplications5}\emph{The estimated degree of spatial and cultural phylogenetic non-independence predicts reductions in effect size in our reanalysis.} (a) Higher estimated degrees of spatial autocorrelation at 1,000 km distance predict more pronounced reductions in effect sizes when controlling for non-independence. (b) Higher estimated levels of cultural phylogenetic signal predict more pronounced reductions in effect sizes when controlling for non-independence. In both panels, the y-axis represents the ratio of the effect size when controlling for spatial and cultural non-independence to the original effect size (from naive regression model), and the x-axis represents posterior median model estimates. Regression lines are plotted with equal-tailed 95\% credible intervals.}
\end{figure}

\newpage

\hypertarget{supplementary-tables}{%
\subsection{Supplementary Tables}\label{supplementary-tables}}


\begin{table}[H]

\begin{center}
\begin{threeparttable}

\caption{\label{tab:tableSignal}Geographic and cultural phylogenetic signal results for economic development and cultural values variables. Signal estimates reflect the proportion of national-level variance explained by geographic and linguistic covariance matrices. Bayes Factors (BF) reflect support for the hypothesis that the signal estimate differs from zero. HDI = Human Development Index; GDPpc = gross domestic product per capita.}

\small{

\begin{tabular}{lll}
\toprule
Outcome & \multicolumn{1}{c}{Geographic signal} & \multicolumn{1}{c}{Cultural phylogenetic signal}\\
\midrule
HDI & 0.37, 95\% CI [0.18, 0.59], BF > 100 & 0.62, 95\% CI [0.40, 0.80], BF > 100\\
GDPpc & 0.42, 95\% CI [0.20, 0.66], BF > 100 & 0.56, 95\% CI [0.33, 0.78], BF > 100\\
GDPpc growth & 0.65, 95\% CI [0.09, 0.98], BF = 16.79 & 0.26, 95\% CI [0.00, 0.70], BF = 1.16\\
Gini index & 0.74, 95\% CI [0.48, 0.97], BF > 100 & 0.25, 95\% CI [0.02, 0.51], BF = 3.97\\
Traditional values & 0.44, 95\% CI [0.17, 0.76], BF > 100 & 0.54, 95\% CI [0.23, 0.79], BF > 100\\
Survival values & 0.20, 95\% CI [0.01, 0.45], BF = 1.96 & 0.78, 95\% CI [0.53, 0.96], BF > 100\\
Tightness & 0.09, 95\% CI [0.00, 0.32], BF = 0.33 & 0.84, 95\% CI [0.61, 0.97], BF > 100\\
Individualism & 0.26, 95\% CI [0.00, 0.66], BF = 1.97 & 0.69, 95\% CI [0.29, 0.96], BF > 100\\
\bottomrule
\end{tabular}

}

\end{threeparttable}
\end{center}

\end{table}

\newpage


\begin{lltable}

\small{

\begin{longtable}{llllllllll}\noalign{\getlongtablewidth\global\LTcapwidth=\longtablewidth}
\caption{\label{tab:tableSim1}False positive rates in simulation with varying levels of spatial autocorrelation for the predictor variable (\(\rho\)) and for the outcome variable (\(\lambda\)), assuming that the true correlation is 0. Numbers represent the total number of analyses, out of 100, that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero, falsely inferring a relationship when none is present.}\\
\toprule
 & \multicolumn{3}{c}{$\rho$ = 0.2} & \multicolumn{3}{c}{$\rho$ = 0.5} & \multicolumn{3}{c}{$\rho$ = 0.8} \\
\cmidrule(r){2-4} \cmidrule(r){5-7} \cmidrule(r){8-10}
Model & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8 & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8 & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8\\
\midrule
\endfirsthead
\caption*{\normalfont{Table \ref{tab:tableSim1} continued}}\\
\toprule
 & \multicolumn{3}{c}{$\rho$ = 0.2} & \multicolumn{3}{c}{$\rho$ = 0.5} & \multicolumn{3}{c}{$\rho$ = 0.8} \\
\cmidrule(r){2-4} \cmidrule(r){5-7} \cmidrule(r){8-10}
Model & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8 & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8 & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8\\
\midrule
\endhead
No control & 18 & 27 & 41 & 27 & 48 & 61 & 40 & 61 & 77\\
Latitude & 19 & 25 & 39 & 25 & 44 & 60 & 33 & 58 & 71\\
Longitude & 14 & 20 & 27 & 22 & 34 & 48 & 29 & 49 & 62\\
Continent & 10 & 13 & 16 & 13 & 18 & 24 & 13 & 25 & 35\\
Language family & 12 & 17 & 29 & 20 & 33 & 46 & 27 & 48 & 58\\
Mean 2000km radius & 9 & 12 & 19 & 5 & 9 & 13 & 5 & 5 & 6\\
Conley SEs spatial & 13 & 13 & 14 & 18 & 23 & 25 & 22 & 37 & 43\\
Conley SEs genetic & 17 & 22 & 27 & 20 & 34 & 51 & 28 & 49 & 66\\
Bayesian spatial & 14 & 13 & 11 & 13 & 15 & 12 & 16 & 17 & 23\\
Bayesian linguistic & 12 & 20 & 21 & 21 & 26 & 39 & 28 & 42 & 49\\
Bayesian spatial \& linguistic & 11 & 13 & 9 & 14 & 13 & 12 & 17 & 18 & 21\\
\bottomrule
\end{longtable}

}

\end{lltable}

\newpage


\begin{lltable}

\small{

\begin{longtable}{llllllllll}\noalign{\getlongtablewidth\global\LTcapwidth=\longtablewidth}
\caption{\label{tab:tableSim2}False positive rates in simulation with varying levels of cultural phylogenetic autocorrelation for the predictor variable (\(\rho\)) and for the outcome variable (\(\lambda\)), assuming that the true correlation is 0. Numbers represent the total number of analyses, out of 100, that estimated a slope with a two-tailed 95\% confidence / credible interval excluding zero, falsely inferring a relationship when none is present.}\\
\toprule
 & \multicolumn{3}{c}{$\rho$ = 0.2} & \multicolumn{3}{c}{$\rho$ = 0.5} & \multicolumn{3}{c}{$\rho$ = 0.8} \\
\cmidrule(r){2-4} \cmidrule(r){5-7} \cmidrule(r){8-10}
Model & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8 & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8 & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8\\
\midrule
\endfirsthead
\caption*{\normalfont{Table \ref{tab:tableSim2} continued}}\\
\toprule
 & \multicolumn{3}{c}{$\rho$ = 0.2} & \multicolumn{3}{c}{$\rho$ = 0.5} & \multicolumn{3}{c}{$\rho$ = 0.8} \\
\cmidrule(r){2-4} \cmidrule(r){5-7} \cmidrule(r){8-10}
Model & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8 & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8 & $\lambda$ = 0.2 & $\lambda$ = 0.5 & $\lambda$ = 0.8\\
\midrule
\endhead
No control & 7 & 14 & 15 & 8 & 19 & 30 & 15 & 26 & 36\\
Latitude & 7 & 10 & 16 & 10 & 19 & 27 & 15 & 22 & 35\\
Longitude & 5 & 12 & 14 & 9 & 16 & 26 & 13 & 26 & 35\\
Continent & 5 & 6 & 10 & 3 & 11 & 21 & 8 & 20 & 29\\
Language family & 7 & 9 & 12 & 9 & 14 & 22 & 10 & 20 & 32\\
Mean 2000km radius & 5 & 8 & 12 & 2 & 12 & 21 & 4 & 16 & 25\\
Conley SEs spatial & 2 & 6 & 7 & 2 & 9 & 15 & 6 & 14 & 20\\
Conley SEs genetic & 5 & 11 & 13 & 8 & 13 & 21 & 8 & 17 & 26\\
Bayesian spatial & 7 & 12 & 12 & 9 & 17 & 25 & 14 & 24 & 32\\
Bayesian linguistic & 5 & 9 & 11 & 6 & 7 & 7 & 4 & 5 & 5\\
Bayesian spatial \& linguistic & 3 & 10 & 11 & 5 & 8 & 8 & 4 & 5 & 5\\
\bottomrule
\end{longtable}

}

\end{lltable}

\newpage


\begin{lltable}

\footnotesize{

\begin{longtable}{rrrrr}\noalign{\getlongtablewidth\global\LTcapwidth=\longtablewidth}
\caption{\label{tab:tableReplications}Estimated cross-national correlations from our reanalysis of twelve previous cross-national analyses. Numbers are posterior median slopes (equivalent to Pearson's r correlation coefficients) with equal-tailed 95\% credible intervals.}\\
\toprule
Analysis & \multicolumn{1}{c}{No control} & \multicolumn{1}{c}{Spatial control} & \multicolumn{1}{c}{Cultural control} & \multicolumn{1}{c}{Both controls}\\
\midrule
\endfirsthead
\caption*{\normalfont{Table \ref{tab:tableReplications} continued}}\\
\toprule
Analysis & \multicolumn{1}{c}{No control} & \multicolumn{1}{c}{Spatial control} & \multicolumn{1}{c}{Cultural control} & \multicolumn{1}{c}{Both controls}\\
\midrule
\endhead
Adamczyk and Pitt (2009) & 0.20, 95\% CI [ 0.07,\ \ 0.33] & 0.20, 95\% CI [ 0.07,\ \ 0.34] & 0.19, 95\% CI [ 0.05,\ \ 0.33] & 0.20, 95\% CI [ 0.06,\ \ 0.33]\\
Alesina et al. (2013) & -0.21, 95\% CI [-0.42,\ \ 0.01] & -0.21, 95\% CI [-0.43,\ \ 0.01] & -0.07, 95\% CI [-0.26,\ \ 0.11] & -0.07, 95\% CI [-0.25,\ \ 0.11]\\
Beck et al. (2003) & -0.50, 95\% CI [-0.68, -0.30] & -0.15, 95\% CI [-0.38,\ \ 0.02] & -0.56, 95\% CI [-0.77, -0.33] & -0.54, 95\% CI [-0.76, -0.30]\\
Beck et al. (2005) & 0.38, 95\% CI [ 0.12,\ \ 0.64] & 0.25, 95\% CI [-0.01,\ \ 0.50] & 0.29, 95\% CI [ 0.10,\ \ 0.49] & 0.29, 95\% CI [ 0.09,\ \ 0.48]\\
Bockstette et al. (2002) & 0.43, 95\% CI [ 0.25,\ \ 0.59] & 0.41, 95\% CI [ 0.19,\ \ 0.59] & 0.37, 95\% CI [ 0.18,\ \ 0.57] & 0.37, 95\% CI [ 0.15,\ \ 0.56]\\
Easterly and Levine (2003) & 0.75, 95\% CI [ 0.60,\ \ 0.90] & 0.76, 95\% CI [ 0.57,\ \ 0.93] & 0.65, 95\% CI [ 0.47,\ \ 0.82] & 0.66, 95\% CI [ 0.47,\ \ 0.84]\\
Easterly (2007) & -0.46, 95\% CI [-0.63, -0.29] & -0.18, 95\% CI [-0.36,\ \ 0.01] & -0.25, 95\% CI [-0.41, -0.09] & -0.19, 95\% CI [-0.36, -0.01]\\
Fincher et al. (2008) & -0.64, 95\% CI [-0.82, -0.46] & -0.59, 95\% CI [-0.80, -0.21] & -0.50, 95\% CI [-0.71, -0.27] & -0.47, 95\% CI [-0.69, -0.18]\\
Gelfand et al. (2011) & 0.54, 95\% CI [ 0.20,\ \ 0.85] & 0.54, 95\% CI [ 0.19,\ \ 0.86] & 0.49, 95\% CI [ 0.14,\ \ 0.83] & 0.50, 95\% CI [ 0.15,\ \ 0.83]\\
Inglehart and Baker (2000) & 0.48, 95\% CI [ 0.21,\ \ 0.74] & 0.27, 95\% CI [ 0.11,\ \ 0.44] & 0.36, 95\% CI [ 0.11,\ \ 0.60] & 0.28, 95\% CI [ 0.10,\ \ 0.46]\\
Knack and Keefer (1997) & 0.36, 95\% CI [ 0.05,\ \ 0.67] & 0.36, 95\% CI [ 0.04,\ \ 0.66] & 0.28, 95\% CI [-0.10,\ \ 0.63] & 0.29, 95\% CI [-0.09,\ \ 0.62]\\
Skidmore and Toya (2002) & 0.30, 95\% CI [ 0.10,\ \ 0.49] & 0.20, 95\% CI [ 0.00,\ \ 0.41] & 0.21, 95\% CI [ 0.03,\ \ 0.40] & 0.21, 95\% CI [ 0.01,\ \ 0.41]\\
\bottomrule
\end{longtable}

}

\end{lltable}

\newpage


\begin{center}
\begin{ThreePartTable}

\scriptsize{

\begin{longtable}{m{2cm}m{2cm}m{2cm}m{9cm}}\noalign{\getlongtablewidth\global\LTcapwidth=\longtablewidth}
\caption{\label{tab:tableDeviations}List of sample size deviations between original analyses and reanalyses.}\\
\toprule
Analysis & \multicolumn{1}{c}{Original N} & \multicolumn{1}{c}{Reanalysis N} & \multicolumn{1}{c}{Reason for deviation}\\
\midrule
\endfirsthead
\caption*{\normalfont{Table \ref{tab:tableDeviations} continued}}\\
\toprule
Analysis & \multicolumn{1}{c}{Original N} & \multicolumn{1}{c}{Reanalysis N} & \multicolumn{1}{c}{Reason for deviation}\\
\midrule
\endhead
Adamczyk and Pitt (2009) & 33 & 33 & N/A\\
Alesina et al. (2013) & >177 & 75 & Original analysis used imputed values for traditional plough use which were unavailable to us. For our reanalysis, we collected data from Tables A4 and A9 and ran our regression on the 75 nations with available data for female labour force participation in 2000 and traditional plough use.\\
Beck et al. (2003) & 70 & 69 & We removed one nation (Zaire) as it was not present in our linguistic distance matrix.\\
Beck et al. (2005) & 45 & 45 & N/A\\
Bockstette et al. (2002) & 94 & 103 & After manually linking state history data from Appendix A with world development indicators, we had complete data for 103 nations.\\
Easterly and Levine (2003) & 72 & 63 & After manually linking log GDP per capita 1995 data from Appendix Table A2 in Acemoglu et al. (2001) with an institutions index self-constructed from world governance indicators, we only had complete data for 63 nations.\\
Easterly (2007) & 118 & 98 & After manually linking log wheat-sugar ratio data from Appendix A with longitudinal Gini data, we only had complete data for 98 nations.\\
Fincher et al. (2008) & 68 & 67 & We combined England and Northern Ireland into a single nation (United Kingdom) for the reanalysis.\\
Gelfand et al. (2011) & 30 & 28 & We combined East and West Germany into a single nation (Germany) and removed a high leverage point with a substantially higher disaster rate than other nations (Venezuela).\\
Inglehart and Baker (2000) & 65 & 38 & After manually linking traditional values data from the World Values Survey with data on percentage total employment in industry from World Development Indicators, we only had complete data for 38 nations.\\
Knack and Keefer (1997) & 28 & 28 & N/A\\
Skidmore and Toya (2002) & 89 & 89 & N/A\\
\bottomrule
\end{longtable}

}

\end{ThreePartTable}
\end{center}

\newpage

\hypertarget{supplementary-references}{%
\subsection{Supplementary References}\label{supplementary-references}}

\begin{enumerate}
\def\labelenumi{\arabic{enumi}.}
\tightlist
\item
  Bürkner, P.-C. brms: An R package for Bayesian multilevel models using Stan. \emph{Journal of Statistical Software} \textbf{80}, 1--28 (2017).
\end{enumerate}


\end{document}