@article {Simonian41, author = {Joseph Simonian}, title = {Modular Machine Learning for Model Validation: An Application to the Fundamental Law of Active Management}, volume = {2}, number = {2}, pages = {41--50}, year = {2020}, doi = {10.3905/jfds.2020.1.027}, publisher = {Institutional Investor Journals Umbrella}, abstract = {The author introduces a modular machine learning framework for model validation in which the output from one procedure serves as the input to another procedure within a single validation framework. A defining feature of the described methodology is the use of both traditional econometrics and data science. The author uses an econometric model in the first module to classify data in an economically intuitive way. Proceeding modules apply data science techniques to evaluate the predictive characteristics of the model components. The author applies his framework to the fundamental law of active management, a well-known formal characterization of portfolio managers{\textquoteright} alpha generation process. In contrast to standard applications of the law, in which it has been used to evaluate a manager{\textquoteright}s existing active management process, the author recasts the law within his framework as a means to test investment signals for potential use, individually or collectively, in a manager{\textquoteright}s investment process. To illustrate how this application works, the author provides an example using the well-known Fama{\textendash}French factors as test signals.TOPICS: Statistical methods, simulations, big data/machine learningKey Findings{\textbullet} Implementing model validation through a set of interdependent modules that uses both traditional econometrics and data science techniques can produce robust assessments of the predictive effectiveness of investment signals in an economically intuitive manner.{\textbullet} The proposed methodology, modular machine learning, also answers several practical questions that arise when applying block time series cross-validation, such as the length of the folds and the block size to use between folds.{\textbullet} It is possible to reinterpret the fundamental law of active management into a model validation framework by expressing its fundamental concepts{\textemdash}information coefficient and breadth{\textemdash}using the formal language of data science.}, issn = {2640-3943}, URL = {https://jfds.pm-research.com/content/2/2/41}, eprint = {https://jfds.pm-research.com/content/2/2/41.full.pdf}, journal = {The Journal of Financial Data Science} }