@ARTICLE{Kamińska_Joanna_Amelia_Explicit_2020, author={Kamińska, Joanna Amelia and Turek, Tomasz}, volume={vol. 46}, number={No 1}, pages={93-99}, journal={Archives of Environmental Protection}, howpublished={online}, year={2020}, publisher={Polish Academy of Sciences}, abstract={High concentrations of nitrogen dioxide in the air, particularly in heavily urbanized areas, have an adverse eff ect on many aspects of residents’ health. A method is proposed for modelling daily average, minimal and maximal atmospheric NO 2 concentrations in a conurbation, using two types of modelling: multiple linear regression (LR) an advanced data mining technique – Random Forest (RF). It was shown that Random Forest technique can be successfully applied to predict daily NO 2 concentration based on data from 2015–2017 years and gives better fit than linear models. The best results were obtained for predicting daily average NO 2 values with R 2 =0.69 and RMSE=7.47 μg/m . The cost of receiving an explicit, interpretable function is a much worse fit (R 2 from 0.32 to 0.57). Verification of models on independent material from the first half of 2018 showed the correctness of the models with the mean average percentage error equal to 16.5% for RF and 28% for LR modelling daily average concentration. The most important factors were wind conditions and traffic flow. In prediction of maximal daily concentration, air temperature and air humidity take on greater importance. Prevailing westerly and south-westerly winds in Wrocław effectively implement the idea of ventilating the city within the studied intersection. Summarizing: when modeling natural phenomena, a compromise should be sought between the accuracy of the model and its interpretability.}, type={Article}, title={Explicit and implicit description of the factors impact on the NO 2 concentration in the traffic corridor}, URL={http://ochroma.man.poznan.pl/Content/115796/PDF/Arch_vol46_pp93_99.pdf}, doi={10.24425/aep.2020.132530}, keywords={nitrogen dioxide, traffic flow, meteorological conditions, random forest, linear regression}, }