@article { author = {Kaffashzadeh, Najmeh and Aliakbari Bidokhti, Abbasali}, title = {Quality control of measured surface Ozone at the Tehran city stations using a new sStatistical software}, journal = {Iranian Journal of Geophysics}, volume = {16}, number = {1}, pages = {141-150}, year = {2022}, publisher = {Iranian Geophysical Society}, issn = {2008-0336}, eissn = {2783-168X}, doi = {10.30499/ijg.2021.304252.1364}, abstract = {Being an inseparable part of environmental data, errors are generated due to several reasons, either natural or artificial. The first is produced from natural phenomena such as animal activities, storms, floods, etc. The later can be generated via human activities during data collecting, entering and processing that can be intentional or unintentional. Since errors can affect results of any analysis, distinguishing them via quality control is a prerequisite of any data usage. Because of unknown truth, this seemingly simple task becomes challenging. Although many efforts have been devoted to develop tests and tools for distinguishing errors in data, none of them can guarantee that all errors can be found. It is important as much as orthogonal testing to find more errors. Here we used a tool named AutoQA4Env, which has been developed for an automated quality control of environmental data. This tool consists of a series of statistical tests which have been used in various communities and organizations such as World Meteorological Organization and Environmental Protection Agency. The tests have been classified in several groups, based on their strictness. The tool has a setting menu by which users can add tests and modify the thresholds. Two versions of the tool, namely basic and advanced flagging system are open source and accessible via b2share. The tool was tested for the quality control of a set of data series of surface ozone measured at the pollution monitoring stations in the city of Tehran. These data are an important source to get information about the pollution levels and trends in Tehran; thus knowing their quality can improve and reduce the uncertainties in the results. The results indicate that gross errors exist in the most of the stations’ data, even though these data are published and are publicly available. Applying the tool in the basic state finds most of the errors. About 0.02% of the data were erroneous for three years of data at 15 stations. Binary flagging system of the tool labels these failure data as an unacceptable data, although they were in fact acceptable. The advanced state of the tool was more moderate than the basic one and corrected these labels. In this state, 57.7% of the unacceptable data in the basic state were distinguished as a suspected value and only 5.6% of them were unacceptable. Therefore, we can conclude that the AutoQA4Env even at this stage could find and flag most of the data errors, at least gross errors. Besides, the advanced flagging system of the tool reduces errors in labeling. }, keywords = {errors,Quality Control,AutoQA4Env tool,surface ozone data}, title_fa = {کنترل کیفی داده های اوزن سطحی اندازه گیری شده در ایستگاه های شهر تهران با کمک نرم افزار آماری جدید}, abstract_fa = {بی‌توجهی به وجود خطاهای متعدد شامل خطای فاحش، اعداد ثابت و غیره در داده می تواند به نتایج نادرست در تحلیل داده ها منجر شود؛ ازاین رو کنترل کیفی داده گامی ضرورری جهت حصول اطمینان از صحت داده است. در دسترس نبودن واقعیت، سبب پیچیدگی در تشخیص خطا و انجام دادن کنترل کیفی داده می شود. روش ها و آزمایش های آماری گوناگونی برای کنترل کیفی داده وجود دارد، ولی هیچ یک یافتن تمامی خطاها را در داده ضمانت نمی کنند. اجرای هرچه بیشتر آزمایش ها سبب افزایش اطمینان نسبی از کیفیت داده می شود. در این مطالعه به دلیل اهمیت و ضرورت مطالعه آلاینده ازن سطحی، کیفیت این داده ها در سطح شهر تهران بررسی شد. کنترل کیفی داده ها با استفاده از ابزار AutoQA4Env انجام شد. این ابزار متشکل از مجموعه آزمایش های آماری گروه‌بندی شده در دو حالت پایه و پیشرفته است. از ویژگی های خاص این ابزار، تنظیمات کاربری، تکرارپذیری و گسترش پذیری آن است. نتایج اجرای این ابزار در حالت پایه، حاکی از وجود خطای فاحش در برخی از داده ها بود که این موضوع به‌منزله لزوم بررسی کنترل کیفی داده پیش از به‌کارگیری آن است. از طرف دیگر، در برخی موارد نشان داده شد اجرای ابزار در حالت پایه کافی نیست و کاربست ابزار در حالت پیشرفته مناسب تر است.}, keywords_fa = {کنترل کیفی,داده های ازن سطحی,خطای فاحش,ابزار AutoQA4Env}, url = {https://www.ijgeophysics.ir/article_141877.html}, eprint = {https://www.ijgeophysics.ir/article_141877_2bcc39dc493025256ac15e68490e8614.pdf} }