PyPI - AeroViz - Versions diffs - 0.1.2__py3-none-any.whl → 0.1.3b0__py3-none-any.whl - Mend

AeroViz 0.1.2__py3-none-any.whl → 0.1.3b0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of AeroViz might be problematic. Click here for more details.

Files changed (112)

AeroViz/__init__.py +4 -4
AeroViz/config/DEFAULT_DATA.csv +1417 -0
AeroViz/config/DEFAULT_PNSD_DATA.csv +1417 -0
AeroViz/dataProcess/Chemistry/__init__.py +38 -38
AeroViz/dataProcess/Chemistry/_calculate.py +15 -15
AeroViz/dataProcess/Chemistry/_isoropia.py +69 -68
AeroViz/dataProcess/Chemistry/_mass_volume.py +158 -158
AeroViz/dataProcess/Chemistry/_ocec.py +109 -109
AeroViz/dataProcess/Chemistry/_partition.py +19 -18
AeroViz/dataProcess/Chemistry/_teom.py +8 -11
AeroViz/dataProcess/Optical/_IMPROVE.py +40 -39
AeroViz/dataProcess/Optical/__init__.py +35 -35
AeroViz/dataProcess/Optical/_absorption.py +35 -35
AeroViz/dataProcess/Optical/_extinction.py +25 -24
AeroViz/dataProcess/Optical/_mie.py +5 -6
AeroViz/dataProcess/Optical/_mie_sd.py +89 -90
AeroViz/dataProcess/Optical/_scattering.py +16 -16
AeroViz/dataProcess/SizeDistr/__init__.py +37 -37
AeroViz/dataProcess/SizeDistr/__merge.py +159 -158
AeroViz/dataProcess/SizeDistr/_merge.py +155 -154
AeroViz/dataProcess/SizeDistr/_merge_v1.py +162 -161
AeroViz/dataProcess/SizeDistr/_merge_v2.py +153 -152
AeroViz/dataProcess/SizeDistr/_merge_v3.py +326 -326
AeroViz/dataProcess/SizeDistr/_merge_v4.py +272 -274
AeroViz/dataProcess/SizeDistr/_size_distr.py +51 -51
AeroViz/dataProcess/VOC/__init__.py +7 -7
AeroViz/dataProcess/VOC/_potential_par.py +53 -55
AeroViz/dataProcess/VOC/voc_par.json +464 -0
AeroViz/dataProcess/__init__.py +4 -4
AeroViz/dataProcess/core/__init__.py +59 -58
AeroViz/plot/__init__.py +6 -1
AeroViz/plot/bar.py +126 -0
AeroViz/plot/box.py +68 -0
AeroViz/plot/distribution/distribution.py +421 -427
AeroViz/plot/meteorology/meteorology.py +240 -292
AeroViz/plot/optical/__init__.py +0 -1
AeroViz/plot/optical/optical.py +230 -230
AeroViz/plot/pie.py +198 -0
AeroViz/plot/regression.py +210 -0
AeroViz/plot/scatter.py +99 -0
AeroViz/plot/templates/__init__.py +0 -3
AeroViz/plot/templates/contour.py +25 -25
AeroViz/plot/templates/corr_matrix.py +86 -93
AeroViz/plot/templates/diurnal_pattern.py +24 -24
AeroViz/plot/templates/koschmieder.py +106 -106
AeroViz/plot/templates/metal_heatmap.py +34 -34
AeroViz/plot/timeseries/timeseries.py +53 -60
AeroViz/plot/utils/__init__.py +2 -1
AeroViz/plot/utils/_color.py +57 -57
AeroViz/plot/utils/_unit.py +48 -48
AeroViz/plot/utils/fRH.json +390 -0
AeroViz/plot/utils/plt_utils.py +92 -0
AeroViz/plot/utils/sklearn_utils.py +49 -0
AeroViz/plot/utils/units.json +84 -0
AeroViz/plot/violin.py +79 -0
AeroViz/process/__init__.py +15 -15
AeroViz/process/core/DataProc.py +9 -9
AeroViz/process/core/SizeDist.py +81 -81
AeroViz/process/method/PyMieScatt_update.py +488 -488
AeroViz/process/method/mie_theory.py +231 -229
AeroViz/process/method/prop.py +40 -40
AeroViz/process/script/AbstractDistCalc.py +103 -103
AeroViz/process/script/Chemical.py +166 -166
AeroViz/process/script/IMPACT.py +40 -40
AeroViz/process/script/IMPROVE.py +152 -152
AeroViz/process/script/Others.py +45 -45
AeroViz/process/script/PSD.py +26 -26
AeroViz/process/script/PSD_dry.py +69 -70
AeroViz/process/script/retrieve_RI.py +50 -51
AeroViz/rawDataReader/__init__.py +57 -57
AeroViz/rawDataReader/core/__init__.py +328 -326
AeroViz/rawDataReader/script/AE33.py +18 -18
AeroViz/rawDataReader/script/AE43.py +20 -20
AeroViz/rawDataReader/script/APS_3321.py +30 -30
AeroViz/rawDataReader/script/Aurora.py +23 -23
AeroViz/rawDataReader/script/BC1054.py +40 -40
AeroViz/rawDataReader/script/EPA_vertical.py +9 -9
AeroViz/rawDataReader/script/GRIMM.py +21 -21
AeroViz/rawDataReader/script/IGAC_TH.py +67 -67
AeroViz/rawDataReader/script/IGAC_ZM.py +59 -59
AeroViz/rawDataReader/script/MA350.py +39 -39
AeroViz/rawDataReader/script/NEPH.py +74 -74
AeroViz/rawDataReader/script/OCEC_LCRES.py +21 -21
AeroViz/rawDataReader/script/OCEC_RES.py +16 -16
AeroViz/rawDataReader/script/SMPS_TH.py +25 -25
AeroViz/rawDataReader/script/SMPS_aim11.py +32 -32
AeroViz/rawDataReader/script/SMPS_genr.py +31 -31
AeroViz/rawDataReader/script/TEOM.py +28 -28
AeroViz/rawDataReader/script/Table.py +12 -12
AeroViz/rawDataReader/script/VOC_TH.py +16 -16
AeroViz/rawDataReader/script/VOC_ZM.py +28 -28
AeroViz/rawDataReader/script/__init__.py +20 -20
AeroViz/rawDataReader/utils/config.py +161 -161
AeroViz/tools/database.py +65 -65
AeroViz/tools/dataclassifier.py +106 -106
AeroViz/tools/dataprinter.py +51 -51
AeroViz/tools/datareader.py +38 -38
{AeroViz-0.1.2.dist-info → AeroViz-0.1.3b0.dist-info}/METADATA +5 -4
AeroViz-0.1.3b0.dist-info/RECORD +110 -0
AeroViz/config/__init__.py +0 -0
AeroViz/plot/improve/__init__.py +0 -1
AeroViz/plot/improve/improve.py +0 -240
AeroViz/plot/optical/aethalometer.py +0 -77
AeroViz/plot/templates/event_evolution.py +0 -65
AeroViz/plot/templates/regression.py +0 -256
AeroViz/plot/templates/scatter.py +0 -130
AeroViz/plot/templates/templates.py +0 -398
AeroViz/plot/utils/_decorator.py +0 -74
AeroViz-0.1.2.dist-info/RECORD +0 -106
{AeroViz-0.1.2.dist-info → AeroViz-0.1.3b0.dist-info}/LICENSE +0 -0
{AeroViz-0.1.2.dist-info → AeroViz-0.1.3b0.dist-info}/WHEEL +0 -0
{AeroViz-0.1.2.dist-info → AeroViz-0.1.3b0.dist-info}/top_level.txt +0 -0

AeroViz/rawDataReader/script/IGAC_ZM.py CHANGED Viewed

@@ -8,83 +8,83 @@ from AeroViz.rawDataReader.core import AbstractReader
 class Reader(AbstractReader):
-	nam = 'IGAC_ZM'
+    nam = 'IGAC_ZM'
-	def _raw_reader(self, _file):
+    def _raw_reader(self, _file):
-		with (_file).open('r', encoding='utf-8-sig', errors='ignore') as f:
-			_df = read_csv(f, parse_dates=[0], index_col=[0], na_values=['-']).apply(to_numeric, errors='coerce')
+        with (_file).open('r', encoding='utf-8-sig', errors='ignore') as f:
+            _df = read_csv(f, parse_dates=[0], index_col=[0], na_values=['-']).apply(to_numeric, errors='coerce')
-			_df.columns = _df.keys().str.strip(' ')
-			_df.index.name = 'time'
+            _df.columns = _df.keys().str.strip(' ')
+            _df.index.name = 'time'
-		return _df.loc[_df.index.dropna()].loc[~_df.index.duplicated()]
+        return _df.loc[_df.index.dropna()].loc[~_df.index.duplicated()]
-	## QC data
-	def _QC(self, _df):
+    ## QC data
+    def _QC(self, _df):
-		## QC parameter, function (MDL SE LE)
-		_mdl = {
-			'Na+': 0.06,
-			'NH4+': 0.05,
-			'K+': 0.05,
-			'Mg2+': 0.12,
-			'Ca2+': 0.07,
-			'Cl-': 0.07,
-			'NO2-': 0.05,
-			'NO3-': 0.11,
-			'SO42-': 0.08,
-		}
-		_mdl.update(self._oth_set.get('mdl', {}))
+        ## QC parameter, function (MDL SE LE)
+        _mdl = {
+            'Na+': 0.06,
+            'NH4+': 0.05,
+            'K+': 0.05,
+            'Mg2+': 0.12,
+            'Ca2+': 0.07,
+            'Cl-': 0.07,
+            'NO2-': 0.05,
+            'NO3-': 0.11,
+            'SO42-': 0.08,
+        }
+        _mdl.update(self._oth_set.get('mdl', {}))
-		def _se_le(_df_, _log=False):
-			_df_ = np.log10(_df_) if _log else _df_
+        def _se_le(_df_, _log=False):
+            _df_ = np.log10(_df_) if _log else _df_
-			_df_qua = _df_.quantile([.25, .75])
-			_df_q1, _df_q3 = _df_qua.loc[.25].copy(), _df_qua.loc[.75].copy()
-			_df_iqr = _df_q3 - _df_q1
+            _df_qua = _df_.quantile([.25, .75])
+            _df_q1, _df_q3 = _df_qua.loc[.25].copy(), _df_qua.loc[.75].copy()
+            _df_iqr = _df_q3 - _df_q1
-			_se = concat([_df_q1 - 1.5 * _df_iqr] * len(_df_), axis=1).T.set_index(_df_.index)
-			_le = concat([_df_q3 + 1.5 * _df_iqr] * len(_df_), axis=1).T.set_index(_df_.index)
+            _se = concat([_df_q1 - 1.5 * _df_iqr] * len(_df_), axis=1).T.set_index(_df_.index)
+            _le = concat([_df_q3 + 1.5 * _df_iqr] * len(_df_), axis=1).T.set_index(_df_.index)
-			if _log:
-				return 10 ** _se, 10 ** _le
-			return _se, _le
+            if _log:
+                return 10 ** _se, 10 ** _le
+            return _se, _le
-		_cation, _anion, _main = ['Na+', 'NH4+', 'K+', 'Mg2+', 'Ca2+'], ['Cl-', 'NO2-', 'NO3-', 'SO42-', ], ['SO42-',
-																											 'NO3-',
-																											 'NH4+']
+        _cation, _anion, _main = ['Na+', 'NH4+', 'K+', 'Mg2+', 'Ca2+'], ['Cl-', 'NO2-', 'NO3-', 'SO42-', ], ['SO42-',
+                                                                                                             'NO3-',
+                                                                                                             'NH4+']
-		_df_salt = _df[_mdl.keys()].copy()
-		_df_pm = _df['PM2.5'].copy()
+        _df_salt = _df[_mdl.keys()].copy()
+        _df_pm = _df['PM2.5'].copy()
-		## lower than PM2.5
-		## conc. of main salt should be present at the same time (NH4+, SO42-, NO3-)
-		_df_salt = _df_salt.mask(_df_salt.sum(axis=1, min_count=1) > _df_pm).dropna(subset=_main).copy()
+        ## lower than PM2.5
+        ## conc. of main salt should be present at the same time (NH4+, SO42-, NO3-)
+        _df_salt = _df_salt.mask(_df_salt.sum(axis=1, min_count=1) > _df_pm).dropna(subset=_main).copy()
-		## mdl
-		for (_key, _df_col), _mdl_val in zip(_df_salt.items(), _mdl.values()):
-			_df_salt[_key] = _df_col.mask(_df_col < _mdl_val, _mdl_val / 2)
+        ## mdl
+        for (_key, _df_col), _mdl_val in zip(_df_salt.items(), _mdl.values()):
+            _df_salt[_key] = _df_col.mask(_df_col < _mdl_val, _mdl_val / 2)
-		## calculate SE LE
-		## salt < LE
-		_se, _le = _se_le(_df_salt, _log=True)
-		_df_salt = _df_salt.mask(_df_salt > _le).copy()
+        ## calculate SE LE
+        ## salt < LE
+        _se, _le = _se_le(_df_salt, _log=True)
+        _df_salt = _df_salt.mask(_df_salt > _le).copy()
-		## C/A, A/C
-		_rat_CA = (_df_salt[_cation].sum(axis=1) / _df_salt[_anion].sum(axis=1)).to_frame()
-		_rat_AC = (1 / _rat_CA).copy()
+        ## C/A, A/C
+        _rat_CA = (_df_salt[_cation].sum(axis=1) / _df_salt[_anion].sum(axis=1)).to_frame()
+        _rat_AC = (1 / _rat_CA).copy()
-		_se, _le = _se_le(_rat_CA, )
-		_cond_CA = (_rat_CA < _le) & (_rat_CA > 0)
+        _se, _le = _se_le(_rat_CA, )
+        _cond_CA = (_rat_CA < _le) & (_rat_CA > 0)
-		_se, _le = _se_le(_rat_AC, )
-		_cond_AC = (_rat_AC < _le) & (_rat_AC > 0)
+        _se, _le = _se_le(_rat_AC, )
+        _cond_AC = (_rat_AC < _le) & (_rat_AC > 0)
-		_df_salt = _df_salt.where((_cond_CA * _cond_AC)[0]).copy()
+        _df_salt = _df_salt.where((_cond_CA * _cond_AC)[0]).copy()
-		## conc. of main salt > SE
-		_se, _le = _se_le(_df_salt[_main], _log=True)
-		_df_salt[_main] = _df_salt[_main].mask(_df_salt[_main] < _se).copy()
+        ## conc. of main salt > SE
+        _se, _le = _se_le(_df_salt[_main], _log=True)
+        _df_salt[_main] = _df_salt[_main].mask(_df_salt[_main] < _se).copy()
-		return _df_salt.reindex(_df.index)
+        return _df_salt.reindex(_df.index)

AeroViz/rawDataReader/script/MA350.py CHANGED Viewed

@@ -4,42 +4,42 @@ from AeroViz.rawDataReader.core import AbstractReader
 class Reader(AbstractReader):
-	nam = 'MA350'
-	def _raw_reader(self, _file):
-		_df = read_csv(_file, parse_dates=['Date / time local'], index_col='Date / time local').rename_axis("Time")
-		_df = _df.rename(columns={
-			'UV BCc': 'BC1',
-			'Blue BCc': 'BC2',
-			'Green BCc': 'BC3',
-			'Red BCc': 'BC4',
-			'IR BCc': 'BC5',
-			'Biomass BCc  (ng/m^3)': 'BB mass',
-			'Fossil fuel BCc  (ng/m^3)': 'FF mass',
-			'Delta-C  (ng/m^3)': 'Delta-C',
-			'AAE': 'AAE',
-			'BB (%)': 'BB',
-		})
-		# remove data without Status=32 (Automatic Tape Advance), 65536 (Tape Move)
-		# if not self._oth_set.get('ignore_err', False):
-		#     _df = _df.where((_df['Status'] != 32) | (_df['Status'] != 65536)).copy()
-		return _df[['BC1', 'BC2', 'BC3', 'BC4', 'BC5', 'BB mass', 'FF mass', 'Delta-C', 'AAE', 'BB']]
-	# QC data
-	def _QC(self, _df):
-		# remove negative value
-		_df = _df[['BC1', 'BC2', 'BC3', 'BC4', 'BC5', 'BB mass', 'FF mass', 'AAE', 'BB']].mask((_df < 0).copy())
-		# call by _QC function
-		# QC data in 1 hr
-		def _QC_func(_df_1hr):
-			_df_ave = _df_1hr.mean()
-			_df_std = _df_1hr.std()
-			_df_lowb, _df_highb = _df_1hr < (_df_ave - _df_std * 1.5), _df_1hr > (_df_ave + _df_std * 1.5)
-			return _df_1hr.mask(_df_lowb | _df_highb).copy()
-		return _df.resample('1h', group_keys=False).apply(_QC_func).resample('5min').mean()
+    nam = 'MA350'
+    def _raw_reader(self, _file):
+        _df = read_csv(_file, parse_dates=['Date / time local'], index_col='Date / time local').rename_axis("Time")
+        _df = _df.rename(columns={
+            'UV BCc': 'BC1',
+            'Blue BCc': 'BC2',
+            'Green BCc': 'BC3',
+            'Red BCc': 'BC4',
+            'IR BCc': 'BC5',
+            'Biomass BCc  (ng/m^3)': 'BB mass',
+            'Fossil fuel BCc  (ng/m^3)': 'FF mass',
+            'Delta-C  (ng/m^3)': 'Delta-C',
+            'AAE': 'AAE',
+            'BB (%)': 'BB',
+        })
+        # remove data without Status=32 (Automatic Tape Advance), 65536 (Tape Move)
+        # if not self._oth_set.get('ignore_err', False):
+        #     _df = _df.where((_df['Status'] != 32) | (_df['Status'] != 65536)).copy()
+        return _df[['BC1', 'BC2', 'BC3', 'BC4', 'BC5', 'BB mass', 'FF mass', 'Delta-C', 'AAE', 'BB']]
+    # QC data
+    def _QC(self, _df):
+        # remove negative value
+        _df = _df[['BC1', 'BC2', 'BC3', 'BC4', 'BC5', 'BB mass', 'FF mass', 'AAE', 'BB']].mask((_df < 0).copy())
+        # call by _QC function
+        # QC data in 1 hr
+        def _QC_func(_df_1hr):
+            _df_ave = _df_1hr.mean()
+            _df_std = _df_1hr.std()
+            _df_lowb, _df_highb = _df_1hr < (_df_ave - _df_std * 1.5), _df_1hr > (_df_ave + _df_std * 1.5)
+            return _df_1hr.mask(_df_lowb | _df_highb).copy()
+        return _df.resample('1h', group_keys=False).apply(_QC_func).resample('5min').mean()

AeroViz/rawDataReader/script/NEPH.py CHANGED Viewed

@@ -4,77 +4,77 @@ from AeroViz.rawDataReader.core import AbstractReader
 class Reader(AbstractReader):
-	nam = 'NEPH'
-	def _raw_reader(self, _file):
-		with _file.open('r', encoding='utf-8', errors='ignore') as f:
-			_df = read_csv(f, header=None, names=range(11))
-			_df_grp = _df.groupby(0)
-			# T : time
-			_df_tm = _df_grp.get_group('T')[[1, 2, 3, 4, 5, 6]].astype(int)
-			for _k in [2, 3, 4, 5, 6]:
-				_df_tm[_k] = _df_tm[_k].astype(int).map('{:02d}'.format).copy()
-			_df_tm = _df_tm.astype(str)
-			_idx_tm = to_datetime((_df_tm[1] + _df_tm[2] + _df_tm[3] + _df_tm[4] + _df_tm[5] + _df_tm[6]),
-								  format='%Y%m%d%H%M%S')
-			# D : data
-			# col : 3~8 B G R BB BG BR
-			# 1e6
-			try:
-				_df_dt = _df_grp.get_group('D')[[1, 2, 3, 4, 5, 6, 7, 8]].set_index(_idx_tm)
-				_df_out = (_df_dt.groupby(1).get_group('NBXX')[[3, 4, 5, 6, 7, 8]] * 1e6).reindex(_idx_tm)
-				_df_out.columns = ['B', 'G', 'R', 'BB', 'BG', 'BR']
-				_df_out.index.name = 'Time'
-				# Y : state
-				# col : 5 RH
-				_df_st = _df_grp.get_group('Y')
-				_df_out['RH'] = _df_st[5].values
-				_df_out['status'] = _df_st[9].values
-				_df_out.mask(_df_out['status'] != 0)  # 0000 -> numeric to 0
-				return _df_out[['B', 'G', 'R', 'BB', 'BG', 'BR', 'RH']]
-			except ValueError:
-				group_sizes = _df_grp.size()
-				print(group_sizes)
-				# Define the valid groups
-				valid_groups = {'B', 'G', 'R', 'D', 'T', 'Y', 'Z'}
-				# Find the rows where the value in the first column is not in valid_groups
-				invalid_indices = _df[~_df[0].isin(valid_groups)].index
-				# Print the invalid indices and their corresponding values
-				invalid_values = _df.loc[invalid_indices, 0]
-				print("Invalid values and their indices:")
-				for idx, value in zip(invalid_indices, invalid_values):
-					print(f"Index: {idx}, Value: {value}")
-				# If there's a length mismatch, return an empty DataFrame with the same index and column names
-				columns = ['B', 'G', 'R', 'BB', 'BG', 'BR', 'RH']
-				_df_out = DataFrame(index=_idx_tm, columns=columns)
-				_df_out.index.name = 'Time'
-				print(f'\n\t\t\t Length mismatch in {_file} data. Returning an empty DataFrame.')
-				return _df_out
-	# QC data
-	def _QC(self, _df):
-		# remove negative value
-		_df = _df.mask((_df <= 0).copy())
-		# call by _QC function
-		# QC data in 1 hr
-		def _QC_func(_df_1hr):
-			_df_ave = _df_1hr.mean()
-			_df_std = _df_1hr.std()
-			_df_lowb, _df_highb = _df_1hr < (_df_ave - _df_std * 1.5), _df_1hr > (_df_ave + _df_std * 1.5)
-			return _df_1hr.mask(_df_lowb | _df_highb).copy()
-		return _df.resample('1h', group_keys=False).apply(_QC_func)
+    nam = 'NEPH'
+    def _raw_reader(self, _file):
+        with _file.open('r', encoding='utf-8', errors='ignore') as f:
+            _df = read_csv(f, header=None, names=range(11))
+            _df_grp = _df.groupby(0)
+            # T : time
+            _df_tm = _df_grp.get_group('T')[[1, 2, 3, 4, 5, 6]].astype(int)
+            for _k in [2, 3, 4, 5, 6]:
+                _df_tm[_k] = _df_tm[_k].astype(int).map('{:02d}'.format).copy()
+            _df_tm = _df_tm.astype(str)
+            _idx_tm = to_datetime((_df_tm[1] + _df_tm[2] + _df_tm[3] + _df_tm[4] + _df_tm[5] + _df_tm[6]),
+                                  format='%Y%m%d%H%M%S')
+            # D : data
+            # col : 3~8 B G R BB BG BR
+            # 1e6
+            try:
+                _df_dt = _df_grp.get_group('D')[[1, 2, 3, 4, 5, 6, 7, 8]].set_index(_idx_tm)
+                _df_out = (_df_dt.groupby(1).get_group('NBXX')[[3, 4, 5, 6, 7, 8]] * 1e6).reindex(_idx_tm)
+                _df_out.columns = ['B', 'G', 'R', 'BB', 'BG', 'BR']
+                _df_out.index.name = 'Time'
+                # Y : state
+                # col : 5 RH
+                _df_st = _df_grp.get_group('Y')
+                _df_out['RH'] = _df_st[5].values
+                _df_out['status'] = _df_st[9].values
+                _df_out.mask(_df_out['status'] != 0)  # 0000 -> numeric to 0
+                return _df_out[['B', 'G', 'R', 'BB', 'BG', 'BR', 'RH']]
+            except ValueError:
+                group_sizes = _df_grp.size()
+                print(group_sizes)
+                # Define the valid groups
+                valid_groups = {'B', 'G', 'R', 'D', 'T', 'Y', 'Z'}
+                # Find the rows where the value in the first column is not in valid_groups
+                invalid_indices = _df[~_df[0].isin(valid_groups)].index
+                # Print the invalid indices and their corresponding values
+                invalid_values = _df.loc[invalid_indices, 0]
+                print("Invalid values and their indices:")
+                for idx, value in zip(invalid_indices, invalid_values):
+                    print(f"Index: {idx}, Value: {value}")
+                # If there's a length mismatch, return an empty DataFrame with the same index and column names
+                columns = ['B', 'G', 'R', 'BB', 'BG', 'BR', 'RH']
+                _df_out = DataFrame(index=_idx_tm, columns=columns)
+                _df_out.index.name = 'Time'
+                print(f'\n\t\t\t Length mismatch in {_file} data. Returning an empty DataFrame.')
+                return _df_out
+    # QC data
+    def _QC(self, _df):
+        # remove negative value
+        _df = _df.mask((_df <= 0).copy())
+        # call by _QC function
+        # QC data in 1 hr
+        def _QC_func(_df_1hr):
+            _df_ave = _df_1hr.mean()
+            _df_std = _df_1hr.std()
+            _df_lowb, _df_highb = _df_1hr < (_df_ave - _df_std * 1.5), _df_1hr > (_df_ave + _df_std * 1.5)
+            return _df_1hr.mask(_df_lowb | _df_highb).copy()
+        return _df.resample('1h', group_keys=False).apply(_QC_func)

AeroViz/rawDataReader/script/OCEC_LCRES.py CHANGED Viewed

@@ -4,31 +4,31 @@ from AeroViz.rawDataReader.core import AbstractReader
 class Reader(AbstractReader):
-	nam = 'OCEC_LCRES'
+    nam = 'OCEC_LCRES'
-	def _raw_reader(self, _file):
-		with open(_file, 'r', encoding='utf-8', errors='ignore') as f:
-			_df = read_csv(f, skiprows=3)
+    def _raw_reader(self, _file):
+        with open(_file, 'r', encoding='utf-8', errors='ignore') as f:
+            _df = read_csv(f, skiprows=3)
-			_col = {'Thermal/Optical OC (ugC/LCm^3)': 'Thermal_OC',
-					'Thermal/Optical EC (ugC/LCm^3)': 'Thermal_EC',
-					'OC=TC-BC (ugC/LCm^3)': 'Optical_OC',
-					'BC (ugC/LCm^3)': 'Optical_EC',
-					'Sample Volume Local Condition Actual m^3': 'Sample_Volume',
-					'TC (ugC/LCm^3)': 'TC', }
+            _col = {'Thermal/Optical OC (ugC/LCm^3)': 'Thermal_OC',
+                    'Thermal/Optical EC (ugC/LCm^3)': 'Thermal_EC',
+                    'OC=TC-BC (ugC/LCm^3)': 'Optical_OC',
+                    'BC (ugC/LCm^3)': 'Optical_EC',
+                    'Sample Volume Local Condition Actual m^3': 'Sample_Volume',
+                    'TC (ugC/LCm^3)': 'TC', }
-			_tm_idx = to_datetime(_df['Start Date/Time'], errors='coerce')
-			_df['time'] = _tm_idx
+            _tm_idx = to_datetime(_df['Start Date/Time'], errors='coerce')
+            _df['time'] = _tm_idx
-			_df = _df.dropna(subset='time').loc[~_tm_idx.duplicated()].set_index('time')
+            _df = _df.dropna(subset='time').loc[~_tm_idx.duplicated()].set_index('time')
-		return _df[_col.keys()].rename(columns=_col)
+        return _df[_col.keys()].rename(columns=_col)
-	## QC data
-	def _QC(self, _df):
-		_df[['Thermal_OC', 'Optical_OC']] = _df[['Thermal_OC', 'Optical_OC']].where(
-			_df[['Thermal_OC', 'Optical_OC']] > 0.3).copy()
-		_df[['Thermal_EC', 'Optical_EC']] = _df[['Thermal_EC', 'Optical_EC']].where(
-			_df[['Thermal_EC', 'Optical_EC']] > .015).copy()
+    ## QC data
+    def _QC(self, _df):
+        _df[['Thermal_OC', 'Optical_OC']] = _df[['Thermal_OC', 'Optical_OC']].where(
+            _df[['Thermal_OC', 'Optical_OC']] > 0.3).copy()
+        _df[['Thermal_EC', 'Optical_EC']] = _df[['Thermal_EC', 'Optical_EC']].where(
+            _df[['Thermal_EC', 'Optical_EC']] > .015).copy()
-		return _df
+        return _df

AeroViz/rawDataReader/script/OCEC_RES.py CHANGED Viewed

@@ -4,25 +4,25 @@ from AeroViz.rawDataReader.core import AbstractReader
 class Reader(AbstractReader):
-	nam = 'OCEC_RES'
+    nam = 'OCEC_RES'
-	def _raw_reader(self, _file):
-		with open(_file, 'r', encoding='utf-8', errors='ignore') as f:
-			_df = read_csv(f, skiprows=3)
+    def _raw_reader(self, _file):
+        with open(_file, 'r', encoding='utf-8', errors='ignore') as f:
+            _df = read_csv(f, skiprows=3)
-			_col = {'OCPk1-ug C': 'OC1',
-					'OCPk2-ug C': 'OC2',
-					'OCPk3-ug C': 'OC3',
-					'OCPk4-ug C': 'OC4',
-					'Pyrolized C ug': 'PC', }
+            _col = {'OCPk1-ug C': 'OC1',
+                    'OCPk2-ug C': 'OC2',
+                    'OCPk3-ug C': 'OC3',
+                    'OCPk4-ug C': 'OC4',
+                    'Pyrolized C ug': 'PC', }
-			_tm_idx = to_datetime(_df['Start Date/Time'], errors='coerce')
-			_df['time'] = _tm_idx
+            _tm_idx = to_datetime(_df['Start Date/Time'], errors='coerce')
+            _df['time'] = _tm_idx
-			_df = _df.dropna(subset='time').loc[~_tm_idx.duplicated()].set_index('time')
+            _df = _df.dropna(subset='time').loc[~_tm_idx.duplicated()].set_index('time')
-		return _df[_col.keys()].rename(columns=_col)
+        return _df[_col.keys()].rename(columns=_col)
-	## QC data
-	def _QC(self, _df):
-		return _df.where(_df > 0)
+    ## QC data
+    def _QC(self, _df):
+        return _df.where(_df > 0)

AeroViz/rawDataReader/script/SMPS_TH.py CHANGED Viewed

@@ -4,38 +4,38 @@ from AeroViz.rawDataReader.core import AbstractReader
 class Reader(AbstractReader):
-	nam = 'SMPS_TH'
+    nam = 'SMPS_TH'
-	def _raw_reader(self, _file):
-		with open(_file, 'r', encoding='utf-8', errors='ignore') as f:
-			_df = read_table(f, skiprows=18, parse_dates={'Time': ['Date', 'Start Time']}).set_index('Time')
-			_key = list(_df.keys()[6:-26])
+    def _raw_reader(self, _file):
+        with open(_file, 'r', encoding='utf-8', errors='ignore') as f:
+            _df = read_table(f, skiprows=18, parse_dates={'Time': ['Date', 'Start Time']}).set_index('Time')
+            _key = list(_df.keys()[6:-26])
-			_newkey = {}
-			for _k in _key:
-				_newkey[_k] = float(_k).__round__(4)
+            _newkey = {}
+            for _k in _key:
+                _newkey[_k] = float(_k).__round__(4)
-			# _newkey['Total Conc.(#/cm)'] = 'total'
-			# _newkey['Mode(nm)']	= 'mode'
+            # _newkey['Total Conc.(#/cm)'] = 'total'
+            # _newkey['Mode(nm)']	= 'mode'
-			_df_idx = to_datetime(_df.index, errors='coerce')
-		return _df[_newkey.keys()].rename(_newkey, axis=1).set_index(_df_idx).loc[_df_idx.dropna()]
+            _df_idx = to_datetime(_df.index, errors='coerce')
+        return _df[_newkey.keys()].rename(_newkey, axis=1).set_index(_df_idx).loc[_df_idx.dropna()]
-	## QC data
-	def _QC(self, _df):
-		import numpy as n
+    ## QC data
+    def _QC(self, _df):
+        import numpy as n
-		## mask out the data size lower than 7
-		_df['total'] = _df.sum(axis=1, min_count=1) * (n.diff(n.log(_df.keys().to_numpy(float)))).mean()
-		_df_size = _df['total'].dropna().resample('1h').size().resample(_df.index.freq).ffill()
-		_df = _df.mask(_df_size < 7)
+        ## mask out the data size lower than 7
+        _df['total'] = _df.sum(axis=1, min_count=1) * (n.diff(n.log(_df.keys().to_numpy(float)))).mean()
+        _df_size = _df['total'].dropna().resample('1h').size().resample(_df.index.freq).ffill()
+        _df = _df.mask(_df_size < 7)
-		## remove total conc. lower than 2000
-		_df = _df.mask(_df['total'] < 2000)
+        ## remove total conc. lower than 2000
+        _df = _df.mask(_df['total'] < 2000)
-		## remove the bin over 400 nm which num. conc. larger than 4000
-		_df_remv_ky = _df.keys()[:-2][_df.keys()[:-2] >= 400.]
+        ## remove the bin over 400 nm which num. conc. larger than 4000
+        _df_remv_ky = _df.keys()[:-2][_df.keys()[:-2] >= 400.]
-		_df[_df_remv_ky] = _df[_df_remv_ky].copy().mask(_df[_df_remv_ky] > 4000.)
+        _df[_df_remv_ky] = _df[_df_remv_ky].copy().mask(_df[_df_remv_ky] > 4000.)
-		return _df[_df.keys()[:-1]]
+        return _df[_df.keys()[:-1]]

AeroViz/rawDataReader/script/SMPS_aim11.py CHANGED Viewed

@@ -4,48 +4,48 @@ from AeroViz.rawDataReader.core import AbstractReader
 class Reader(AbstractReader):
-	nam = 'SMPS_aim11'
+    nam = 'SMPS_aim11'
-	def _raw_reader(self, _file):
-		with open(_file, 'r', encoding='utf-8', errors='ignore') as f:
+    def _raw_reader(self, _file):
+        with open(_file, 'r', encoding='utf-8', errors='ignore') as f:
-			skiprows = 0
-			for _line in f:
+            skiprows = 0
+            for _line in f:
-				if _line.split(',')[0] == 'Scan Number':
-					f.seek(0)
-					break
+                if _line.split(',')[0] == 'Scan Number':
+                    f.seek(0)
+                    break
-				skiprows += 1
-			# breakpoint()
-			_df = read_csv(f, skiprows=skiprows)
-			_tm_idx = to_datetime(_df['DateTime Sample Start'], format='%d/%m/%Y %X', errors='coerce')
+                skiprows += 1
+            # breakpoint()
+            _df = read_csv(f, skiprows=skiprows)
+            _tm_idx = to_datetime(_df['DateTime Sample Start'], format='%d/%m/%Y %X', errors='coerce')
-			## index
-			_df = _df.set_index(_tm_idx).loc[_tm_idx.dropna()]
+            ## index
+            _df = _df.set_index(_tm_idx).loc[_tm_idx.dropna()]
-			## keys
-			_key = to_numeric(_df.keys(), errors='coerce')
-			_df.columns = _key
-			_df = _df.loc[:, ~_key.isna()]
+            ## keys
+            _key = to_numeric(_df.keys(), errors='coerce')
+            _df.columns = _key
+            _df = _df.loc[:, ~_key.isna()]
-		return _df.apply(to_numeric, errors='coerce')
+        return _df.apply(to_numeric, errors='coerce')
-	## QC data
-	def _QC(self, _df):
-		import numpy as n
+    ## QC data
+    def _QC(self, _df):
+        import numpy as n
-		## mask out the data size lower than 7
-		_df['total'] = _df.sum(axis=1, min_count=1) * (n.diff(n.log(_df.keys().to_numpy(float)))).mean()
-		_df_size = _df['total'].dropna().resample('1h').size().resample(_df.index.freq).ffill()
-		_df = _df.mask(_df_size < 7)
+        ## mask out the data size lower than 7
+        _df['total'] = _df.sum(axis=1, min_count=1) * (n.diff(n.log(_df.keys().to_numpy(float)))).mean()
+        _df_size = _df['total'].dropna().resample('1h').size().resample(_df.index.freq).ffill()
+        _df = _df.mask(_df_size < 7)
-		## remove total conc. lower than 2000
-		_df = _df.mask(_df['total'] < 2000)
+        ## remove total conc. lower than 2000
+        _df = _df.mask(_df['total'] < 2000)
-		## remove the bin over 400 nm which num. conc. larger than 4000
-		_df_remv_ky = _df.keys()[:-2][_df.keys()[:-2] >= 400.]
+        ## remove the bin over 400 nm which num. conc. larger than 4000
+        _df_remv_ky = _df.keys()[:-2][_df.keys()[:-2] >= 400.]
-		_df[_df_remv_ky] = _df[_df_remv_ky].copy().mask(_df[_df_remv_ky] > 4000.)
+        _df[_df_remv_ky] = _df[_df_remv_ky].copy().mask(_df[_df_remv_ky] > 4000.)
-		return _df[_df.keys()[:-1]]
+        return _df[_df.keys()[:-1]]

AeroViz 0.1.2__py3-none-any.whl → 0.1.3b0__py3-none-any.whl

Potentially problematic release.

AeroViz 0.1.2__py3-none-any.whl → 0.1.3b0__py3-none-any.whl