From 45c414164a093f2307f959a9a5c97d2d5dfa3944 Mon Sep 17 00:00:00 2001 From: Callum Rollo Date: Tue, 6 Aug 2024 13:51:29 +0200 Subject: [PATCH 1/3] move to stable polars, pin numpy below 2 --- environment.yml | 4 ++-- requirements.txt | 4 ++-- tests/environment.yml | 4 ++-- 3 files changed, 6 insertions(+), 6 deletions(-) diff --git a/environment.yml b/environment.yml index 4c73e6a..71a83e0 100644 --- a/environment.yml +++ b/environment.yml @@ -3,15 +3,15 @@ channels: - conda-forge dependencies: - python>=3.10 - - numpy + - numpy<2 - pip - xarray - dask - netcdf4 - gsw + - polars>=1.1 - scipy - bitstring - pooch - pip: - dbdreader - - polars diff --git a/requirements.txt b/requirements.txt index a15c091..e095c25 100644 --- a/requirements.txt +++ b/requirements.txt @@ -3,8 +3,8 @@ dbdreader dask gsw netcdf4 -numpy +numpy<2 pooch scipy xarray -polars>0.16 +polars>=1.1 diff --git a/tests/environment.yml b/tests/environment.yml index c80a469..53fe0b7 100644 --- a/tests/environment.yml +++ b/tests/environment.yml @@ -3,7 +3,7 @@ channels: - conda-forge dependencies: - python>=3.9 - - numpy + - numpy<2 - pip - xarray - dask @@ -11,6 +11,7 @@ dependencies: - gsw - scipy - bitstring + - polars>=1.1 - pytest - pytest-cov - pooch @@ -19,4 +20,3 @@ dependencies: - cc-plugin-glider - pip: - dbdreader - - polars From 26e2b1fbea21f4f1b77a2ee2c34b855187a7e7f4 Mon Sep 17 00:00:00 2001 From: Callum Rollo Date: Tue, 6 Aug 2024 13:56:40 +0200 Subject: [PATCH 2/3] github expand test matrix and refresh cache --- .github/workflows/tests.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 23cabab..fe3785c 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -7,7 +7,7 @@ jobs: strategy: matrix: os: ["ubuntu-latest"] - python-version: ["3.9", "3.10"] + python-version: ["3.9", "3.10", "3.11", "3.12"] steps: - uses: actions/checkout@v2 - name: Cache conda @@ -25,7 +25,7 @@ jobs: 
environment-file: tests/environment.yml python-version: ${{ matrix.python-version }} channel-priority: strict - use-only-tar-bz2: true # IMPORTANT: This needs to be set for caching to work properly! + use-only-tar-bz2: false # NOTE: must be true for conda package caching to work properly; false permits .conda-format packages - name: Conda info shell: bash -l {0} run: conda info; conda list @@ -45,4 +45,4 @@ jobs: shell: bash -l {0} run: which python; pytest --cov --cov-report xml - name: Upload coverage to Codecov - uses: codecov/codecov-action@v3 \ No newline at end of file + uses: codecov/codecov-action@v3 From 085b54f4ae23c15156004e6657005e86424f2f99 Mon Sep 17 00:00:00 2001 From: Callum Rollo Date: Tue, 6 Aug 2024 15:00:51 +0200 Subject: [PATCH 3/3] REF: np.NaN >> np.nan. unpin numpy --- environment.yml | 2 +- pyglider/ncprocess.py | 16 ++++++++-------- pyglider/slocum.py | 30 +++++++++++++++--------------- pyglider/utils.py | 6 +++--- requirements.txt | 2 +- tests/environment.yml | 2 +- 6 files changed, 29 insertions(+), 29 deletions(-) diff --git a/environment.yml b/environment.yml index 71a83e0..31db1a8 100644 --- a/environment.yml +++ b/environment.yml @@ -3,7 +3,7 @@ channels: - conda-forge dependencies: - python>=3.10 - - numpy<2 + - numpy - pip - xarray - dask diff --git a/pyglider/ncprocess.py b/pyglider/ncprocess.py index 55331fc..347212b 100644 --- a/pyglider/ncprocess.py +++ b/pyglider/ncprocess.py @@ -70,14 +70,14 @@ def extract_timeseries_profiles(inname, outdir, deploymentyaml, force=False): dss['v'] = dss.water_velocity_northward.mean() dss['v'].attrs = profile_meta['v'] elif 'u' in profile_meta: - dss['u'] = profile_meta['u'].get('_FillValue', np.NaN) + dss['u'] = profile_meta['u'].get('_FillValue', np.nan) dss['u'].attrs = profile_meta['u'] - dss['v'] = profile_meta['v'].get('_FillValue', np.NaN) + dss['v'] = profile_meta['v'].get('_FillValue', np.nan) dss['v'].attrs = profile_meta['v'] else: - dss['u'] = np.NaN - dss['v'] = np.NaN + dss['u'] = np.nan + dss['v'] = np.nan 
dss['profile_id'] = np.int32(p) @@ -117,11 +117,11 @@ def extract_timeseries_profiles(inname, outdir, deploymentyaml, force=False): dss['platform'].attrs['_FillValue'] = -1 - dss['lat_uv'] = np.NaN + dss['lat_uv'] = np.nan dss['lat_uv'].attrs = profile_meta['lat_uv'] - dss['lon_uv'] = np.NaN + dss['lon_uv'] = np.nan dss['lon_uv'].attrs = profile_meta['lon_uv'] - dss['time_uv'] = np.NaN + dss['time_uv'] = np.nan dss['time_uv'].attrs = profile_meta['time_uv'] dss['instrument_ctd'] = np.int32(1.0) @@ -328,7 +328,7 @@ def make_gridfiles(inname, outdir, deploymentyaml, *, fnamesuffix='', dz=1, star dsout.to_netcdf( outname, encoding={'time': {'units': 'seconds since 1970-01-01T00:00:00Z', - '_FillValue': np.NaN, + '_FillValue': np.nan, 'calendar': 'gregorian', 'dtype': 'float64'}}) _log.info('Done gridding') diff --git a/pyglider/slocum.py b/pyglider/slocum.py index a037288..f8fb947 100644 --- a/pyglider/slocum.py +++ b/pyglider/slocum.py @@ -345,8 +345,8 @@ def dbd_to_dict(dinkum_file, cachedir, keys=None): _log.debug('Diagnostic check passed. Endian is %s', endian) nsensors = int(meta['sensors_per_cycle']) - currentValues = np.zeros(int(meta['sensors_per_cycle'])) + np.NaN - data = np.zeros((DINKUMCHUNKSIZE, nsensors)) + np.NaN + currentValues = np.zeros(int(meta['sensors_per_cycle'])) + np.nan + data = np.zeros((DINKUMCHUNKSIZE, nsensors)) + np.nan # Then there's a data cycle with every sensor marked as updated, giving # us our initial values. # 01 means updated with 'same value', 10 means updated with a new value, @@ -370,7 +370,7 @@ def dbd_to_dict(dinkum_file, cachedir, keys=None): binaryData.bytealign() for i, code in enumerate(updatedCode): if code == '00': # No new value - currentValues[i] = np.NaN + currentValues[i] = np.nan elif code == '01': # Same value as before. continue elif code == '10': # New value. @@ -404,7 +404,7 @@ def dbd_to_dict(dinkum_file, cachedir, keys=None): if ndata % DINKUMCHUNKSIZE == 0: # need to allocate more data! 
data = np.concatenate( - (data, np.NaN + np.zeros((DINKUMCHUNKSIZE, nsensors))), + (data, np.nan + np.zeros((DINKUMCHUNKSIZE, nsensors))), axis=0) elif d == 'X': # End of file cycle tag. We made it through. @@ -496,7 +496,7 @@ def add_times_flight_sci(fdata, sdata=None): sdata['m_present_time_sci'] = np.interp( sdata['sci_m_present_time'], tf, pt, np.nan, np.nan) else: - sdata['m_present_time_sci'] = np.NaN * sdata['sci_m_present_time'] + sdata['m_present_time_sci'] = np.nan * sdata['sci_m_present_time'] return fdata, sdata @@ -731,7 +731,7 @@ def raw_to_timeseries(indir, outdir, deploymentyaml, *, _log.debug('EBD sensorname %s', sensorname) val = ebd[sensorname] val = utils._zero_screen(val) - # val[val==0] = np.NaN + # val[val==0] = np.nan val = convert(val) else: _log.debug('DBD sensorname %s', sensorname) @@ -922,7 +922,7 @@ def binary_to_timeseries(indir, cachedir, outdir, deploymentyaml, *, ds = utils.get_derived_eos_raw(ds) # screen out-of-range times; these won't convert: - ds['time'] = ds.time.where((ds.time>0) & (ds.time<6.4e9), np.NaN) + ds['time'] = ds.time.where((ds.time>0) & (ds.time<6.4e9), np.nan) # convert time to datetime64: ds['time'] = (ds.time*1e9).astype('datetime64[ns]') ds['time'].attrs = attr @@ -954,7 +954,7 @@ def binary_to_timeseries(indir, cachedir, outdir, deploymentyaml, *, # as a unit: ds.to_netcdf(outname, 'w', encoding={'time': {'units': 'seconds since 1970-01-01T00:00:00Z', - '_FillValue': np.NaN, + '_FillValue': np.nan, 'dtype': 'float64'}}) return outname @@ -1076,9 +1076,9 @@ def parse_logfiles(files): # now parse them out = xr.Dataset( coords={'time': ('surfacing', np.zeros(ntimes, dtype='datetime64[ns]'))}) - out['ampH'] = ('surfacing', np.zeros(ntimes) * np.NaN) - out['lon'] = ('surfacing', np.zeros(ntimes) * np.NaN) - out['lat'] = ('surfacing', np.zeros(ntimes) * np.NaN) + out['ampH'] = ('surfacing', np.zeros(ntimes) * np.nan) + out['lon'] = ('surfacing', np.zeros(ntimes) * np.nan) + out['lat'] = ('surfacing', 
np.zeros(ntimes) * np.nan) for i in range(ntimes): timestring = times[i][11:-13] @@ -1151,10 +1151,10 @@ def parse_logfiles_maybe(files): # now parse them out = xr.Dataset(coords={'time': ('surfacing', np.zeros(ntimes, dtype='datetime64[ns]'))}) - out['ampH'] = ('surfacing', np.zeros(ntimes) * np.NaN) - out['lon'] = ('surfacing', np.zeros(ntimes) * np.NaN) - out['lat'] = ('surfacing', np.zeros(ntimes) * np.NaN) - out['missionnum'] = ('surfacing', np.zeros(ntimes) * np.NaN) + out['ampH'] = ('surfacing', np.zeros(ntimes) * np.nan) + out['lon'] = ('surfacing', np.zeros(ntimes) * np.nan) + out['lat'] = ('surfacing', np.zeros(ntimes) * np.nan) + out['missionnum'] = ('surfacing', np.zeros(ntimes) * np.nan) out.attrs['surfacereason'] = surfacereason # ABORT HISTORY: last abort segment: hal_1002-2024-183-0-0 (0171.0000) out.attrs['abortsegment'] = float(abortsegment[-11:-2]) diff --git a/pyglider/utils.py b/pyglider/utils.py index aa64efe..f838efb 100644 --- a/pyglider/utils.py +++ b/pyglider/utils.py @@ -92,8 +92,8 @@ def get_profiles(ds, min_dp=10.0, inversion=3., filt_length=7, make two variables: profile_direction and profile_index; this version is good for lots of data. 
Less good for sparse data """ - profile = ds.pressure.values * np.NaN - direction = ds.pressure.values * np.NaN + profile = ds.pressure.values * np.nan + direction = ds.pressure.values * np.nan pronum = 1 lastpronum = 0 @@ -500,7 +500,7 @@ def fill_metadata(ds, metadata, sensor_data): def _zero_screen(val): - val[val == 0] = np.NaN + val[val == 0] = np.nan return val diff --git a/requirements.txt b/requirements.txt index e095c25..a46e8ae 100644 --- a/requirements.txt +++ b/requirements.txt @@ -3,7 +3,7 @@ dbdreader dask gsw netcdf4 -numpy<2 +numpy pooch scipy xarray diff --git a/tests/environment.yml b/tests/environment.yml index 53fe0b7..c3e117b 100644 --- a/tests/environment.yml +++ b/tests/environment.yml @@ -3,7 +3,7 @@ channels: - conda-forge dependencies: - python>=3.9 - - numpy<2 + - numpy - pip - xarray - dask